Junghwa Lee
committed on
Commit
·
467f40d
1
Parent(s):
db57d2c
Add redpajama-3b instruct model weights
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- mlc-chat-config.json +41 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
mlc-chat-config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_neox",
|
3 |
+
"quantization": "q4f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"use_parallel_residual": false,
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 10240,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"layer_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 50432,
|
12 |
+
"rotary_pct": 1.0,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"context_window_size": 2048,
|
15 |
+
"head_dim": 80,
|
16 |
+
"prefill_chunk_size": 2048,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"ffn_out_dtype": "float32"
|
19 |
+
},
|
20 |
+
"vocab_size": 50432,
|
21 |
+
"context_window_size": 2048,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"mean_gen_len": 128,
|
27 |
+
"max_gen_len": 512,
|
28 |
+
"shift_fill_factor": 0.3,
|
29 |
+
"temperature": 0.7,
|
30 |
+
"repetition_penalty": 1.0,
|
31 |
+
"top_p": 0.95,
|
32 |
+
"conv_template": "redpajama_chat",
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"bos_token_id": 0,
|
35 |
+
"eos_token_id": 0,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"version": "0.1.0"
|
41 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:395c376368812d96572e8b38c8cd36b9b90a93d602e1f631abf3b51894aed018
|
3 |
+
size 64552960
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8836f35e0fb2cf2c7a00edb04dde8aaae5c65c7073fdd7508a6a42e64ac9bdd1
|
3 |
+
size 22855680
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bd3ed82df33b6cc95b5bd7ba3a859c9deaa2f1b1533bc402ece3b286ce7433d
|
3 |
+
size 29537280
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f326398c57657b154dd9c972b52880cb7ec336e3917abf5f1e3a6244ff722304
|
3 |
+
size 29537280
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6065a96a418a09af296c12b1059255c3d97d2bbe92f70765f23750596d6c3e9a
|
3 |
+
size 29532160
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fc121058abdb9ad6196de358b6d23c4040da978a343c82fa619da4bbe72726d
|
3 |
+
size 29537280
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee25024156cd62a5ae10c7b4bbc465878c5efe65bd63870780969cd87898e7b2
|
3 |
+
size 29537280
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a13bb0aff4556d39f45d8bfbcbbe03eac4f68d86bea1fbd537dba0c67662ea6f
|
3 |
+
size 29532160
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5634c7f45d1334ef1727b2d764fab65a84685a25f3ce5373fa6ee6138d3fa59c
|
3 |
+
size 29537280
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7b81f1d09228bf71629e2c3900dab614f183109c5dcb28d0f32345f906ce93b
|
3 |
+
size 29537280
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d435ba9a92c1b2a51a9d62bbc95fc9b0e740306213f80d687cbb5bd12abc8227
|
3 |
+
size 29532160
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdd1301b6afbd2024b5e38f0ab40a5f3a97f203f289158b1cba158d44e304c59
|
3 |
+
size 29537280
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03f36b98e93c785b9f955ad3dec7a22f0ff44ba0955d5444afcbd78a1ea5723e
|
3 |
+
size 29537280
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1e3bcce856cc643aec17625755f41655bcabef3feac3dc0cdba402fef23d0ad
|
3 |
+
size 29537280
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6c2b06d02b2930eb63da020efaa0de8eb9017d10dbeac272f51e60896f102ca
|
3 |
+
size 29532160
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afe608ebf3261ac3af3ae2b72a19784f458be8742f38c1ab7bdacc8a6f8c2a32
|
3 |
+
size 29537280
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53f21e4de88c85e607d98e66d876f06cf3ead97cdcdb79b6a6b81f80bac03e35
|
3 |
+
size 29537280
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e00ca077724c83a38c2fa4c1392d11969b7b4596254607942888e62137f13b16
|
3 |
+
size 29532160
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:608f5de7d3f9d0ba91d6ffbf33493d06f86fe19bc886826f41580fe5d44066ae
|
3 |
+
size 29537280
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:159b85c3025857edeb7c390bc65763bc61ec705ba912efc061b4b8c362391c71
|
3 |
+
size 29537280
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f27aabfa180af3feac5d6512eda81cb58c09b9a2ddfbe1a37a218a4b39f844c
|
3 |
+
size 29532160
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe48b2a8bfdbb37e511fc25bbd26d67beeb1923e0aaed8cafc00fba25356484a
|
3 |
+
size 29537280
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e79a8197a70d4c9ac5792bc87a0f968e73f4306015876ded827316a61fe0e88
|
3 |
+
size 29537280
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2075e09491fb4e01e0281e5bac65bc552f27b2133fa796f93e352c783a4202d
|
3 |
+
size 29532160
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6d8ee477de5036da20596d93893e6d8885058949f45e028465ac99a271a5ca3
|
3 |
+
size 29532160
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:254ad29630dfde91b16ead6aa1b1e5a991d3229af3b0f9f342030267c7526f8c
|
3 |
+
size 29537280
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e63e53f35347e476332092402a2229d06f351f8742b93b244e038f27e7141c70
|
3 |
+
size 29537280
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4b93ee664fbd7925b9c640e5db60f99010a951ed6fe8d6197869d1a5a05af3b
|
3 |
+
size 29532160
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec3f2d229495b28f6162140ebd70910a09640e92c8a83335365c41ca16bf9418
|
3 |
+
size 29537280
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af537de1cc74bf451e47f25e82f218f5a8f0ef09265daa3246cdced9bd793fee
|
3 |
+
size 29537280
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da99b5efde1bb8e2facc67011e8404b4559bfb7d98d552be70ed84582830e6d0
|
3 |
+
size 29532160
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5f5f27a183e97670d2f75ef3a944d0b50f8c6a77474340a2aca14189f4de545
|
3 |
+
size 29537280
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e137e6a8a53467745eea4aaa3d5eabcbd777493b934db870a5515492114d610a
|
3 |
+
size 29537280
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad82980e67d9a46b796210c217b3c2e87843b8bf81ece18b31c97f3a48b144c6
|
3 |
+
size 29532160
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41abe0eaccfce065cf7649e0c0f03ff1e90f11e749f5ecc56201753a00f72b1e
|
3 |
+
size 29537280
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d40a5b1c174dc15e799483f25f30a4433d6d894138dd3c547670436df0eccb5c
|
3 |
+
size 29537280
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:722a75046e0875e81ff0704eff78bb264c288e74f26776a8ea60ed7907165e66
|
3 |
+
size 29537280
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48ce350036198ed0155dbc1834a755a81f5058bbe6d5515c703db093663ff20d
|
3 |
+
size 29532160
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e46282cb8bdbf02f16659610d5a0e91ee7c13bbf54815efc001f177a8b068199
|
3 |
+
size 29537280
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26f56b11cf42078d5911597cf0527ff492f0bf3527427dd205f63b4443a064a9
|
3 |
+
size 29537280
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e10a9cd191d5319a8b2728cc98e7f05230b543c9ad1d37958d7859d92123e529
|
3 |
+
size 29532160
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94a8ca5be62a1c3dc5ee69995272fd253044b03267b5e85adedb8940a0cfb8b5
|
3 |
+
size 29537280
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a7a0f1a1c7018277e67b0ed925a6e710535236caa09cd46e87b550064e1636d
|
3 |
+
size 29537280
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b83e7fcb76ae692c2ccde67da0b74c00bb3a5eef9d775cd033d7190958debc8
|
3 |
+
size 29532160
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf58ee34789f25de6cd18624bc03ecc66cf811e4794883253ed771439fae935d
|
3 |
+
size 64552960
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fe7659668cf993efc67a84e5a261e7fd626af595a732ea90f0967e7e9b45c7a
|
3 |
+
size 29537280
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e1c3655de1f8954e07a10dffcca8f9b2ed54e629363d6ac49601da967cc280c
|
3 |
+
size 22830080
|