Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- mlc-chat-config.json +78 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "cohere",
|
4 |
+
"quantization": "q4f16_1",
|
5 |
+
"model_config": {
|
6 |
+
"model_type": "cohere",
|
7 |
+
"hidden_size": 8192,
|
8 |
+
"vocab_size": 256000,
|
9 |
+
"num_hidden_layers": 40,
|
10 |
+
"num_attention_heads": 64,
|
11 |
+
"num_key_value_heads": 8,
|
12 |
+
"intermediate_size": 24576,
|
13 |
+
"layer_norm_eps": 1e-05,
|
14 |
+
"position_embedding_base": 4000000,
|
15 |
+
"context_window_size": 131072,
|
16 |
+
"prefill_chunk_size": 2048,
|
17 |
+
"head_dim": 128,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"max_batch_size": 80
|
20 |
+
},
|
21 |
+
"vocab_size": 256000,
|
22 |
+
"context_window_size": 131072,
|
23 |
+
"sliding_window_size": -1,
|
24 |
+
"prefill_chunk_size": 2048,
|
25 |
+
"attention_sink_size": -1,
|
26 |
+
"tensor_parallel_shards": 1,
|
27 |
+
"pipeline_parallel_stages": 1,
|
28 |
+
"temperature": 1.0,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 1.0,
|
33 |
+
"tokenizer_files": [
|
34 |
+
"tokenizer.json",
|
35 |
+
"tokenizer_config.json"
|
36 |
+
],
|
37 |
+
"tokenizer_info": {
|
38 |
+
"token_postproc_method": "byte_level",
|
39 |
+
"prepend_space_in_encode": false,
|
40 |
+
"strip_space_in_decode": false
|
41 |
+
},
|
42 |
+
"conv_template": {
|
43 |
+
"name": "aya-23",
|
44 |
+
"system_template": "<|START_OF_TURN_TOKEN|><|SYSTEM_TOKEN|>{system_message}<|END_OF_TURN_TOKEN|>",
|
45 |
+
"system_message": "You are Command-R, a brilliant, sophisticated, AI-assistant trained to assist human users by providing thorough responses.",
|
46 |
+
"system_prefix_token_ids": [
|
47 |
+
5
|
48 |
+
],
|
49 |
+
"add_role_after_system_message": true,
|
50 |
+
"roles": {
|
51 |
+
"user": "<|START_OF_TURN_TOKEN|><|USER_TOKEN|>",
|
52 |
+
"assistant": "<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
"<|END_OF_TURN_TOKEN|>"
|
62 |
+
],
|
63 |
+
"role_content_sep": "",
|
64 |
+
"role_empty_sep": "",
|
65 |
+
"stop_str": [
|
66 |
+
"<|END_OF_TURN_TOKEN|>"
|
67 |
+
],
|
68 |
+
"stop_token_ids": [
|
69 |
+
6,
|
70 |
+
255001
|
71 |
+
],
|
72 |
+
"function_string": "",
|
73 |
+
"use_function_calling": false
|
74 |
+
},
|
75 |
+
"pad_token_id": 0,
|
76 |
+
"bos_token_id": 5,
|
77 |
+
"eos_token_id": 255001
|
78 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9af90520f4a5b06e967ffd246f0c224a9cac05746703c1ee1def76bee2b498d
|
3 |
+
size 1048576000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f072fe96910774a3cb719c286b428d59424b6262501207eea30cba66e7d3060b
|
3 |
+
size 131072000
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5cc8575fb6fe6529f3481424ea8c669e61bf4ccc02181e08e8d861344c8f5be5
|
3 |
+
size 100663296
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f301d534331def8994c8beb9aab4233433fb4aec4791763d5ae1f823bbae774
|
3 |
+
size 41943040
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62d1639f118a938f071c2df18363f5b478f70a87953c429cb0bdb28946cba855
|
3 |
+
size 33554432
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53d86c25de2091a82b7a116aae8d879ae40b4c6f15f630d98d36a67918acc581
|
3 |
+
size 30408704
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:562d79aaf64398d855a62723b34f825346945e795bdb4270cdfde498ecbc161f
|
3 |
+
size 100663296
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:776febf12ae1adfe3492e1bce1f59c6c52eb8d3bb0c17d55fd5c711fd102aa69
|
3 |
+
size 100663296
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:773a28a75d74cf27ff5413cbe13c1b5f347a0090adab459ef273557a44a81e57
|
3 |
+
size 100663296
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ead38fb3b900349e8df9d15201375fa6449dc7eb069e5787b8bba7481623b97e
|
3 |
+
size 29376512
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68390637ae684bd3614fd79aa30c66cb852406d8bd39cae77bf7f7172b02f04c
|
3 |
+
size 41943040
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32738a4ed866836d76f80d23216cbcdb3c169a951ba80a7396f42a333f61bc0c
|
3 |
+
size 33554432
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f67f1430beb805deca44a5b2f580ad1b899cdd55005c66345008b1449fa1d807
|
3 |
+
size 100663296
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:024bad1bc25440d0902f51af2aa530c0a51e798c3d778b68cd38ce1a62787276
|
3 |
+
size 100663296
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8e095cad69728bd0c5db2777283fad0e40c58d4ad1b20e1af360d1296d760fc
|
3 |
+
size 22036480
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:724845c80938f509d88ceb114108dc936a397a038dff8bcf85fb1447aa036d29
|
3 |
+
size 100663296
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42b59ecbadeff1b53f42859950db53c6f4578d3ff47e75d217ca5c95d03aa2e1
|
3 |
+
size 100663296
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1731654893ef95e782bfd10cdaf34b5b035ab820516b52fa3239a781202ca867
|
3 |
+
size 25165824
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc35ffa5657bbfc1b173983ec66025487c4bb03f6f536034987322cb12294eb1
|
3 |
+
size 41943040
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdc4103fd287062df029109d54ef7a40c50fbbe667cdf9c99dbba49b9af5eec5
|
3 |
+
size 33554432
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3edc3e26144230785cfb794a4dc389761c4e275122b0c7a37a7fd091f6c8337
|
3 |
+
size 100663296
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aabe22f54942d1c805535559d6e7ba3b8a2095d0704d16f189a65a38c953381
|
3 |
+
size 22036480
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10937549c4f7bbc5443860ac14ac4b4c4f96f7bbe7b783c3991a16e8bf062721
|
3 |
+
size 100663296
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2773b9e86e9643eceddf148e0e9ceb190bad80534b390ecd5afa102a4ef730a2
|
3 |
+
size 100663296
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40c8f09d02c02575acaebb1c6df379dca05261040d46fedbf21d79374ee4dce6
|
3 |
+
size 25165824
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6d5bfc6835a2811769b15058a6beda4077c9b1232228109ae281c717ebe870e
|
3 |
+
size 25165824
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c81f081e8c692c2f636df07be41355a5cf9aaa919472872bb741f0871125aa8f
|
3 |
+
size 41943040
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6e4b8605ee2f5db8ab85ec244c0000df838fbc8a080b66da3f146af2fdc1c72d
|
3 |
+
size 33554432
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38e723cf3eeb9d236f587171f7cee67a2f9fd8f6fdef151173a698b313cfe1e7
|
3 |
+
size 100663296
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:856f32627e54eadc64a7fcd2bf4eb7687abee7fa61cb2791fe9999ccfa1c10af
|
3 |
+
size 22036480
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:939fbfdebdc27338d9d2cfa941943c1584f1733a8f40c2d1450547b0de47cb88
|
3 |
+
size 100663296
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a8fc326f48b8ee77f16434e0071db55e7ff515cee58b02213eee4fb9eafe5e4
|
3 |
+
size 100663296
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98908b2dcfe2713b7e15043c3da8ab8e7510782c7b99c994f0bc5dca68d039fe
|
3 |
+
size 25165824
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1ccc490e03a8b677145425f88f5616c534890ad3f481169910d7b0a0b4a6504
|
3 |
+
size 41943040
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9445c63fb0a4cdfad9ad47014cf3fbd711a68bc8f333734e3a2a10437f889d38
|
3 |
+
size 33554432
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e676226c16f4373a4c1b5a85f3687834401fb60f3c6a3ee6a75e35ebf7740ea
|
3 |
+
size 41943040
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5501d3a7511e92b7acb5d6007193ffc3975e3d7d44c1c4e60295c6be107a698a
|
3 |
+
size 100663296
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5c4a608d643e4b4091f4bf972ebce8e5d2338eb22a7b0072d17433e20ef4750
|
3 |
+
size 22036480
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:112dd3d1f55ee04340e09080464fecd9e32678bd5b6d800e48ece8321fccf832
|
3 |
+
size 100663296
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a0bcb210826282c0f7fa72935cdee346ce1c841ee1ad1b3e1c25bc3526f1251
|
3 |
+
size 100663296
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a4e51d4c2889294dd8f3c6e87683778839d3dcb3704f881f5adc001fd879e29
|
3 |
+
size 25165824
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f8cbf712f70018c13788c20f940687d5012d800dc5940c27884ab9a2256ee99
|
3 |
+
size 41943040
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e48b84ddfa54850e68cbfc5d4e3483e802d49bba207cc86b4ee8e215c30c6f8a
|
3 |
+
size 33554432
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49227e7dd8058b9104ad4324a51d6b929531c9e09bf866492a67e2b3ed028bf8
|
3 |
+
size 41943040
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:37200147e3e3ba20999807428ab2b1c8ad5531e1721846b46b7732e2f78b97bf
|
3 |
+
size 33554432
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b020cb7d79382ac701e03f0af3d654f5666e05f2011c3170269842d4385a0dde
|
3 |
+
size 100663296
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e2df686859515b5df672ea1e0142236978aed8720bcb865683fb5c112f54db8
|
3 |
+
size 33554432
|