Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +2 -1
- generation_config.json +1 -1
- pytorch_model-00001-of-00129.bin +3 -0
- pytorch_model-00002-of-00129.bin +3 -0
- pytorch_model-00003-of-00129.bin +3 -0
- pytorch_model-00004-of-00129.bin +3 -0
- pytorch_model-00005-of-00129.bin +3 -0
- pytorch_model-00006-of-00129.bin +3 -0
- pytorch_model-00007-of-00129.bin +3 -0
- pytorch_model-00008-of-00129.bin +3 -0
- pytorch_model-00009-of-00129.bin +3 -0
- pytorch_model-00010-of-00129.bin +3 -0
- pytorch_model-00011-of-00129.bin +3 -0
- pytorch_model-00012-of-00129.bin +3 -0
- pytorch_model-00013-of-00129.bin +3 -0
- pytorch_model-00014-of-00129.bin +3 -0
- pytorch_model-00015-of-00129.bin +3 -0
- pytorch_model-00016-of-00129.bin +3 -0
- pytorch_model-00017-of-00129.bin +3 -0
- pytorch_model-00018-of-00129.bin +3 -0
- pytorch_model-00019-of-00129.bin +3 -0
- pytorch_model-00020-of-00129.bin +3 -0
- pytorch_model-00021-of-00129.bin +3 -0
- pytorch_model-00022-of-00129.bin +3 -0
- pytorch_model-00023-of-00129.bin +3 -0
- pytorch_model-00024-of-00129.bin +3 -0
- pytorch_model-00025-of-00129.bin +3 -0
- pytorch_model-00026-of-00129.bin +3 -0
- pytorch_model-00027-of-00129.bin +3 -0
- pytorch_model-00028-of-00129.bin +3 -0
- pytorch_model-00029-of-00129.bin +3 -0
- pytorch_model-00030-of-00129.bin +3 -0
- pytorch_model-00031-of-00129.bin +3 -0
- pytorch_model-00032-of-00129.bin +3 -0
- pytorch_model-00033-of-00129.bin +3 -0
- pytorch_model-00034-of-00129.bin +3 -0
- pytorch_model-00035-of-00129.bin +3 -0
- pytorch_model-00036-of-00129.bin +3 -0
- pytorch_model-00037-of-00129.bin +3 -0
- pytorch_model-00038-of-00129.bin +3 -0
- pytorch_model-00039-of-00129.bin +3 -0
- pytorch_model-00040-of-00129.bin +3 -0
- pytorch_model-00041-of-00129.bin +3 -0
- pytorch_model-00042-of-00129.bin +3 -0
- pytorch_model-00043-of-00129.bin +3 -0
- pytorch_model-00044-of-00129.bin +3 -0
- pytorch_model-00045-of-00129.bin +3 -0
- pytorch_model-00046-of-00129.bin +3 -0
- pytorch_model-00047-of-00129.bin +3 -0
- pytorch_model-00048-of-00129.bin +3 -0
config.json
CHANGED
@@ -4,6 +4,7 @@
|
|
4 |
"architectures": [
|
5 |
"FSGPTMoEForCausalLM"
|
6 |
],
|
|
|
7 |
"attention_dropout": 0.1,
|
8 |
"attention_heads": 16,
|
9 |
"batch_prioritized_routing": false,
|
@@ -28,7 +29,7 @@
|
|
28 |
"pad_token_id": 50258,
|
29 |
"resid_dropout": 0.1,
|
30 |
"router_bias": false,
|
31 |
-
"router_dtype": "
|
32 |
"router_ignore_padding_tokens": true,
|
33 |
"second_expert_policy": "all",
|
34 |
"sparse_step": 2,
|
|
|
4 |
"architectures": [
|
5 |
"FSGPTMoEForCausalLM"
|
6 |
],
|
7 |
+
"model_type": "fairseq-moe",
|
8 |
"attention_dropout": 0.1,
|
9 |
"attention_heads": 16,
|
10 |
"batch_prioritized_routing": false,
|
|
|
29 |
"pad_token_id": 50258,
|
30 |
"resid_dropout": 0.1,
|
31 |
"router_bias": false,
|
32 |
+
"router_dtype": "bfloat16",
|
33 |
"router_ignore_padding_tokens": true,
|
34 |
"second_expert_policy": "all",
|
35 |
"sparse_step": 2,
|
generation_config.json
CHANGED
@@ -3,5 +3,5 @@
|
|
3 |
"bos_token_id": 50257,
|
4 |
"eos_token_id": 50259,
|
5 |
"pad_token_id": 50258,
|
6 |
-
"transformers_version": "4.
|
7 |
}
|
|
|
3 |
"bos_token_id": 50257,
|
4 |
"eos_token_id": 50259,
|
5 |
"pad_token_id": 50258,
|
6 |
+
"transformers_version": "4.35.2"
|
7 |
}
|
pytorch_model-00001-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86601ee8a46846d71645d06d7958b59d38b1a0b93ef2b1b7d3c0ff99b697ada1
|
3 |
+
size 805863719
|
pytorch_model-00002-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c71e90696aedaa0e2a6745e69c4f49941a40624a411c0edb8351f21d7a019e8
|
3 |
+
size 805863719
|
pytorch_model-00003-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc401f17791cdf22626866d1748d44594a51938fd7c850b293e75defecb99089
|
3 |
+
size 805863783
|
pytorch_model-00004-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a0968d478fd16d8b57ff1b6c9ffa5b337e5111ef34802dff5e0905d9c62e66b
|
3 |
+
size 805863911
|
pytorch_model-00005-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57be95afaee854d5dfaadec6f95ddab45935aee8cc3991b73fa0b6822ddf2907
|
3 |
+
size 805863911
|
pytorch_model-00006-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f05157c4514d68c786cf5aa1636714040992b1d21798b57f806cf1443d3376a
|
3 |
+
size 805863911
|
pytorch_model-00007-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85726e3a23a92154d13c018401b00114049a98c3d1b56c249b6f9ec85883c32d
|
3 |
+
size 805863911
|
pytorch_model-00008-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7c689c11f2da39d0d855a8ac8ff0278bc695957b1a54ebb6ed46a1ec88166d4
|
3 |
+
size 805863911
|
pytorch_model-00009-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e455418ac3cc296e344286a915febd3259fd9ffc548076387b4ef735af0c4ef
|
3 |
+
size 805863911
|
pytorch_model-00010-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:344f01ee728c6ddc6cdf5bcc87629bdf8e2d42d1f7639a09e6056e291481cadc
|
3 |
+
size 805863911
|
pytorch_model-00011-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e867474f1e4e69dddd729b84dc3fbed76abca66ce68b5856f1332bcc68b86e96
|
3 |
+
size 805863911
|
pytorch_model-00012-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d46c82ff17f0bee7509773236c0333c7b64cce27b63d1fc9072c55fd7ad41e2
|
3 |
+
size 805863911
|
pytorch_model-00013-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d845d981401980c86847a505ae39f1362070a40ce4ce35f1b499fa3ae678de46
|
3 |
+
size 805863911
|
pytorch_model-00014-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9974bc4a62178dd2da3a0ce2c75ce148e86b740e8c4d7ff30ffe5db57649bc2b
|
3 |
+
size 805863911
|
pytorch_model-00015-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca956683ca9e7b4949cf7623c182333367c4f67da3066187f75bb75452188392
|
3 |
+
size 805863911
|
pytorch_model-00016-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83379b28761925cc4f08468135a09423a91444c56531b7c628b6342845fd1f9e
|
3 |
+
size 805863911
|
pytorch_model-00017-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e38f88c719432807a4d510b3784be867ab77fe9c9f4815d7ce84cc3866f6ab07
|
3 |
+
size 805863911
|
pytorch_model-00018-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed47c602051553a1bd96c8647a8a5fcb5639a54ae3bff19392ed6638e133f79f
|
3 |
+
size 805863911
|
pytorch_model-00019-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53e31bae07b5f2a69fbb2aab80949993550fcb6a38d1a130b6965a259d664644
|
3 |
+
size 805863911
|
pytorch_model-00020-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:925f232df288b51a24bc1b30d0310bcceb081838c466967db8a5e6113d0f2583
|
3 |
+
size 805863911
|
pytorch_model-00021-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e661a80c042a189159c81c29bd234f878313d6ae522d19b303379011a11d6f5
|
3 |
+
size 805863911
|
pytorch_model-00022-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5498281cf04bd187490f0d4334852e0d4ed5e87083c1af9bc64978ac00fa5735
|
3 |
+
size 805863911
|
pytorch_model-00023-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39ccf3e11b7d9a1d3c662ae5d85bf1d2502cc040ebaf0fff78db541a5caaebb1
|
3 |
+
size 805863911
|
pytorch_model-00024-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db45df5bcafe3f86da122a98f58519d1f1104ea8fcfac14dacec56cf5d8807e2
|
3 |
+
size 805863911
|
pytorch_model-00025-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc5f469c82883caf20eb0f8531a1387caf129d76b5e0258312e5d952d32af08e
|
3 |
+
size 805863911
|
pytorch_model-00026-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a36de78bd83d474cc71aab1ac7ee66b19207020fcedc167acbab949802c86e8
|
3 |
+
size 805864103
|
pytorch_model-00027-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bbf8f9fb75a5a24515940e12f300a8a2405a7f9cc206f4f6a8066b714de7904
|
3 |
+
size 805864103
|
pytorch_model-00028-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:325e94d9fdbd43e7107f19a93b50a9b2b958752187801fdb165207e887a85e5c
|
3 |
+
size 805864103
|
pytorch_model-00029-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9694df632accdef5417efd96d35fb32114b177bbd87e3256c6420c9eeaa3dbb7
|
3 |
+
size 805864103
|
pytorch_model-00030-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bf4acb18f9f1fcd53c504e4da1b8b69718cc85f3a9dce1f0e5f1ba2fb7dc2ea
|
3 |
+
size 805864103
|
pytorch_model-00031-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf8f5919ebba7393fe5353d1630569b67498a19e9dcb972690986f214e8ea4f1
|
3 |
+
size 805864103
|
pytorch_model-00032-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1098ea66577e21fea402f9aae090ff0f326490b0c22abfed765ede75868d68a6
|
3 |
+
size 805864103
|
pytorch_model-00033-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32731f543f13bf822547b5443b51719805878fa74d52f49660872c18e871cafe
|
3 |
+
size 805864103
|
pytorch_model-00034-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6ceb74ef8b5532cb61d2e1150f98dea2f992b6ded12508a357c93dca1ce6601
|
3 |
+
size 805864103
|
pytorch_model-00035-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bef6be88e1845b0b4803eaea312d25d5ac6ff4766ba2f9e9acffc684a6fd1a87
|
3 |
+
size 805864103
|
pytorch_model-00036-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d09352ca55737c00f25cd2d8da427623eb0eef698067eddc3b57b4a188f36988
|
3 |
+
size 805864103
|
pytorch_model-00037-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f0f842d94fc4c4402e09a667cf695610256e52c1a2b4265feb105cb11b135f9
|
3 |
+
size 805864103
|
pytorch_model-00038-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d288b3b8d1499304c2b3e4f2d8354ac09a82dbf3e7ba249382861c6793c58c9
|
3 |
+
size 805864103
|
pytorch_model-00039-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f250184e62af5b10f8922ec3388533421d42afb214d723680a8c290cd2030913
|
3 |
+
size 805864103
|
pytorch_model-00040-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ed0cc976baa2230c40dfe781482dd85e47a40c838cb9a041cab4775eb3ef4bd
|
3 |
+
size 805864103
|
pytorch_model-00041-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1eb4ae326ba957ea0ad5b4e5d809b020152c33ef131f401d0f7dd8f20514a240
|
3 |
+
size 805864103
|
pytorch_model-00042-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2f061cc81342734309de48590c792bf4ee90261674eed607036c175916ac947
|
3 |
+
size 805864103
|
pytorch_model-00043-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d71406e68bca7f4709547747d1fb6957cc335efcca016afef113d0396778d20f
|
3 |
+
size 805864103
|
pytorch_model-00044-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e89197e0a685965bed15b34e8765a3003086d759a8435b3f4d060c3313f9b44c
|
3 |
+
size 805864103
|
pytorch_model-00045-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3c2a1c9b56560f98c5fc2eaff55f39221b7a582edf118af7e686a8b712c88d7
|
3 |
+
size 805864103
|
pytorch_model-00046-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd2af36c9752848000d7470db4f1cf82573ba0645e64bb371b32c78c2b058866
|
3 |
+
size 805864103
|
pytorch_model-00047-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4c6606321c5f684898c31fc1c08450574bca881affb76b7a03f44154937ac31
|
3 |
+
size 805864103
|
pytorch_model-00048-of-00129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95b29aed8f540b71201283799a55c5a8dcfc38e21de101a1fc1ef1ddfec31e4f
|
3 |
+
size 805864103
|