Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +17 -0
- added_tokens.json +3 -0
- config.json +30 -0
- mergekit_config.yml +30 -0
- merges.txt +0 -0
- model-00001-of-00082.safetensors +3 -0
- model-00002-of-00082.safetensors +3 -0
- model-00003-of-00082.safetensors +3 -0
- model-00004-of-00082.safetensors +3 -0
- model-00005-of-00082.safetensors +3 -0
- model-00006-of-00082.safetensors +3 -0
- model-00007-of-00082.safetensors +3 -0
- model-00008-of-00082.safetensors +3 -0
- model-00009-of-00082.safetensors +3 -0
- model-00010-of-00082.safetensors +3 -0
- model-00011-of-00082.safetensors +3 -0
- model-00012-of-00082.safetensors +3 -0
- model-00013-of-00082.safetensors +3 -0
- model-00014-of-00082.safetensors +3 -0
- model-00015-of-00082.safetensors +3 -0
- model-00016-of-00082.safetensors +3 -0
- model-00017-of-00082.safetensors +3 -0
- model-00018-of-00082.safetensors +3 -0
- model-00019-of-00082.safetensors +3 -0
- model-00020-of-00082.safetensors +3 -0
- model-00021-of-00082.safetensors +3 -0
- model-00022-of-00082.safetensors +3 -0
- model-00023-of-00082.safetensors +3 -0
- model-00024-of-00082.safetensors +3 -0
- model-00025-of-00082.safetensors +3 -0
- model-00026-of-00082.safetensors +3 -0
- model-00027-of-00082.safetensors +3 -0
- model-00028-of-00082.safetensors +3 -0
- model-00029-of-00082.safetensors +3 -0
- model-00030-of-00082.safetensors +3 -0
- model-00031-of-00082.safetensors +3 -0
- model-00032-of-00082.safetensors +3 -0
- model-00033-of-00082.safetensors +3 -0
- model-00034-of-00082.safetensors +3 -0
- model-00035-of-00082.safetensors +3 -0
- model-00036-of-00082.safetensors +3 -0
- model-00037-of-00082.safetensors +3 -0
- model-00038-of-00082.safetensors +3 -0
- model-00039-of-00082.safetensors +3 -0
- model-00040-of-00082.safetensors +3 -0
- model-00041-of-00082.safetensors +3 -0
- model-00042-of-00082.safetensors +3 -0
- model-00043-of-00082.safetensors +3 -0
- model-00044-of-00082.safetensors +3 -0
- model-00045-of-00082.safetensors +3 -0
README.md
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
tags:
|
4 |
+
- merge
|
5 |
+
- mergekit
|
6 |
+
- lazymergekit
|
7 |
+
- migtissera/Tess-72B-v1.5b
|
8 |
+
- abacusai/Smaug-72B-v0.1
|
9 |
+
---
|
10 |
+
|
11 |
+
# ECE-TW3-JRGL-V3
|
12 |
+
|
13 |
+
ECE-TW3-JRGL-V3 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
|
14 |
+
* [migtissera/Tess-72B-v1.5b](https://huggingface.co/migtissera/Tess-72B-v1.5b)
|
15 |
+
* [abacusai/Smaug-72B-v0.1](https://huggingface.co/abacusai/Smaug-72B-v0.1)
|
16 |
+
|
17 |
+
## 🧩 Configuration
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"[PAD]": 151851
|
3 |
+
}
|
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "migtissera/Tess-72B-v1.5b",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128245,
|
9 |
+
"eos_token_id": 128247,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 24576,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 64,
|
19 |
+
"pad_token_id": 151643,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-06,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 1000000,
|
24 |
+
"seq_length": 32768,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "bfloat16",
|
27 |
+
"transformers_version": "4.39.3",
|
28 |
+
"use_cache": false,
|
29 |
+
"vocab_size": 152064
|
30 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
base_model: migtissera/Tess-72B-v1.5b
|
2 |
+
dtype: bfloat16
|
3 |
+
merge_method: slerp
|
4 |
+
parameters:
|
5 |
+
t:
|
6 |
+
- filter: self_attn
|
7 |
+
value:
|
8 |
+
- 0
|
9 |
+
- 0.5
|
10 |
+
- 0.3
|
11 |
+
- 0.7
|
12 |
+
- 1
|
13 |
+
- filter: mlp
|
14 |
+
value:
|
15 |
+
- 1
|
16 |
+
- 0.5
|
17 |
+
- 0.7
|
18 |
+
- 0.3
|
19 |
+
- 0
|
20 |
+
- value: 0.5
|
21 |
+
slices:
|
22 |
+
- sources:
|
23 |
+
- layer_range:
|
24 |
+
- 0
|
25 |
+
- 80
|
26 |
+
model: migtissera/Tess-72B-v1.5b
|
27 |
+
- layer_range:
|
28 |
+
- 0
|
29 |
+
- 80
|
30 |
+
model: abacusai/Smaug-72B-v0.1
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03c556d40850abccf7d25cf0fb1a081f51efb98af6bb627540641606be68c6b5
|
3 |
+
size 1879065656
|
model-00002-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67b881bbc5bc354c89978e8ec3535c1cb851b853891bb6de1ea8a0bb0ebfece0
|
3 |
+
size 402670048
|
model-00003-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a43130851c7ad8e89a98e9efe296ded2bde233d177d5ae3ccd92e44e3a5a9df
|
3 |
+
size 2491416720
|
model-00004-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f86236f418804108814d2d1791b23c7be957daa26a4c04bbbe9c93c1b13d4748
|
3 |
+
size 1879065656
|
model-00005-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd8b3835945902167d58e11592aebb582c7430d4e7c75bc135e5ccbd6afefde7
|
3 |
+
size 1879098632
|
model-00006-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b06578db796a63bc59f176f26121f8fc75c553e4562b605048382e67d27d750e
|
3 |
+
size 1610646216
|
model-00007-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a45576ce2744b561922a1b3da4e59da617a938b10e8c37ba66650c3778713492
|
3 |
+
size 1744864304
|
model-00008-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31574066e39a71fedd6073237dd92043951667b9d613e5fef5b547050092423e
|
3 |
+
size 1744864304
|
model-00009-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ede497a15f3235a377fe0f752c937240118f028bdf7433a35b72bcedeb0aab4b
|
3 |
+
size 1879081896
|
model-00010-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a4da81c5fb72d955350c4702c0f6f5f31a6903feccc00d0999560fda1012676
|
3 |
+
size 1879065656
|
model-00011-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b5d3f46cd504572fca62ec960adade4d7f9f0663ccf87527e76646a9c6a0139
|
3 |
+
size 1879082152
|
model-00012-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ed723de14eacd841fb27527ffeddac58cd41e04a1d0d4e9406822165bfd7945
|
3 |
+
size 1610630200
|
model-00013-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0bbf6dbfb817c36d5161f3bb1c2ef12fb58e397b5b9ff8efbf2ae0b15280c88
|
3 |
+
size 1744864312
|
model-00014-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c73b98095d58341ec1a463dad09a2eb7f0bffc7ceb04f3b88b14105b52dffdf9
|
3 |
+
size 1879115144
|
model-00015-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f0e72a42be44b636d073567d86775514b7144c1c4cbcd6a0a6417a49c29e612
|
3 |
+
size 1879065664
|
model-00016-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3f822f03e2c9be0dc4b450bd18bebedab6356dc7d7d2896361e4874ed71ba16
|
3 |
+
size 1879082160
|
model-00017-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:456801ddd7d3a0d0904e0f9facf6301b6d21881691f03dd5c46122a9fdc40bc3
|
3 |
+
size 1610662944
|
model-00018-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4de87aeaeccc7350a6196e1d4a003d587538734318b2d957dcb66c0f9675cc3
|
3 |
+
size 1744864312
|
model-00019-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3821233823a0a8dadd2ecf3c6e292802653d5974e0720540f6e638f12f82744
|
3 |
+
size 1744864312
|
model-00020-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89b6e53e939ff3c3167f4a0579364dadb2043c046df6a26f6bc4ad1a122875bd
|
3 |
+
size 1610646216
|
model-00021-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47d4845f3f34c503f14a327cf8dd2de1b9cfdf69d3b77277356594e8c73afadd
|
3 |
+
size 1744864312
|
model-00022-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2da51f9ae3eae4028fd12ce3714e98a8d98d76707a9d4511748d59b7375ada3
|
3 |
+
size 1744864312
|
model-00023-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36cb3ddfc41ec7c2022bd60f7f6e045dc0503f62959647299920e2971fa1fde9
|
3 |
+
size 1879082144
|
model-00024-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c315034611cf7e0edfb2fb65d1a8fb5087552c0e60e6ecfb814026a2838a20bd
|
3 |
+
size 1879082152
|
model-00025-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c76f96266ee13b843b91084c935a935e8d77ac5a0cb3278c46f5d3ec72a2f37
|
3 |
+
size 1744864304
|
model-00026-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:423a2e424c479976e3a862e684bc0f82127b015d71e11e30b00c964ce4029d5b
|
3 |
+
size 1744831312
|
model-00027-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ae121d73df2cad4057ee0e44a8fcb4938d4c92be0e4c0a2a571bdd30af6f72a
|
3 |
+
size 1744864312
|
model-00028-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20b84c3134ed316aa81308bd291af244f6b53904557f0cb9591bdf210e08b440
|
3 |
+
size 1879115384
|
model-00029-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5330afce9065b0380e1b5e14f1ff02e0f16bcba21a6416be8dad077984853b5
|
3 |
+
size 1744864304
|
model-00030-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f04df0219207c9ed395fd2f4f6283ec8b7023944d52159510fd3dee1bd221938
|
3 |
+
size 1744864304
|
model-00031-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d15ebf1489cc3594ed7e4f80b4b5d0ea89c1574c3ce7f92a5820d38598e76bdd
|
3 |
+
size 1879081912
|
model-00032-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f63eb3780cd0740ec1585ae836018a8731f2ba54ea9ea914a5424ffe131de8ec
|
3 |
+
size 1744864312
|
model-00033-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2df405a3a5bfea83001cd54db2573a1610de3335b6f696dd38a2ada17be1aca4
|
3 |
+
size 1744864312
|
model-00034-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b465295db14e645fe7c2a43f1a129964797b9ef0d1f3c3c1df970d9c576821d2
|
3 |
+
size 1879098416
|
model-00035-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad61aa98cf99902fcd255a4f6553f04fda5795b25d404c104d4859f8b621bd08
|
3 |
+
size 1879082160
|
model-00036-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e93a85a5ad272acdb10b14f46096ead98e342d838aca8fcdf4dacc03ff51002
|
3 |
+
size 1610662952
|
model-00037-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82f3751472212ddd67ebeae7340bb546eb5125c66a4b5f76307a28e7f21c65c9
|
3 |
+
size 1744831312
|
model-00038-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab36745bb6e06b60ab65ead009f66acc47e9c080010cdb4e9efc0663da3ceb7b
|
3 |
+
size 1744864312
|
model-00039-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7c0afdbf59b15dc412cca6cd76d579b1a19e101df5c025e1069dc816b92558c
|
3 |
+
size 1879082144
|
model-00040-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75206caa7a632d535e15871654a5c579bd385e0d534466578a53419b7387cf4f
|
3 |
+
size 1879065664
|
model-00041-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bcc6e409cbda48126c43cca861dd2b0fdbf6bb304150f16a8694591bdc55a4a
|
3 |
+
size 1879082160
|
model-00042-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72b1163ac7d9f71ff3057f7d152f58932df85687d975f388a2b1f55ff775a653
|
3 |
+
size 1879098640
|
model-00043-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df5504c6ea45c53a32711750f9caba3dd3801b30624884e2f4f856a2aaa3226a
|
3 |
+
size 1744864312
|
model-00044-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9cb1e5ff93a598e9f354d4d54af797899fed000b1762990c5309934035600c8
|
3 |
+
size 1879115144
|
model-00045-of-00082.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:067ded147fab7f3fee24fe43a1077e16dd9a4dac457689456cb99da96c6a6d8d
|
3 |
+
size 1879082152
|