Upload model
Browse files- README.md +369 -369
- config.json +27 -0
- model-00001-of-00006.safetensors +3 -0
- model-00002-of-00006.safetensors +3 -0
- model-00003-of-00006.safetensors +3 -0
- model-00004-of-00006.safetensors +3 -0
- model-00005-of-00006.safetensors +3 -0
- model-00006-of-00006.safetensors +3 -0
- model.safetensors.index.json +297 -0
README.md
CHANGED
@@ -9,12 +9,14 @@ tags:
|
|
9 |
model-index:
|
10 |
- name: Gouzi3618/LENS-8000
|
11 |
results:
|
12 |
-
-
|
13 |
-
|
|
|
14 |
name: MTEB AmazonCounterfactualClassification (en)
|
15 |
-
revision: e8379541af4e31359cca9fbcf4b00f2671dba205
|
16 |
-
split: test
|
17 |
type: mteb/amazon_counterfactual
|
|
|
|
|
|
|
18 |
metrics:
|
19 |
- type: accuracy
|
20 |
value: 93.6865671641791
|
@@ -28,14 +30,14 @@ model-index:
|
|
28 |
value: 93.87207694461506
|
29 |
- type: main_score
|
30 |
value: 93.6865671641791
|
31 |
-
|
32 |
type: Classification
|
33 |
-
|
34 |
-
config: default
|
35 |
name: MTEB AmazonPolarityClassification (default)
|
36 |
-
revision: e2d317d38cd51312af73b3d32a06d1a08b442046
|
37 |
-
split: test
|
38 |
type: mteb/amazon_polarity
|
|
|
|
|
|
|
39 |
metrics:
|
40 |
- type: accuracy
|
41 |
value: 97.06832499999999
|
@@ -49,14 +51,14 @@ model-index:
|
|
49 |
value: 97.06781792337515
|
50 |
- type: main_score
|
51 |
value: 97.06832499999999
|
52 |
-
|
53 |
type: Classification
|
54 |
-
|
55 |
-
config: en
|
56 |
name: MTEB AmazonReviewsClassification (en)
|
57 |
-
revision: 1399c76144fd37290681b995c656ef9b2e06e26d
|
58 |
-
split: test
|
59 |
type: mteb/amazon_reviews_multi
|
|
|
|
|
|
|
60 |
metrics:
|
61 |
- type: accuracy
|
62 |
value: 63.608
|
@@ -66,14 +68,14 @@ model-index:
|
|
66 |
value: 62.41274991021244
|
67 |
- type: main_score
|
68 |
value: 63.608
|
69 |
-
|
70 |
-
type:
|
71 |
-
|
72 |
-
config: default
|
73 |
name: MTEB ArguAna (default)
|
74 |
-
revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
|
75 |
-
split: test
|
76 |
type: mteb/arguana
|
|
|
|
|
|
|
77 |
metrics:
|
78 |
- type: main_score
|
79 |
value: 76.019
|
@@ -357,14 +359,14 @@ model-index:
|
|
357 |
value: 81.57900000000001
|
358 |
- type: recall_at_5
|
359 |
value: 89.403
|
360 |
-
|
361 |
-
type:
|
362 |
-
|
363 |
-
config: default
|
364 |
name: MTEB ArxivClusteringP2P (default)
|
365 |
-
revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
|
366 |
-
split: test
|
367 |
type: mteb/arxiv-clustering-p2p
|
|
|
|
|
|
|
368 |
metrics:
|
369 |
- type: main_score
|
370 |
value: 54.809064728970625
|
@@ -372,14 +374,14 @@ model-index:
|
|
372 |
value: 54.809064728970625
|
373 |
- type: v_measure_std
|
374 |
value: 14.497861425102215
|
375 |
-
|
376 |
type: Clustering
|
377 |
-
|
378 |
-
config: default
|
379 |
name: MTEB ArxivClusteringS2S (default)
|
380 |
-
revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
|
381 |
-
split: test
|
382 |
type: mteb/arxiv-clustering-s2s
|
|
|
|
|
|
|
383 |
metrics:
|
384 |
- type: main_score
|
385 |
value: 50.144159631474416
|
@@ -387,14 +389,14 @@ model-index:
|
|
387 |
value: 50.144159631474416
|
388 |
- type: v_measure_std
|
389 |
value: 14.596959041091187
|
390 |
-
|
391 |
-
type:
|
392 |
-
|
393 |
-
config: default
|
394 |
name: MTEB AskUbuntuDupQuestions (default)
|
395 |
-
revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
|
396 |
-
split: test
|
397 |
type: mteb/askubuntudupquestions-reranking
|
|
|
|
|
|
|
398 |
metrics:
|
399 |
- type: main_score
|
400 |
value: 65.74396432331054
|
@@ -414,14 +416,14 @@ model-index:
|
|
414 |
value: 34.51981156443003
|
415 |
- type: nAUC_mrr_std
|
416 |
value: 28.863440464092747
|
417 |
-
|
418 |
-
type:
|
419 |
-
|
420 |
-
config: default
|
421 |
name: MTEB BIOSSES (default)
|
422 |
-
revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
|
423 |
-
split: test
|
424 |
type: mteb/biosses-sts
|
|
|
|
|
|
|
425 |
metrics:
|
426 |
- type: cosine_pearson
|
427 |
value: 86.59612727828603
|
@@ -441,14 +443,14 @@ model-index:
|
|
441 |
value: 86.59612727828603
|
442 |
- type: spearman
|
443 |
value: 85.83087137728063
|
444 |
-
|
445 |
-
type:
|
446 |
-
|
447 |
-
config: default
|
448 |
name: MTEB Banking77Classification (default)
|
449 |
-
revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
|
450 |
-
split: test
|
451 |
type: mteb/banking77
|
|
|
|
|
|
|
452 |
metrics:
|
453 |
- type: accuracy
|
454 |
value: 90.19155844155846
|
@@ -458,14 +460,14 @@ model-index:
|
|
458 |
value: 90.05716678902826
|
459 |
- type: main_score
|
460 |
value: 90.19155844155846
|
461 |
-
|
462 |
-
type:
|
463 |
-
|
464 |
-
config: default
|
465 |
name: MTEB BiorxivClusteringP2P (default)
|
466 |
-
revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
|
467 |
-
split: test
|
468 |
type: mteb/biorxiv-clustering-p2p
|
|
|
|
|
|
|
469 |
metrics:
|
470 |
- type: main_score
|
471 |
value: 52.480294793961924
|
@@ -473,14 +475,14 @@ model-index:
|
|
473 |
value: 52.480294793961924
|
474 |
- type: v_measure_std
|
475 |
value: 0.5558452294416437
|
476 |
-
|
477 |
type: Clustering
|
478 |
-
|
479 |
-
config: default
|
480 |
name: MTEB BiorxivClusteringS2S (default)
|
481 |
-
revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
|
482 |
-
split: test
|
483 |
type: mteb/biorxiv-clustering-s2s
|
|
|
|
|
|
|
484 |
metrics:
|
485 |
- type: main_score
|
486 |
value: 48.51901581759115
|
@@ -488,14 +490,14 @@ model-index:
|
|
488 |
value: 48.51901581759115
|
489 |
- type: v_measure_std
|
490 |
value: 1.1094735884191569
|
491 |
-
|
492 |
-
type:
|
493 |
-
|
494 |
-
config: default
|
495 |
name: MTEB CQADupstackAndroidRetrieval (default)
|
496 |
-
revision: f46a197baaae43b4f621051089b82a364682dfeb
|
497 |
-
split: test
|
498 |
type: mteb/cqadupstack-android
|
|
|
|
|
|
|
499 |
metrics:
|
500 |
- type: main_score
|
501 |
value: 57.9
|
@@ -779,14 +781,14 @@ model-index:
|
|
779 |
value: 54.764
|
780 |
- type: recall_at_5
|
781 |
value: 62.089000000000006
|
782 |
-
|
783 |
type: Retrieval
|
784 |
-
|
785 |
-
config: default
|
786 |
name: MTEB CQADupstackEnglishRetrieval (default)
|
787 |
-
revision: ad9991cb51e31e31e430383c75ffb2885547b5f0
|
788 |
-
split: test
|
789 |
type: mteb/cqadupstack-english
|
|
|
|
|
|
|
790 |
metrics:
|
791 |
- type: main_score
|
792 |
value: 55.474000000000004
|
@@ -1070,14 +1072,14 @@ model-index:
|
|
1070 |
value: 53.36300000000001
|
1071 |
- type: recall_at_5
|
1072 |
value: 58.987
|
1073 |
-
|
1074 |
type: Retrieval
|
1075 |
-
|
1076 |
-
config: default
|
1077 |
name: MTEB CQADupstackGamingRetrieval (default)
|
1078 |
-
revision: 4885aa143210c98657558c04aaf3dc47cfb54340
|
1079 |
-
split: test
|
1080 |
type: mteb/cqadupstack-gaming
|
|
|
|
|
|
|
1081 |
metrics:
|
1082 |
- type: main_score
|
1083 |
value: 65.236
|
@@ -1361,14 +1363,14 @@ model-index:
|
|
1361 |
value: 65.359
|
1362 |
- type: recall_at_5
|
1363 |
value: 71.439
|
1364 |
-
|
1365 |
type: Retrieval
|
1366 |
-
|
1367 |
-
config: default
|
1368 |
name: MTEB CQADupstackGisRetrieval (default)
|
1369 |
-
revision: 5003b3064772da1887988e05400cf3806fe491f2
|
1370 |
-
split: test
|
1371 |
type: mteb/cqadupstack-gis
|
|
|
|
|
|
|
1372 |
metrics:
|
1373 |
- type: main_score
|
1374 |
value: 43.736999999999995
|
@@ -1652,14 +1654,14 @@ model-index:
|
|
1652 |
value: 42.295
|
1653 |
- type: recall_at_5
|
1654 |
value: 49.275999999999996
|
1655 |
-
|
1656 |
type: Retrieval
|
1657 |
-
|
1658 |
-
config: default
|
1659 |
name: MTEB CQADupstackMathematicaRetrieval (default)
|
1660 |
-
revision: 90fceea13679c63fe563ded68f3b6f06e50061de
|
1661 |
-
split: test
|
1662 |
type: mteb/cqadupstack-mathematica
|
|
|
|
|
|
|
1663 |
metrics:
|
1664 |
- type: main_score
|
1665 |
value: 38.766
|
@@ -1943,14 +1945,14 @@ model-index:
|
|
1943 |
value: 36.278
|
1944 |
- type: recall_at_5
|
1945 |
value: 43.38
|
1946 |
-
|
1947 |
type: Retrieval
|
1948 |
-
|
1949 |
-
config: default
|
1950 |
name: MTEB CQADupstackPhysicsRetrieval (default)
|
1951 |
-
revision: 79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4
|
1952 |
-
split: test
|
1953 |
type: mteb/cqadupstack-physics
|
|
|
|
|
|
|
1954 |
metrics:
|
1955 |
- type: main_score
|
1956 |
value: 53.893
|
@@ -2234,14 +2236,14 @@ model-index:
|
|
2234 |
value: 52.5
|
2235 |
- type: recall_at_5
|
2236 |
value: 59.489000000000004
|
2237 |
-
|
2238 |
type: Retrieval
|
2239 |
-
|
2240 |
-
config: default
|
2241 |
name: MTEB CQADupstackProgrammersRetrieval (default)
|
2242 |
-
revision: 6184bc1440d2dbc7612be22b50686b8826d22b32
|
2243 |
-
split: test
|
2244 |
type: mteb/cqadupstack-programmers
|
|
|
|
|
|
|
2245 |
metrics:
|
2246 |
- type: main_score
|
2247 |
value: 51.151
|
@@ -2525,27 +2527,27 @@ model-index:
|
|
2525 |
value: 48.254000000000005
|
2526 |
- type: recall_at_5
|
2527 |
value: 55.595000000000006
|
2528 |
-
|
2529 |
type: Retrieval
|
2530 |
-
|
2531 |
-
config: default
|
2532 |
name: MTEB CQADupstackRetrieval (default)
|
2533 |
-
revision: CQADupstackRetrieval_is_a_combined_dataset
|
2534 |
-
split: test
|
2535 |
type: CQADupstackRetrieval_is_a_combined_dataset
|
|
|
|
|
|
|
2536 |
metrics:
|
2537 |
- type: main_score
|
2538 |
value: 48.669000000000004
|
2539 |
- type: ndcg_at_10
|
2540 |
value: 48.669000000000004
|
2541 |
-
|
2542 |
type: Retrieval
|
2543 |
-
|
2544 |
-
config: default
|
2545 |
name: MTEB CQADupstackStatsRetrieval (default)
|
2546 |
-
revision: 65ac3a16b8e91f9cee4c9828cc7c335575432a2a
|
2547 |
-
split: test
|
2548 |
type: mteb/cqadupstack-stats
|
|
|
|
|
|
|
2549 |
metrics:
|
2550 |
- type: main_score
|
2551 |
value: 41.521
|
@@ -2829,14 +2831,14 @@ model-index:
|
|
2829 |
value: 40.373
|
2830 |
- type: recall_at_5
|
2831 |
value: 46.421
|
2832 |
-
|
2833 |
type: Retrieval
|
2834 |
-
|
2835 |
-
config: default
|
2836 |
name: MTEB CQADupstackTexRetrieval (default)
|
2837 |
-
revision: 46989137a86843e03a6195de44b09deda022eec7
|
2838 |
-
split: test
|
2839 |
type: mteb/cqadupstack-tex
|
|
|
|
|
|
|
2840 |
metrics:
|
2841 |
- type: main_score
|
2842 |
value: 37.183
|
@@ -3120,14 +3122,14 @@ model-index:
|
|
3120 |
value: 35.522999999999996
|
3121 |
- type: recall_at_5
|
3122 |
value: 41.746
|
3123 |
-
|
3124 |
type: Retrieval
|
3125 |
-
|
3126 |
-
config: default
|
3127 |
name: MTEB CQADupstackUnixRetrieval (default)
|
3128 |
-
revision: 6c6430d3a6d36f8d2a829195bc5dc94d7e063e53
|
3129 |
-
split: test
|
3130 |
type: mteb/cqadupstack-unix
|
|
|
|
|
|
|
3131 |
metrics:
|
3132 |
- type: main_score
|
3133 |
value: 51.396
|
@@ -3411,14 +3413,14 @@ model-index:
|
|
3411 |
value: 49.833
|
3412 |
- type: recall_at_5
|
3413 |
value: 55.145999999999994
|
3414 |
-
|
3415 |
type: Retrieval
|
3416 |
-
|
3417 |
-
config: default
|
3418 |
name: MTEB CQADupstackWebmastersRetrieval (default)
|
3419 |
-
revision: 160c094312a0e1facb97e55eeddb698c0abe3571
|
3420 |
-
split: test
|
3421 |
type: mteb/cqadupstack-webmasters
|
|
|
|
|
|
|
3422 |
metrics:
|
3423 |
- type: main_score
|
3424 |
value: 48.229
|
@@ -3702,14 +3704,14 @@ model-index:
|
|
3702 |
value: 45.072
|
3703 |
- type: recall_at_5
|
3704 |
value: 52.993
|
3705 |
-
|
3706 |
type: Retrieval
|
3707 |
-
|
3708 |
-
config: default
|
3709 |
name: MTEB CQADupstackWordpressRetrieval (default)
|
3710 |
-
revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
|
3711 |
-
split: test
|
3712 |
type: mteb/cqadupstack-wordpress
|
|
|
|
|
|
|
3713 |
metrics:
|
3714 |
- type: main_score
|
3715 |
value: 39.542
|
@@ -3993,14 +3995,14 @@ model-index:
|
|
3993 |
value: 38.29
|
3994 |
- type: recall_at_5
|
3995 |
value: 43.817
|
3996 |
-
|
3997 |
type: Retrieval
|
3998 |
-
|
3999 |
-
config: default
|
4000 |
name: MTEB ClimateFEVER (default)
|
4001 |
-
revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
|
4002 |
-
split: test
|
4003 |
type: mteb/climate-fever
|
|
|
|
|
|
|
4004 |
metrics:
|
4005 |
- type: main_score
|
4006 |
value: 45.765
|
@@ -4284,14 +4286,14 @@ model-index:
|
|
4284 |
value: 34.846
|
4285 |
- type: recall_at_5
|
4286 |
value: 43.504
|
4287 |
-
|
4288 |
type: Retrieval
|
4289 |
-
|
4290 |
-
config: default
|
4291 |
name: MTEB DBPedia (default)
|
4292 |
-
revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
|
4293 |
-
split: test
|
4294 |
type: mteb/dbpedia
|
|
|
|
|
|
|
4295 |
metrics:
|
4296 |
- type: main_score
|
4297 |
value: 49.747
|
@@ -4575,14 +4577,14 @@ model-index:
|
|
4575 |
value: 17.218
|
4576 |
- type: recall_at_5
|
4577 |
value: 21.275
|
4578 |
-
|
4579 |
-
type:
|
4580 |
-
|
4581 |
-
config: default
|
4582 |
name: MTEB EmotionClassification (default)
|
4583 |
-
revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
|
4584 |
-
split: test
|
4585 |
type: mteb/emotion
|
|
|
|
|
|
|
4586 |
metrics:
|
4587 |
- type: accuracy
|
4588 |
value: 91.86500000000001
|
@@ -4592,14 +4594,14 @@ model-index:
|
|
4592 |
value: 92.0659899919408
|
4593 |
- type: main_score
|
4594 |
value: 91.86500000000001
|
4595 |
-
|
4596 |
-
type:
|
4597 |
-
|
4598 |
-
config: default
|
4599 |
name: MTEB FEVER (default)
|
4600 |
-
revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
|
4601 |
-
split: test
|
4602 |
type: mteb/fever
|
|
|
|
|
|
|
4603 |
metrics:
|
4604 |
- type: main_score
|
4605 |
value: 92.324
|
@@ -4883,14 +4885,14 @@ model-index:
|
|
4883 |
value: 93.806
|
4884 |
- type: recall_at_5
|
4885 |
value: 95.36
|
4886 |
-
|
4887 |
type: Retrieval
|
4888 |
-
|
4889 |
-
config: default
|
4890 |
name: MTEB FiQA2018 (default)
|
4891 |
-
revision: 27a168819829fe9bcd655c2df245fb19452e8e06
|
4892 |
-
split: test
|
4893 |
type: mteb/fiqa
|
|
|
|
|
|
|
4894 |
metrics:
|
4895 |
- type: main_score
|
4896 |
value: 61.565999999999995
|
@@ -5174,14 +5176,14 @@ model-index:
|
|
5174 |
value: 51.782
|
5175 |
- type: recall_at_5
|
5176 |
value: 59.911
|
5177 |
-
|
5178 |
type: Retrieval
|
5179 |
-
|
5180 |
-
config: default
|
5181 |
name: MTEB HotpotQA (default)
|
5182 |
-
revision: ab518f4d6fcca38d87c25209f94beba119d02014
|
5183 |
-
split: test
|
5184 |
type: mteb/hotpotqa
|
|
|
|
|
|
|
5185 |
metrics:
|
5186 |
- type: main_score
|
5187 |
value: 85.71
|
@@ -5465,14 +5467,14 @@ model-index:
|
|
5465 |
value: 80.891
|
5466 |
- type: recall_at_5
|
5467 |
value: 85.307
|
5468 |
-
|
5469 |
-
type:
|
5470 |
-
|
5471 |
-
config: default
|
5472 |
name: MTEB ImdbClassification (default)
|
5473 |
-
revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
|
5474 |
-
split: test
|
5475 |
type: mteb/imdb
|
|
|
|
|
|
|
5476 |
metrics:
|
5477 |
- type: accuracy
|
5478 |
value: 96.9972
|
@@ -5486,14 +5488,14 @@ model-index:
|
|
5486 |
value: 96.99685931130435
|
5487 |
- type: main_score
|
5488 |
value: 96.9972
|
5489 |
-
|
5490 |
-
type:
|
5491 |
-
|
5492 |
-
config: default
|
5493 |
name: MTEB MSMARCO (default)
|
5494 |
-
revision: c5a29a104738b98a9e76336939199e264163d4a0
|
5495 |
-
split: dev
|
5496 |
type: mteb/msmarco
|
|
|
|
|
|
|
5497 |
metrics:
|
5498 |
- type: main_score
|
5499 |
value: 47.238
|
@@ -5777,14 +5779,14 @@ model-index:
|
|
5777 |
value: 47.714
|
5778 |
- type: recall_at_5
|
5779 |
value: 57.913000000000004
|
5780 |
-
|
5781 |
-
type:
|
5782 |
-
|
5783 |
-
config: en
|
5784 |
name: MTEB MTOPDomainClassification (en)
|
5785 |
-
revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
|
5786 |
-
split: test
|
5787 |
type: mteb/mtop_domain
|
|
|
|
|
|
|
5788 |
metrics:
|
5789 |
- type: accuracy
|
5790 |
value: 97.43502051983585
|
@@ -5794,14 +5796,14 @@ model-index:
|
|
5794 |
value: 97.44797640554678
|
5795 |
- type: main_score
|
5796 |
value: 97.43502051983585
|
5797 |
-
|
5798 |
type: Classification
|
5799 |
-
|
5800 |
-
config: en
|
5801 |
name: MTEB MTOPIntentClassification (en)
|
5802 |
-
revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
|
5803 |
-
split: test
|
5804 |
type: mteb/mtop_intent
|
|
|
|
|
|
|
5805 |
metrics:
|
5806 |
- type: accuracy
|
5807 |
value: 92.80665754673961
|
@@ -5811,14 +5813,14 @@ model-index:
|
|
5811 |
value: 93.45063761064331
|
5812 |
- type: main_score
|
5813 |
value: 92.80665754673961
|
5814 |
-
|
5815 |
type: Classification
|
5816 |
-
|
5817 |
-
config: en
|
5818 |
name: MTEB MassiveIntentClassification (en)
|
5819 |
-
revision: 4672e20407010da34463acc759c162ca9734bca6
|
5820 |
-
split: test
|
5821 |
type: mteb/amazon_massive_intent
|
|
|
|
|
|
|
5822 |
metrics:
|
5823 |
- type: accuracy
|
5824 |
value: 81.14324142568931
|
@@ -5828,14 +5830,14 @@ model-index:
|
|
5828 |
value: 80.06102282439677
|
5829 |
- type: main_score
|
5830 |
value: 81.14324142568931
|
5831 |
-
|
5832 |
type: Classification
|
5833 |
-
|
5834 |
-
config: en
|
5835 |
name: MTEB MassiveScenarioClassification (en)
|
5836 |
-
revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
|
5837 |
-
split: test
|
5838 |
type: mteb/amazon_massive_scenario
|
|
|
|
|
|
|
5839 |
metrics:
|
5840 |
- type: accuracy
|
5841 |
value: 83.52723604572965
|
@@ -5845,14 +5847,14 @@ model-index:
|
|
5845 |
value: 83.18340208761732
|
5846 |
- type: main_score
|
5847 |
value: 83.52723604572965
|
5848 |
-
|
5849 |
-
type:
|
5850 |
-
|
5851 |
-
config: default
|
5852 |
name: MTEB MedrxivClusteringP2P (default)
|
5853 |
-
revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
|
5854 |
-
split: test
|
5855 |
type: mteb/medrxiv-clustering-p2p
|
|
|
|
|
|
|
5856 |
metrics:
|
5857 |
- type: main_score
|
5858 |
value: 46.38149873605036
|
@@ -5860,14 +5862,14 @@ model-index:
|
|
5860 |
value: 46.38149873605036
|
5861 |
- type: v_measure_std
|
5862 |
value: 1.0749788856434186
|
5863 |
-
|
5864 |
type: Clustering
|
5865 |
-
|
5866 |
-
config: default
|
5867 |
name: MTEB MedrxivClusteringS2S (default)
|
5868 |
-
revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
|
5869 |
-
split: test
|
5870 |
type: mteb/medrxiv-clustering-s2s
|
|
|
|
|
|
|
5871 |
metrics:
|
5872 |
- type: main_score
|
5873 |
value: 44.8945524407664
|
@@ -5875,14 +5877,14 @@ model-index:
|
|
5875 |
value: 44.8945524407664
|
5876 |
- type: v_measure_std
|
5877 |
value: 1.2389193370528488
|
5878 |
-
|
5879 |
-
type:
|
5880 |
-
|
5881 |
-
config: default
|
5882 |
name: MTEB MindSmallReranking (default)
|
5883 |
-
revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
|
5884 |
-
split: test
|
5885 |
type: mteb/mind_small
|
|
|
|
|
|
|
5886 |
metrics:
|
5887 |
- type: main_score
|
5888 |
value: 31.464871623418794
|
@@ -5902,14 +5904,14 @@ model-index:
|
|
5902 |
value: -19.359704641723024
|
5903 |
- type: nAUC_mrr_std
|
5904 |
value: 0.2553333974009825
|
5905 |
-
|
5906 |
-
type:
|
5907 |
-
|
5908 |
-
config: default
|
5909 |
name: MTEB NFCorpus (default)
|
5910 |
-
revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
|
5911 |
-
split: test
|
5912 |
type: mteb/nfcorpus
|
|
|
|
|
|
|
5913 |
metrics:
|
5914 |
- type: main_score
|
5915 |
value: 40.608
|
@@ -6193,14 +6195,14 @@ model-index:
|
|
6193 |
value: 12.592999999999998
|
6194 |
- type: recall_at_5
|
6195 |
value: 15.847
|
6196 |
-
|
6197 |
type: Retrieval
|
6198 |
-
|
6199 |
-
config: default
|
6200 |
name: MTEB NQ (default)
|
6201 |
-
revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
|
6202 |
-
split: test
|
6203 |
type: mteb/nq
|
|
|
|
|
|
|
6204 |
metrics:
|
6205 |
- type: main_score
|
6206 |
value: 74.639
|
@@ -6484,14 +6486,14 @@ model-index:
|
|
6484 |
value: 76.32
|
6485 |
- type: recall_at_5
|
6486 |
value: 83.992
|
6487 |
-
|
6488 |
type: Retrieval
|
6489 |
-
|
6490 |
-
config: default
|
6491 |
name: MTEB QuoraRetrieval (default)
|
6492 |
-
revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
|
6493 |
-
split: test
|
6494 |
type: mteb/quora
|
|
|
|
|
|
|
6495 |
metrics:
|
6496 |
- type: main_score
|
6497 |
value: 90.78500000000001
|
@@ -6775,14 +6777,14 @@ model-index:
|
|
6775 |
value: 89.85499999999999
|
6776 |
- type: recall_at_5
|
6777 |
value: 93.758
|
6778 |
-
|
6779 |
-
type:
|
6780 |
-
|
6781 |
-
config: default
|
6782 |
name: MTEB RedditClustering (default)
|
6783 |
-
revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
|
6784 |
-
split: test
|
6785 |
type: mteb/reddit-clustering
|
|
|
|
|
|
|
6786 |
metrics:
|
6787 |
- type: main_score
|
6788 |
value: 72.36527124460562
|
@@ -6790,14 +6792,14 @@ model-index:
|
|
6790 |
value: 72.36527124460562
|
6791 |
- type: v_measure_std
|
6792 |
value: 2.7778891945364195
|
6793 |
-
|
6794 |
type: Clustering
|
6795 |
-
|
6796 |
-
config: default
|
6797 |
name: MTEB RedditClusteringP2P (default)
|
6798 |
-
revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
|
6799 |
-
split: test
|
6800 |
type: mteb/reddit-clustering-p2p
|
|
|
|
|
|
|
6801 |
metrics:
|
6802 |
- type: main_score
|
6803 |
value: 73.89142551084535
|
@@ -6805,14 +6807,14 @@ model-index:
|
|
6805 |
value: 73.89142551084535
|
6806 |
- type: v_measure_std
|
6807 |
value: 11.258242813412751
|
6808 |
-
|
6809 |
-
type:
|
6810 |
-
|
6811 |
-
config: default
|
6812 |
name: MTEB SCIDOCS (default)
|
6813 |
-
revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
|
6814 |
-
split: test
|
6815 |
type: mteb/scidocs
|
|
|
|
|
|
|
6816 |
metrics:
|
6817 |
- type: main_score
|
6818 |
value: 28.538000000000004
|
@@ -7096,14 +7098,14 @@ model-index:
|
|
7096 |
value: 15.573
|
7097 |
- type: recall_at_5
|
7098 |
value: 20.948
|
7099 |
-
|
7100 |
-
type:
|
7101 |
-
|
7102 |
-
config: default
|
7103 |
name: MTEB SICK-R (default)
|
7104 |
-
revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
|
7105 |
-
split: test
|
7106 |
type: mteb/sickr-sts
|
|
|
|
|
|
|
7107 |
metrics:
|
7108 |
- type: cosine_pearson
|
7109 |
value: 84.37281363343187
|
@@ -7123,14 +7125,14 @@ model-index:
|
|
7123 |
value: 84.37281363343187
|
7124 |
- type: spearman
|
7125 |
value: 83.30200195593044
|
7126 |
-
|
7127 |
type: STS
|
7128 |
-
|
7129 |
-
config: default
|
7130 |
name: MTEB STS12 (default)
|
7131 |
-
revision: a0d554a64d88156834ff5ae9920b964011b16384
|
7132 |
-
split: test
|
7133 |
type: mteb/sts12-sts
|
|
|
|
|
|
|
7134 |
metrics:
|
7135 |
- type: cosine_pearson
|
7136 |
value: 86.82824905521925
|
@@ -7150,14 +7152,14 @@ model-index:
|
|
7150 |
value: 86.82824905521925
|
7151 |
- type: spearman
|
7152 |
value: 80.98590815911939
|
7153 |
-
|
7154 |
type: STS
|
7155 |
-
|
7156 |
-
config: default
|
7157 |
name: MTEB STS13 (default)
|
7158 |
-
revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
|
7159 |
-
split: test
|
7160 |
type: mteb/sts13-sts
|
|
|
|
|
|
|
7161 |
metrics:
|
7162 |
- type: cosine_pearson
|
7163 |
value: 87.19722316157294
|
@@ -7177,14 +7179,14 @@ model-index:
|
|
7177 |
value: 87.19722316157294
|
7178 |
- type: spearman
|
7179 |
value: 87.34287142701457
|
7180 |
-
|
7181 |
type: STS
|
7182 |
-
|
7183 |
-
config: default
|
7184 |
name: MTEB STS14 (default)
|
7185 |
-
revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
|
7186 |
-
split: test
|
7187 |
type: mteb/sts14-sts
|
|
|
|
|
|
|
7188 |
metrics:
|
7189 |
- type: cosine_pearson
|
7190 |
value: 84.82646675904164
|
@@ -7204,14 +7206,14 @@ model-index:
|
|
7204 |
value: 84.82646675904164
|
7205 |
- type: spearman
|
7206 |
value: 84.38843815801556
|
7207 |
-
|
7208 |
type: STS
|
7209 |
-
|
7210 |
-
config: default
|
7211 |
name: MTEB STS15 (default)
|
7212 |
-
revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
|
7213 |
-
split: test
|
7214 |
type: mteb/sts15-sts
|
|
|
|
|
|
|
7215 |
metrics:
|
7216 |
- type: cosine_pearson
|
7217 |
value: 89.69909533656704
|
@@ -7231,14 +7233,14 @@ model-index:
|
|
7231 |
value: 89.69909533656704
|
7232 |
- type: spearman
|
7233 |
value: 89.74723322749233
|
7234 |
-
|
7235 |
type: STS
|
7236 |
-
|
7237 |
-
config: default
|
7238 |
name: MTEB STS16 (default)
|
7239 |
-
revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
|
7240 |
-
split: test
|
7241 |
type: mteb/sts16-sts
|
|
|
|
|
|
|
7242 |
metrics:
|
7243 |
- type: cosine_pearson
|
7244 |
value: 86.84947603401746
|
@@ -7258,14 +7260,14 @@ model-index:
|
|
7258 |
value: 86.84947603401746
|
7259 |
- type: spearman
|
7260 |
value: 87.63022743056388
|
7261 |
-
|
7262 |
type: STS
|
7263 |
-
|
7264 |
-
config: en-en
|
7265 |
name: MTEB STS17 (en-en)
|
7266 |
-
revision: faeb762787bd10488a50c8b5be4a3b82e411949c
|
7267 |
-
split: test
|
7268 |
type: mteb/sts17-crosslingual-sts
|
|
|
|
|
|
|
7269 |
metrics:
|
7270 |
- type: cosine_pearson
|
7271 |
value: 91.43391567649913
|
@@ -7285,14 +7287,14 @@ model-index:
|
|
7285 |
value: 91.43391567649913
|
7286 |
- type: spearman
|
7287 |
value: 90.86953801008369
|
7288 |
-
|
7289 |
type: STS
|
7290 |
-
|
7291 |
-
config: en
|
7292 |
name: MTEB STS22 (en)
|
7293 |
-
revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
|
7294 |
-
split: test
|
7295 |
type: mteb/sts22-crosslingual-sts
|
|
|
|
|
|
|
7296 |
metrics:
|
7297 |
- type: cosine_pearson
|
7298 |
value: 68.81338409687908
|
@@ -7312,14 +7314,14 @@ model-index:
|
|
7312 |
value: 68.81338409687908
|
7313 |
- type: spearman
|
7314 |
value: 68.09215270009086
|
7315 |
-
|
7316 |
type: STS
|
7317 |
-
|
7318 |
-
config: default
|
7319 |
name: MTEB STSBenchmark (default)
|
7320 |
-
revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
|
7321 |
-
split: test
|
7322 |
type: mteb/stsbenchmark-sts
|
|
|
|
|
|
|
7323 |
metrics:
|
7324 |
- type: cosine_pearson
|
7325 |
value: 87.93191595794555
|
@@ -7339,14 +7341,14 @@ model-index:
|
|
7339 |
value: 87.93191595794555
|
7340 |
- type: spearman
|
7341 |
value: 88.46646307403641
|
7342 |
-
|
7343 |
-
type:
|
7344 |
-
|
7345 |
-
config: default
|
7346 |
name: MTEB SciDocsRR (default)
|
7347 |
-
revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
|
7348 |
-
split: test
|
7349 |
type: mteb/scidocs-reranking
|
|
|
|
|
|
|
7350 |
metrics:
|
7351 |
- type: main_score
|
7352 |
value: 87.62672056519489
|
@@ -7366,14 +7368,14 @@ model-index:
|
|
7366 |
value: 82.4844792677926
|
7367 |
- type: nAUC_mrr_std
|
7368 |
value: 82.0357865297397
|
7369 |
-
|
7370 |
-
type:
|
7371 |
-
|
7372 |
-
config: default
|
7373 |
name: MTEB SciFact (default)
|
7374 |
-
revision: 0228b52cf27578f30900b9e5271d331663a030d7
|
7375 |
-
split: test
|
7376 |
type: mteb/scifact
|
|
|
|
|
|
|
7377 |
metrics:
|
7378 |
- type: main_score
|
7379 |
value: 79.745
|
@@ -7657,14 +7659,14 @@ model-index:
|
|
7657 |
value: 81.072
|
7658 |
- type: recall_at_5
|
7659 |
value: 87.339
|
7660 |
-
|
7661 |
-
type:
|
7662 |
-
|
7663 |
-
config: default
|
7664 |
name: MTEB SprintDuplicateQuestions (default)
|
7665 |
-
revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
|
7666 |
-
split: test
|
7667 |
type: mteb/sprintduplicatequestions-pairclassification
|
|
|
|
|
|
|
7668 |
metrics:
|
7669 |
- type: cosine_accuracy
|
7670 |
value: 99.86039603960396
|
@@ -7748,14 +7750,14 @@ model-index:
|
|
7748 |
value: 93.69277721261444
|
7749 |
- type: similarity_recall
|
7750 |
value: 92.10000000000001
|
7751 |
-
|
7752 |
-
type:
|
7753 |
-
|
7754 |
-
config: default
|
7755 |
name: MTEB StackExchangeClustering (default)
|
7756 |
-
revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
|
7757 |
-
split: test
|
7758 |
type: mteb/stackexchange-clustering
|
|
|
|
|
|
|
7759 |
metrics:
|
7760 |
- type: main_score
|
7761 |
value: 81.5950420419382
|
@@ -7763,14 +7765,14 @@ model-index:
|
|
7763 |
value: 81.5950420419382
|
7764 |
- type: v_measure_std
|
7765 |
value: 2.3518861207789126
|
7766 |
-
|
7767 |
type: Clustering
|
7768 |
-
|
7769 |
-
config: default
|
7770 |
name: MTEB StackExchangeClusteringP2P (default)
|
7771 |
-
revision: 815ca46b2622cec33ccafc3735d572c266efdb44
|
7772 |
-
split: test
|
7773 |
type: mteb/stackexchange-clustering-p2p
|
|
|
|
|
|
|
7774 |
metrics:
|
7775 |
- type: main_score
|
7776 |
value: 44.40836435329055
|
@@ -7778,14 +7780,14 @@ model-index:
|
|
7778 |
value: 44.40836435329055
|
7779 |
- type: v_measure_std
|
7780 |
value: 1.3850659888959282
|
7781 |
-
|
7782 |
-
type:
|
7783 |
-
|
7784 |
-
config: default
|
7785 |
name: MTEB StackOverflowDupQuestions (default)
|
7786 |
-
revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
|
7787 |
-
split: test
|
7788 |
type: mteb/stackoverflowdupquestions-reranking
|
|
|
|
|
|
|
7789 |
metrics:
|
7790 |
- type: main_score
|
7791 |
value: 58.792345747482436
|
@@ -7805,14 +7807,14 @@ model-index:
|
|
7805 |
value: 14.587424770057197
|
7806 |
- type: nAUC_mrr_std
|
7807 |
value: 6.683981115477786
|
7808 |
-
|
7809 |
-
type:
|
7810 |
-
|
7811 |
-
config: default
|
7812 |
name: MTEB SummEval (default)
|
7813 |
-
revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
|
7814 |
-
split: test
|
7815 |
type: mteb/summeval
|
|
|
|
|
|
|
7816 |
metrics:
|
7817 |
- type: cosine_pearson
|
7818 |
value: 29.605378173647523
|
@@ -7828,14 +7830,14 @@ model-index:
|
|
7828 |
value: 29.605378173647523
|
7829 |
- type: spearman
|
7830 |
value: 29.538937618105475
|
7831 |
-
|
7832 |
-
type:
|
7833 |
-
|
7834 |
-
config: default
|
7835 |
name: MTEB TRECCOVID (default)
|
7836 |
-
revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
|
7837 |
-
split: test
|
7838 |
type: mteb/trec-covid
|
|
|
|
|
|
|
7839 |
metrics:
|
7840 |
- type: main_score
|
7841 |
value: 77.17500000000001
|
@@ -8119,14 +8121,14 @@ model-index:
|
|
8119 |
value: 0.677
|
8120 |
- type: recall_at_5
|
8121 |
value: 1.087
|
8122 |
-
|
8123 |
type: Retrieval
|
8124 |
-
|
8125 |
-
config: default
|
8126 |
name: MTEB Touche2020 (default)
|
8127 |
-
revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
|
8128 |
-
split: test
|
8129 |
type: mteb/touche2020
|
|
|
|
|
|
|
8130 |
metrics:
|
8131 |
- type: main_score
|
8132 |
value: 29.343000000000004
|
@@ -8410,14 +8412,14 @@ model-index:
|
|
8410 |
value: 7.868
|
8411 |
- type: recall_at_5
|
8412 |
value: 11.413
|
8413 |
-
|
8414 |
-
type:
|
8415 |
-
|
8416 |
-
config: default
|
8417 |
name: MTEB ToxicConversationsClassification (default)
|
8418 |
-
revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
|
8419 |
-
split: test
|
8420 |
type: mteb/toxic_conversations_50k
|
|
|
|
|
|
|
8421 |
metrics:
|
8422 |
- type: accuracy
|
8423 |
value: 92.3681640625
|
@@ -8431,14 +8433,14 @@ model-index:
|
|
8431 |
value: 93.14474638528736
|
8432 |
- type: main_score
|
8433 |
value: 92.3681640625
|
8434 |
-
|
8435 |
type: Classification
|
8436 |
-
|
8437 |
-
config: default
|
8438 |
name: MTEB TweetSentimentExtractionClassification (default)
|
8439 |
-
revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
|
8440 |
-
split: test
|
8441 |
type: mteb/tweet_sentiment_extraction
|
|
|
|
|
|
|
8442 |
metrics:
|
8443 |
- type: accuracy
|
8444 |
value: 80.42161856253539
|
@@ -8448,14 +8450,14 @@ model-index:
|
|
8448 |
value: 80.3228654725881
|
8449 |
- type: main_score
|
8450 |
value: 80.42161856253539
|
8451 |
-
|
8452 |
-
type:
|
8453 |
-
|
8454 |
-
config: default
|
8455 |
name: MTEB TwentyNewsgroupsClustering (default)
|
8456 |
-
revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
|
8457 |
-
split: test
|
8458 |
type: mteb/twentynewsgroups-clustering
|
|
|
|
|
|
|
8459 |
metrics:
|
8460 |
- type: main_score
|
8461 |
value: 68.78385330772423
|
@@ -8463,14 +8465,14 @@ model-index:
|
|
8463 |
value: 68.78385330772423
|
8464 |
- type: v_measure_std
|
8465 |
value: 1.4814035017480702
|
8466 |
-
|
8467 |
-
type:
|
8468 |
-
|
8469 |
-
config: default
|
8470 |
name: MTEB TwitterSemEval2015 (default)
|
8471 |
-
revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
|
8472 |
-
split: test
|
8473 |
type: mteb/twittersemeval2015-pairclassification
|
|
|
|
|
|
|
8474 |
metrics:
|
8475 |
- type: cosine_accuracy
|
8476 |
value: 87.96566728258925
|
@@ -8554,14 +8556,14 @@ model-index:
|
|
8554 |
value: 68.30357142857143
|
8555 |
- type: similarity_recall
|
8556 |
value: 76.7018469656992
|
8557 |
-
|
8558 |
type: PairClassification
|
8559 |
-
|
8560 |
-
config: default
|
8561 |
name: MTEB TwitterURLCorpus (default)
|
8562 |
-
revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
|
8563 |
-
split: test
|
8564 |
type: mteb/twitterurlcorpus-pairclassification
|
|
|
|
|
|
|
8565 |
metrics:
|
8566 |
- type: cosine_accuracy
|
8567 |
value: 89.48073116777273
|
@@ -8645,6 +8647,4 @@ model-index:
|
|
8645 |
value: 75.27245137260311
|
8646 |
- type: similarity_recall
|
8647 |
value: 84.02371419772098
|
8648 |
-
task:
|
8649 |
-
type: PairClassification
|
8650 |
---
|
|
|
9 |
model-index:
|
10 |
- name: Gouzi3618/LENS-8000
|
11 |
results:
|
12 |
+
- task:
|
13 |
+
type: Classification
|
14 |
+
dataset:
|
15 |
name: MTEB AmazonCounterfactualClassification (en)
|
|
|
|
|
16 |
type: mteb/amazon_counterfactual
|
17 |
+
config: en
|
18 |
+
split: test
|
19 |
+
revision: e8379541af4e31359cca9fbcf4b00f2671dba205
|
20 |
metrics:
|
21 |
- type: accuracy
|
22 |
value: 93.6865671641791
|
|
|
30 |
value: 93.87207694461506
|
31 |
- type: main_score
|
32 |
value: 93.6865671641791
|
33 |
+
- task:
|
34 |
type: Classification
|
35 |
+
dataset:
|
|
|
36 |
name: MTEB AmazonPolarityClassification (default)
|
|
|
|
|
37 |
type: mteb/amazon_polarity
|
38 |
+
config: default
|
39 |
+
split: test
|
40 |
+
revision: e2d317d38cd51312af73b3d32a06d1a08b442046
|
41 |
metrics:
|
42 |
- type: accuracy
|
43 |
value: 97.06832499999999
|
|
|
51 |
value: 97.06781792337515
|
52 |
- type: main_score
|
53 |
value: 97.06832499999999
|
54 |
+
- task:
|
55 |
type: Classification
|
56 |
+
dataset:
|
|
|
57 |
name: MTEB AmazonReviewsClassification (en)
|
|
|
|
|
58 |
type: mteb/amazon_reviews_multi
|
59 |
+
config: en
|
60 |
+
split: test
|
61 |
+
revision: 1399c76144fd37290681b995c656ef9b2e06e26d
|
62 |
metrics:
|
63 |
- type: accuracy
|
64 |
value: 63.608
|
|
|
68 |
value: 62.41274991021244
|
69 |
- type: main_score
|
70 |
value: 63.608
|
71 |
+
- task:
|
72 |
+
type: Retrieval
|
73 |
+
dataset:
|
|
|
74 |
name: MTEB ArguAna (default)
|
|
|
|
|
75 |
type: mteb/arguana
|
76 |
+
config: default
|
77 |
+
split: test
|
78 |
+
revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
|
79 |
metrics:
|
80 |
- type: main_score
|
81 |
value: 76.019
|
|
|
359 |
value: 81.57900000000001
|
360 |
- type: recall_at_5
|
361 |
value: 89.403
|
362 |
+
- task:
|
363 |
+
type: Clustering
|
364 |
+
dataset:
|
|
|
365 |
name: MTEB ArxivClusteringP2P (default)
|
|
|
|
|
366 |
type: mteb/arxiv-clustering-p2p
|
367 |
+
config: default
|
368 |
+
split: test
|
369 |
+
revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
|
370 |
metrics:
|
371 |
- type: main_score
|
372 |
value: 54.809064728970625
|
|
|
374 |
value: 54.809064728970625
|
375 |
- type: v_measure_std
|
376 |
value: 14.497861425102215
|
377 |
+
- task:
|
378 |
type: Clustering
|
379 |
+
dataset:
|
|
|
380 |
name: MTEB ArxivClusteringS2S (default)
|
|
|
|
|
381 |
type: mteb/arxiv-clustering-s2s
|
382 |
+
config: default
|
383 |
+
split: test
|
384 |
+
revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
|
385 |
metrics:
|
386 |
- type: main_score
|
387 |
value: 50.144159631474416
|
|
|
389 |
value: 50.144159631474416
|
390 |
- type: v_measure_std
|
391 |
value: 14.596959041091187
|
392 |
+
- task:
|
393 |
+
type: Reranking
|
394 |
+
dataset:
|
|
|
395 |
name: MTEB AskUbuntuDupQuestions (default)
|
|
|
|
|
396 |
type: mteb/askubuntudupquestions-reranking
|
397 |
+
config: default
|
398 |
+
split: test
|
399 |
+
revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
|
400 |
metrics:
|
401 |
- type: main_score
|
402 |
value: 65.74396432331054
|
|
|
416 |
value: 34.51981156443003
|
417 |
- type: nAUC_mrr_std
|
418 |
value: 28.863440464092747
|
419 |
+
- task:
|
420 |
+
type: STS
|
421 |
+
dataset:
|
|
|
422 |
name: MTEB BIOSSES (default)
|
|
|
|
|
423 |
type: mteb/biosses-sts
|
424 |
+
config: default
|
425 |
+
split: test
|
426 |
+
revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
|
427 |
metrics:
|
428 |
- type: cosine_pearson
|
429 |
value: 86.59612727828603
|
|
|
443 |
value: 86.59612727828603
|
444 |
- type: spearman
|
445 |
value: 85.83087137728063
|
446 |
+
- task:
|
447 |
+
type: Classification
|
448 |
+
dataset:
|
|
|
449 |
name: MTEB Banking77Classification (default)
|
|
|
|
|
450 |
type: mteb/banking77
|
451 |
+
config: default
|
452 |
+
split: test
|
453 |
+
revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
|
454 |
metrics:
|
455 |
- type: accuracy
|
456 |
value: 90.19155844155846
|
|
|
460 |
value: 90.05716678902826
|
461 |
- type: main_score
|
462 |
value: 90.19155844155846
|
463 |
+
- task:
|
464 |
+
type: Clustering
|
465 |
+
dataset:
|
|
|
466 |
name: MTEB BiorxivClusteringP2P (default)
|
|
|
|
|
467 |
type: mteb/biorxiv-clustering-p2p
|
468 |
+
config: default
|
469 |
+
split: test
|
470 |
+
revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
|
471 |
metrics:
|
472 |
- type: main_score
|
473 |
value: 52.480294793961924
|
|
|
475 |
value: 52.480294793961924
|
476 |
- type: v_measure_std
|
477 |
value: 0.5558452294416437
|
478 |
+
- task:
|
479 |
type: Clustering
|
480 |
+
dataset:
|
|
|
481 |
name: MTEB BiorxivClusteringS2S (default)
|
|
|
|
|
482 |
type: mteb/biorxiv-clustering-s2s
|
483 |
+
config: default
|
484 |
+
split: test
|
485 |
+
revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
|
486 |
metrics:
|
487 |
- type: main_score
|
488 |
value: 48.51901581759115
|
|
|
490 |
value: 48.51901581759115
|
491 |
- type: v_measure_std
|
492 |
value: 1.1094735884191569
|
493 |
+
- task:
|
494 |
+
type: Retrieval
|
495 |
+
dataset:
|
|
|
496 |
name: MTEB CQADupstackAndroidRetrieval (default)
|
|
|
|
|
497 |
type: mteb/cqadupstack-android
|
498 |
+
config: default
|
499 |
+
split: test
|
500 |
+
revision: f46a197baaae43b4f621051089b82a364682dfeb
|
501 |
metrics:
|
502 |
- type: main_score
|
503 |
value: 57.9
|
|
|
781 |
value: 54.764
|
782 |
- type: recall_at_5
|
783 |
value: 62.089000000000006
|
784 |
+
- task:
|
785 |
type: Retrieval
|
786 |
+
dataset:
|
|
|
787 |
name: MTEB CQADupstackEnglishRetrieval (default)
|
|
|
|
|
788 |
type: mteb/cqadupstack-english
|
789 |
+
config: default
|
790 |
+
split: test
|
791 |
+
revision: ad9991cb51e31e31e430383c75ffb2885547b5f0
|
792 |
metrics:
|
793 |
- type: main_score
|
794 |
value: 55.474000000000004
|
|
|
1072 |
value: 53.36300000000001
|
1073 |
- type: recall_at_5
|
1074 |
value: 58.987
|
1075 |
+
- task:
|
1076 |
type: Retrieval
|
1077 |
+
dataset:
|
|
|
1078 |
name: MTEB CQADupstackGamingRetrieval (default)
|
|
|
|
|
1079 |
type: mteb/cqadupstack-gaming
|
1080 |
+
config: default
|
1081 |
+
split: test
|
1082 |
+
revision: 4885aa143210c98657558c04aaf3dc47cfb54340
|
1083 |
metrics:
|
1084 |
- type: main_score
|
1085 |
value: 65.236
|
|
|
1363 |
value: 65.359
|
1364 |
- type: recall_at_5
|
1365 |
value: 71.439
|
1366 |
+
- task:
|
1367 |
type: Retrieval
|
1368 |
+
dataset:
|
|
|
1369 |
name: MTEB CQADupstackGisRetrieval (default)
|
|
|
|
|
1370 |
type: mteb/cqadupstack-gis
|
1371 |
+
config: default
|
1372 |
+
split: test
|
1373 |
+
revision: 5003b3064772da1887988e05400cf3806fe491f2
|
1374 |
metrics:
|
1375 |
- type: main_score
|
1376 |
value: 43.736999999999995
|
|
|
1654 |
value: 42.295
|
1655 |
- type: recall_at_5
|
1656 |
value: 49.275999999999996
|
1657 |
+
- task:
|
1658 |
type: Retrieval
|
1659 |
+
dataset:
|
|
|
1660 |
name: MTEB CQADupstackMathematicaRetrieval (default)
|
|
|
|
|
1661 |
type: mteb/cqadupstack-mathematica
|
1662 |
+
config: default
|
1663 |
+
split: test
|
1664 |
+
revision: 90fceea13679c63fe563ded68f3b6f06e50061de
|
1665 |
metrics:
|
1666 |
- type: main_score
|
1667 |
value: 38.766
|
|
|
1945 |
value: 36.278
|
1946 |
- type: recall_at_5
|
1947 |
value: 43.38
|
1948 |
+
- task:
|
1949 |
type: Retrieval
|
1950 |
+
dataset:
|
|
|
1951 |
name: MTEB CQADupstackPhysicsRetrieval (default)
|
|
|
|
|
1952 |
type: mteb/cqadupstack-physics
|
1953 |
+
config: default
|
1954 |
+
split: test
|
1955 |
+
revision: 79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4
|
1956 |
metrics:
|
1957 |
- type: main_score
|
1958 |
value: 53.893
|
|
|
2236 |
value: 52.5
|
2237 |
- type: recall_at_5
|
2238 |
value: 59.489000000000004
|
2239 |
+
- task:
|
2240 |
type: Retrieval
|
2241 |
+
dataset:
|
|
|
2242 |
name: MTEB CQADupstackProgrammersRetrieval (default)
|
|
|
|
|
2243 |
type: mteb/cqadupstack-programmers
|
2244 |
+
config: default
|
2245 |
+
split: test
|
2246 |
+
revision: 6184bc1440d2dbc7612be22b50686b8826d22b32
|
2247 |
metrics:
|
2248 |
- type: main_score
|
2249 |
value: 51.151
|
|
|
2527 |
value: 48.254000000000005
|
2528 |
- type: recall_at_5
|
2529 |
value: 55.595000000000006
|
2530 |
+
- task:
|
2531 |
type: Retrieval
|
2532 |
+
dataset:
|
|
|
2533 |
name: MTEB CQADupstackRetrieval (default)
|
|
|
|
|
2534 |
type: CQADupstackRetrieval_is_a_combined_dataset
|
2535 |
+
config: default
|
2536 |
+
split: test
|
2537 |
+
revision: CQADupstackRetrieval_is_a_combined_dataset
|
2538 |
metrics:
|
2539 |
- type: main_score
|
2540 |
value: 48.669000000000004
|
2541 |
- type: ndcg_at_10
|
2542 |
value: 48.669000000000004
|
2543 |
+
- task:
|
2544 |
type: Retrieval
|
2545 |
+
dataset:
|
|
|
2546 |
name: MTEB CQADupstackStatsRetrieval (default)
|
|
|
|
|
2547 |
type: mteb/cqadupstack-stats
|
2548 |
+
config: default
|
2549 |
+
split: test
|
2550 |
+
revision: 65ac3a16b8e91f9cee4c9828cc7c335575432a2a
|
2551 |
metrics:
|
2552 |
- type: main_score
|
2553 |
value: 41.521
|
|
|
2831 |
value: 40.373
|
2832 |
- type: recall_at_5
|
2833 |
value: 46.421
|
2834 |
+
- task:
|
2835 |
type: Retrieval
|
2836 |
+
dataset:
|
|
|
2837 |
name: MTEB CQADupstackTexRetrieval (default)
|
|
|
|
|
2838 |
type: mteb/cqadupstack-tex
|
2839 |
+
config: default
|
2840 |
+
split: test
|
2841 |
+
revision: 46989137a86843e03a6195de44b09deda022eec7
|
2842 |
metrics:
|
2843 |
- type: main_score
|
2844 |
value: 37.183
|
|
|
3122 |
value: 35.522999999999996
|
3123 |
- type: recall_at_5
|
3124 |
value: 41.746
|
3125 |
+
- task:
|
3126 |
type: Retrieval
|
3127 |
+
dataset:
|
|
|
3128 |
name: MTEB CQADupstackUnixRetrieval (default)
|
|
|
|
|
3129 |
type: mteb/cqadupstack-unix
|
3130 |
+
config: default
|
3131 |
+
split: test
|
3132 |
+
revision: 6c6430d3a6d36f8d2a829195bc5dc94d7e063e53
|
3133 |
metrics:
|
3134 |
- type: main_score
|
3135 |
value: 51.396
|
|
|
3413 |
value: 49.833
|
3414 |
- type: recall_at_5
|
3415 |
value: 55.145999999999994
|
3416 |
+
- task:
|
3417 |
type: Retrieval
|
3418 |
+
dataset:
|
|
|
3419 |
name: MTEB CQADupstackWebmastersRetrieval (default)
|
|
|
|
|
3420 |
type: mteb/cqadupstack-webmasters
|
3421 |
+
config: default
|
3422 |
+
split: test
|
3423 |
+
revision: 160c094312a0e1facb97e55eeddb698c0abe3571
|
3424 |
metrics:
|
3425 |
- type: main_score
|
3426 |
value: 48.229
|
|
|
3704 |
value: 45.072
|
3705 |
- type: recall_at_5
|
3706 |
value: 52.993
|
3707 |
+
- task:
|
3708 |
type: Retrieval
|
3709 |
+
dataset:
|
|
|
3710 |
name: MTEB CQADupstackWordpressRetrieval (default)
|
|
|
|
|
3711 |
type: mteb/cqadupstack-wordpress
|
3712 |
+
config: default
|
3713 |
+
split: test
|
3714 |
+
revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
|
3715 |
metrics:
|
3716 |
- type: main_score
|
3717 |
value: 39.542
|
|
|
3995 |
value: 38.29
|
3996 |
- type: recall_at_5
|
3997 |
value: 43.817
|
3998 |
+
- task:
|
3999 |
type: Retrieval
|
4000 |
+
dataset:
|
|
|
4001 |
name: MTEB ClimateFEVER (default)
|
|
|
|
|
4002 |
type: mteb/climate-fever
|
4003 |
+
config: default
|
4004 |
+
split: test
|
4005 |
+
revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
|
4006 |
metrics:
|
4007 |
- type: main_score
|
4008 |
value: 45.765
|
|
|
4286 |
value: 34.846
|
4287 |
- type: recall_at_5
|
4288 |
value: 43.504
|
4289 |
+
- task:
|
4290 |
type: Retrieval
|
4291 |
+
dataset:
|
|
|
4292 |
name: MTEB DBPedia (default)
|
|
|
|
|
4293 |
type: mteb/dbpedia
|
4294 |
+
config: default
|
4295 |
+
split: test
|
4296 |
+
revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
|
4297 |
metrics:
|
4298 |
- type: main_score
|
4299 |
value: 49.747
|
|
|
4577 |
value: 17.218
|
4578 |
- type: recall_at_5
|
4579 |
value: 21.275
|
4580 |
+
- task:
|
4581 |
+
type: Classification
|
4582 |
+
dataset:
|
|
|
4583 |
name: MTEB EmotionClassification (default)
|
|
|
|
|
4584 |
type: mteb/emotion
|
4585 |
+
config: default
|
4586 |
+
split: test
|
4587 |
+
revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
|
4588 |
metrics:
|
4589 |
- type: accuracy
|
4590 |
value: 91.86500000000001
|
|
|
4594 |
value: 92.0659899919408
|
4595 |
- type: main_score
|
4596 |
value: 91.86500000000001
|
4597 |
+
- task:
|
4598 |
+
type: Retrieval
|
4599 |
+
dataset:
|
|
|
4600 |
name: MTEB FEVER (default)
|
|
|
|
|
4601 |
type: mteb/fever
|
4602 |
+
config: default
|
4603 |
+
split: test
|
4604 |
+
revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
|
4605 |
metrics:
|
4606 |
- type: main_score
|
4607 |
value: 92.324
|
|
|
4885 |
value: 93.806
|
4886 |
- type: recall_at_5
|
4887 |
value: 95.36
|
4888 |
+
- task:
|
4889 |
type: Retrieval
|
4890 |
+
dataset:
|
|
|
4891 |
name: MTEB FiQA2018 (default)
|
|
|
|
|
4892 |
type: mteb/fiqa
|
4893 |
+
config: default
|
4894 |
+
split: test
|
4895 |
+
revision: 27a168819829fe9bcd655c2df245fb19452e8e06
|
4896 |
metrics:
|
4897 |
- type: main_score
|
4898 |
value: 61.565999999999995
|
|
|
5176 |
value: 51.782
|
5177 |
- type: recall_at_5
|
5178 |
value: 59.911
|
5179 |
+
- task:
|
5180 |
type: Retrieval
|
5181 |
+
dataset:
|
|
|
5182 |
name: MTEB HotpotQA (default)
|
|
|
|
|
5183 |
type: mteb/hotpotqa
|
5184 |
+
config: default
|
5185 |
+
split: test
|
5186 |
+
revision: ab518f4d6fcca38d87c25209f94beba119d02014
|
5187 |
metrics:
|
5188 |
- type: main_score
|
5189 |
value: 85.71
|
|
|
5467 |
value: 80.891
|
5468 |
- type: recall_at_5
|
5469 |
value: 85.307
|
5470 |
+
- task:
|
5471 |
+
type: Classification
|
5472 |
+
dataset:
|
|
|
5473 |
name: MTEB ImdbClassification (default)
|
|
|
|
|
5474 |
type: mteb/imdb
|
5475 |
+
config: default
|
5476 |
+
split: test
|
5477 |
+
revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
|
5478 |
metrics:
|
5479 |
- type: accuracy
|
5480 |
value: 96.9972
|
|
|
5488 |
value: 96.99685931130435
|
5489 |
- type: main_score
|
5490 |
value: 96.9972
|
5491 |
+
- task:
|
5492 |
+
type: Retrieval
|
5493 |
+
dataset:
|
|
|
5494 |
name: MTEB MSMARCO (default)
|
|
|
|
|
5495 |
type: mteb/msmarco
|
5496 |
+
config: default
|
5497 |
+
split: dev
|
5498 |
+
revision: c5a29a104738b98a9e76336939199e264163d4a0
|
5499 |
metrics:
|
5500 |
- type: main_score
|
5501 |
value: 47.238
|
|
|
5779 |
value: 47.714
|
5780 |
- type: recall_at_5
|
5781 |
value: 57.913000000000004
|
5782 |
+
- task:
|
5783 |
+
type: Classification
|
5784 |
+
dataset:
|
|
|
5785 |
name: MTEB MTOPDomainClassification (en)
|
|
|
|
|
5786 |
type: mteb/mtop_domain
|
5787 |
+
config: en
|
5788 |
+
split: test
|
5789 |
+
revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
|
5790 |
metrics:
|
5791 |
- type: accuracy
|
5792 |
value: 97.43502051983585
|
|
|
5796 |
value: 97.44797640554678
|
5797 |
- type: main_score
|
5798 |
value: 97.43502051983585
|
5799 |
+
- task:
|
5800 |
type: Classification
|
5801 |
+
dataset:
|
|
|
5802 |
name: MTEB MTOPIntentClassification (en)
|
|
|
|
|
5803 |
type: mteb/mtop_intent
|
5804 |
+
config: en
|
5805 |
+
split: test
|
5806 |
+
revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
|
5807 |
metrics:
|
5808 |
- type: accuracy
|
5809 |
value: 92.80665754673961
|
|
|
5813 |
value: 93.45063761064331
|
5814 |
- type: main_score
|
5815 |
value: 92.80665754673961
|
5816 |
+
- task:
|
5817 |
type: Classification
|
5818 |
+
dataset:
|
|
|
5819 |
name: MTEB MassiveIntentClassification (en)
|
|
|
|
|
5820 |
type: mteb/amazon_massive_intent
|
5821 |
+
config: en
|
5822 |
+
split: test
|
5823 |
+
revision: 4672e20407010da34463acc759c162ca9734bca6
|
5824 |
metrics:
|
5825 |
- type: accuracy
|
5826 |
value: 81.14324142568931
|
|
|
5830 |
value: 80.06102282439677
|
5831 |
- type: main_score
|
5832 |
value: 81.14324142568931
|
5833 |
+
- task:
|
5834 |
type: Classification
|
5835 |
+
dataset:
|
|
|
5836 |
name: MTEB MassiveScenarioClassification (en)
|
|
|
|
|
5837 |
type: mteb/amazon_massive_scenario
|
5838 |
+
config: en
|
5839 |
+
split: test
|
5840 |
+
revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
|
5841 |
metrics:
|
5842 |
- type: accuracy
|
5843 |
value: 83.52723604572965
|
|
|
5847 |
value: 83.18340208761732
|
5848 |
- type: main_score
|
5849 |
value: 83.52723604572965
|
5850 |
+
- task:
|
5851 |
+
type: Clustering
|
5852 |
+
dataset:
|
|
|
5853 |
name: MTEB MedrxivClusteringP2P (default)
|
|
|
|
|
5854 |
type: mteb/medrxiv-clustering-p2p
|
5855 |
+
config: default
|
5856 |
+
split: test
|
5857 |
+
revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
|
5858 |
metrics:
|
5859 |
- type: main_score
|
5860 |
value: 46.38149873605036
|
|
|
5862 |
value: 46.38149873605036
|
5863 |
- type: v_measure_std
|
5864 |
value: 1.0749788856434186
|
5865 |
+
- task:
|
5866 |
type: Clustering
|
5867 |
+
dataset:
|
|
|
5868 |
name: MTEB MedrxivClusteringS2S (default)
|
|
|
|
|
5869 |
type: mteb/medrxiv-clustering-s2s
|
5870 |
+
config: default
|
5871 |
+
split: test
|
5872 |
+
revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
|
5873 |
metrics:
|
5874 |
- type: main_score
|
5875 |
value: 44.8945524407664
|
|
|
5877 |
value: 44.8945524407664
|
5878 |
- type: v_measure_std
|
5879 |
value: 1.2389193370528488
|
5880 |
+
- task:
|
5881 |
+
type: Reranking
|
5882 |
+
dataset:
|
|
|
5883 |
name: MTEB MindSmallReranking (default)
|
|
|
|
|
5884 |
type: mteb/mind_small
|
5885 |
+
config: default
|
5886 |
+
split: test
|
5887 |
+
revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
|
5888 |
metrics:
|
5889 |
- type: main_score
|
5890 |
value: 31.464871623418794
|
|
|
5904 |
value: -19.359704641723024
|
5905 |
- type: nAUC_mrr_std
|
5906 |
value: 0.2553333974009825
|
5907 |
+
- task:
|
5908 |
+
type: Retrieval
|
5909 |
+
dataset:
|
|
|
5910 |
name: MTEB NFCorpus (default)
|
|
|
|
|
5911 |
type: mteb/nfcorpus
|
5912 |
+
config: default
|
5913 |
+
split: test
|
5914 |
+
revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
|
5915 |
metrics:
|
5916 |
- type: main_score
|
5917 |
value: 40.608
|
|
|
6195 |
value: 12.592999999999998
|
6196 |
- type: recall_at_5
|
6197 |
value: 15.847
|
6198 |
+
- task:
|
6199 |
type: Retrieval
|
6200 |
+
dataset:
|
|
|
6201 |
name: MTEB NQ (default)
|
|
|
|
|
6202 |
type: mteb/nq
|
6203 |
+
config: default
|
6204 |
+
split: test
|
6205 |
+
revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
|
6206 |
metrics:
|
6207 |
- type: main_score
|
6208 |
value: 74.639
|
|
|
6486 |
value: 76.32
|
6487 |
- type: recall_at_5
|
6488 |
value: 83.992
|
6489 |
+
- task:
|
6490 |
type: Retrieval
|
6491 |
+
dataset:
|
|
|
6492 |
name: MTEB QuoraRetrieval (default)
|
|
|
|
|
6493 |
type: mteb/quora
|
6494 |
+
config: default
|
6495 |
+
split: test
|
6496 |
+
revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
|
6497 |
metrics:
|
6498 |
- type: main_score
|
6499 |
value: 90.78500000000001
|
|
|
6777 |
value: 89.85499999999999
|
6778 |
- type: recall_at_5
|
6779 |
value: 93.758
|
6780 |
+
- task:
|
6781 |
+
type: Clustering
|
6782 |
+
dataset:
|
|
|
6783 |
name: MTEB RedditClustering (default)
|
|
|
|
|
6784 |
type: mteb/reddit-clustering
|
6785 |
+
config: default
|
6786 |
+
split: test
|
6787 |
+
revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
|
6788 |
metrics:
|
6789 |
- type: main_score
|
6790 |
value: 72.36527124460562
|
|
|
6792 |
value: 72.36527124460562
|
6793 |
- type: v_measure_std
|
6794 |
value: 2.7778891945364195
|
6795 |
+
- task:
|
6796 |
type: Clustering
|
6797 |
+
dataset:
|
|
|
6798 |
name: MTEB RedditClusteringP2P (default)
|
|
|
|
|
6799 |
type: mteb/reddit-clustering-p2p
|
6800 |
+
config: default
|
6801 |
+
split: test
|
6802 |
+
revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
|
6803 |
metrics:
|
6804 |
- type: main_score
|
6805 |
value: 73.89142551084535
|
|
|
6807 |
value: 73.89142551084535
|
6808 |
- type: v_measure_std
|
6809 |
value: 11.258242813412751
|
6810 |
+
- task:
|
6811 |
+
type: Retrieval
|
6812 |
+
dataset:
|
|
|
6813 |
name: MTEB SCIDOCS (default)
|
|
|
|
|
6814 |
type: mteb/scidocs
|
6815 |
+
config: default
|
6816 |
+
split: test
|
6817 |
+
revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
|
6818 |
metrics:
|
6819 |
- type: main_score
|
6820 |
value: 28.538000000000004
|
|
|
7098 |
value: 15.573
|
7099 |
- type: recall_at_5
|
7100 |
value: 20.948
|
7101 |
+
- task:
|
7102 |
+
type: STS
|
7103 |
+
dataset:
|
|
|
7104 |
name: MTEB SICK-R (default)
|
|
|
|
|
7105 |
type: mteb/sickr-sts
|
7106 |
+
config: default
|
7107 |
+
split: test
|
7108 |
+
revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
|
7109 |
metrics:
|
7110 |
- type: cosine_pearson
|
7111 |
value: 84.37281363343187
|
|
|
7125 |
value: 84.37281363343187
|
7126 |
- type: spearman
|
7127 |
value: 83.30200195593044
|
7128 |
+
- task:
|
7129 |
type: STS
|
7130 |
+
dataset:
|
|
|
7131 |
name: MTEB STS12 (default)
|
|
|
|
|
7132 |
type: mteb/sts12-sts
|
7133 |
+
config: default
|
7134 |
+
split: test
|
7135 |
+
revision: a0d554a64d88156834ff5ae9920b964011b16384
|
7136 |
metrics:
|
7137 |
- type: cosine_pearson
|
7138 |
value: 86.82824905521925
|
|
|
7152 |
value: 86.82824905521925
|
7153 |
- type: spearman
|
7154 |
value: 80.98590815911939
|
7155 |
+
- task:
|
7156 |
type: STS
|
7157 |
+
dataset:
|
|
|
7158 |
name: MTEB STS13 (default)
|
|
|
|
|
7159 |
type: mteb/sts13-sts
|
7160 |
+
config: default
|
7161 |
+
split: test
|
7162 |
+
revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
|
7163 |
metrics:
|
7164 |
- type: cosine_pearson
|
7165 |
value: 87.19722316157294
|
|
|
7179 |
value: 87.19722316157294
|
7180 |
- type: spearman
|
7181 |
value: 87.34287142701457
|
7182 |
+
- task:
|
7183 |
type: STS
|
7184 |
+
dataset:
|
|
|
7185 |
name: MTEB STS14 (default)
|
|
|
|
|
7186 |
type: mteb/sts14-sts
|
7187 |
+
config: default
|
7188 |
+
split: test
|
7189 |
+
revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
|
7190 |
metrics:
|
7191 |
- type: cosine_pearson
|
7192 |
value: 84.82646675904164
|
|
|
7206 |
value: 84.82646675904164
|
7207 |
- type: spearman
|
7208 |
value: 84.38843815801556
|
7209 |
+
- task:
|
7210 |
type: STS
|
7211 |
+
dataset:
|
|
|
7212 |
name: MTEB STS15 (default)
|
|
|
|
|
7213 |
type: mteb/sts15-sts
|
7214 |
+
config: default
|
7215 |
+
split: test
|
7216 |
+
revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
|
7217 |
metrics:
|
7218 |
- type: cosine_pearson
|
7219 |
value: 89.69909533656704
|
|
|
7233 |
value: 89.69909533656704
|
7234 |
- type: spearman
|
7235 |
value: 89.74723322749233
|
7236 |
+
- task:
|
7237 |
type: STS
|
7238 |
+
dataset:
|
|
|
7239 |
name: MTEB STS16 (default)
|
|
|
|
|
7240 |
type: mteb/sts16-sts
|
7241 |
+
config: default
|
7242 |
+
split: test
|
7243 |
+
revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
|
7244 |
metrics:
|
7245 |
- type: cosine_pearson
|
7246 |
value: 86.84947603401746
|
|
|
7260 |
value: 86.84947603401746
|
7261 |
- type: spearman
|
7262 |
value: 87.63022743056388
|
7263 |
+
- task:
|
7264 |
type: STS
|
7265 |
+
dataset:
|
|
|
7266 |
name: MTEB STS17 (en-en)
|
|
|
|
|
7267 |
type: mteb/sts17-crosslingual-sts
|
7268 |
+
config: en-en
|
7269 |
+
split: test
|
7270 |
+
revision: faeb762787bd10488a50c8b5be4a3b82e411949c
|
7271 |
metrics:
|
7272 |
- type: cosine_pearson
|
7273 |
value: 91.43391567649913
|
|
|
7287 |
value: 91.43391567649913
|
7288 |
- type: spearman
|
7289 |
value: 90.86953801008369
|
7290 |
+
- task:
|
7291 |
type: STS
|
7292 |
+
dataset:
|
|
|
7293 |
name: MTEB STS22 (en)
|
|
|
|
|
7294 |
type: mteb/sts22-crosslingual-sts
|
7295 |
+
config: en
|
7296 |
+
split: test
|
7297 |
+
revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
|
7298 |
metrics:
|
7299 |
- type: cosine_pearson
|
7300 |
value: 68.81338409687908
|
|
|
7314 |
value: 68.81338409687908
|
7315 |
- type: spearman
|
7316 |
value: 68.09215270009086
|
7317 |
+
- task:
|
7318 |
type: STS
|
7319 |
+
dataset:
|
|
|
7320 |
name: MTEB STSBenchmark (default)
|
|
|
|
|
7321 |
type: mteb/stsbenchmark-sts
|
7322 |
+
config: default
|
7323 |
+
split: test
|
7324 |
+
revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
|
7325 |
metrics:
|
7326 |
- type: cosine_pearson
|
7327 |
value: 87.93191595794555
|
|
|
7341 |
value: 87.93191595794555
|
7342 |
- type: spearman
|
7343 |
value: 88.46646307403641
|
7344 |
+
- task:
|
7345 |
+
type: Reranking
|
7346 |
+
dataset:
|
|
|
7347 |
name: MTEB SciDocsRR (default)
|
|
|
|
|
7348 |
type: mteb/scidocs-reranking
|
7349 |
+
config: default
|
7350 |
+
split: test
|
7351 |
+
revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
|
7352 |
metrics:
|
7353 |
- type: main_score
|
7354 |
value: 87.62672056519489
|
|
|
7368 |
value: 82.4844792677926
|
7369 |
- type: nAUC_mrr_std
|
7370 |
value: 82.0357865297397
|
7371 |
+
- task:
|
7372 |
+
type: Retrieval
|
7373 |
+
dataset:
|
|
|
7374 |
name: MTEB SciFact (default)
|
|
|
|
|
7375 |
type: mteb/scifact
|
7376 |
+
config: default
|
7377 |
+
split: test
|
7378 |
+
revision: 0228b52cf27578f30900b9e5271d331663a030d7
|
7379 |
metrics:
|
7380 |
- type: main_score
|
7381 |
value: 79.745
|
|
|
7659 |
value: 81.072
|
7660 |
- type: recall_at_5
|
7661 |
value: 87.339
|
7662 |
+
- task:
|
7663 |
+
type: PairClassification
|
7664 |
+
dataset:
|
|
|
7665 |
name: MTEB SprintDuplicateQuestions (default)
|
|
|
|
|
7666 |
type: mteb/sprintduplicatequestions-pairclassification
|
7667 |
+
config: default
|
7668 |
+
split: test
|
7669 |
+
revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
|
7670 |
metrics:
|
7671 |
- type: cosine_accuracy
|
7672 |
value: 99.86039603960396
|
|
|
7750 |
value: 93.69277721261444
|
7751 |
- type: similarity_recall
|
7752 |
value: 92.10000000000001
|
7753 |
+
- task:
|
7754 |
+
type: Clustering
|
7755 |
+
dataset:
|
|
|
7756 |
name: MTEB StackExchangeClustering (default)
|
|
|
|
|
7757 |
type: mteb/stackexchange-clustering
|
7758 |
+
config: default
|
7759 |
+
split: test
|
7760 |
+
revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
|
7761 |
metrics:
|
7762 |
- type: main_score
|
7763 |
value: 81.5950420419382
|
|
|
7765 |
value: 81.5950420419382
|
7766 |
- type: v_measure_std
|
7767 |
value: 2.3518861207789126
|
7768 |
+
- task:
|
7769 |
type: Clustering
|
7770 |
+
dataset:
|
|
|
7771 |
name: MTEB StackExchangeClusteringP2P (default)
|
|
|
|
|
7772 |
type: mteb/stackexchange-clustering-p2p
|
7773 |
+
config: default
|
7774 |
+
split: test
|
7775 |
+
revision: 815ca46b2622cec33ccafc3735d572c266efdb44
|
7776 |
metrics:
|
7777 |
- type: main_score
|
7778 |
value: 44.40836435329055
|
|
|
7780 |
value: 44.40836435329055
|
7781 |
- type: v_measure_std
|
7782 |
value: 1.3850659888959282
|
7783 |
+
- task:
|
7784 |
+
type: Reranking
|
7785 |
+
dataset:
|
|
|
7786 |
name: MTEB StackOverflowDupQuestions (default)
|
|
|
|
|
7787 |
type: mteb/stackoverflowdupquestions-reranking
|
7788 |
+
config: default
|
7789 |
+
split: test
|
7790 |
+
revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
|
7791 |
metrics:
|
7792 |
- type: main_score
|
7793 |
value: 58.792345747482436
|
|
|
7807 |
value: 14.587424770057197
|
7808 |
- type: nAUC_mrr_std
|
7809 |
value: 6.683981115477786
|
7810 |
+
- task:
|
7811 |
+
type: Summarization
|
7812 |
+
dataset:
|
|
|
7813 |
name: MTEB SummEval (default)
|
|
|
|
|
7814 |
type: mteb/summeval
|
7815 |
+
config: default
|
7816 |
+
split: test
|
7817 |
+
revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
|
7818 |
metrics:
|
7819 |
- type: cosine_pearson
|
7820 |
value: 29.605378173647523
|
|
|
7830 |
value: 29.605378173647523
|
7831 |
- type: spearman
|
7832 |
value: 29.538937618105475
|
7833 |
+
- task:
|
7834 |
+
type: Retrieval
|
7835 |
+
dataset:
|
|
|
7836 |
name: MTEB TRECCOVID (default)
|
|
|
|
|
7837 |
type: mteb/trec-covid
|
7838 |
+
config: default
|
7839 |
+
split: test
|
7840 |
+
revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
|
7841 |
metrics:
|
7842 |
- type: main_score
|
7843 |
value: 77.17500000000001
|
|
|
8121 |
value: 0.677
|
8122 |
- type: recall_at_5
|
8123 |
value: 1.087
|
8124 |
+
- task:
|
8125 |
type: Retrieval
|
8126 |
+
dataset:
|
|
|
8127 |
name: MTEB Touche2020 (default)
|
|
|
|
|
8128 |
type: mteb/touche2020
|
8129 |
+
config: default
|
8130 |
+
split: test
|
8131 |
+
revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
|
8132 |
metrics:
|
8133 |
- type: main_score
|
8134 |
value: 29.343000000000004
|
|
|
8412 |
value: 7.868
|
8413 |
- type: recall_at_5
|
8414 |
value: 11.413
|
8415 |
+
- task:
|
8416 |
+
type: Classification
|
8417 |
+
dataset:
|
|
|
8418 |
name: MTEB ToxicConversationsClassification (default)
|
|
|
|
|
8419 |
type: mteb/toxic_conversations_50k
|
8420 |
+
config: default
|
8421 |
+
split: test
|
8422 |
+
revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
|
8423 |
metrics:
|
8424 |
- type: accuracy
|
8425 |
value: 92.3681640625
|
|
|
8433 |
value: 93.14474638528736
|
8434 |
- type: main_score
|
8435 |
value: 92.3681640625
|
8436 |
+
- task:
|
8437 |
type: Classification
|
8438 |
+
dataset:
|
|
|
8439 |
name: MTEB TweetSentimentExtractionClassification (default)
|
|
|
|
|
8440 |
type: mteb/tweet_sentiment_extraction
|
8441 |
+
config: default
|
8442 |
+
split: test
|
8443 |
+
revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
|
8444 |
metrics:
|
8445 |
- type: accuracy
|
8446 |
value: 80.42161856253539
|
|
|
8450 |
value: 80.3228654725881
|
8451 |
- type: main_score
|
8452 |
value: 80.42161856253539
|
8453 |
+
- task:
|
8454 |
+
type: Clustering
|
8455 |
+
dataset:
|
|
|
8456 |
name: MTEB TwentyNewsgroupsClustering (default)
|
|
|
|
|
8457 |
type: mteb/twentynewsgroups-clustering
|
8458 |
+
config: default
|
8459 |
+
split: test
|
8460 |
+
revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
|
8461 |
metrics:
|
8462 |
- type: main_score
|
8463 |
value: 68.78385330772423
|
|
|
8465 |
value: 68.78385330772423
|
8466 |
- type: v_measure_std
|
8467 |
value: 1.4814035017480702
|
8468 |
+
- task:
|
8469 |
+
type: PairClassification
|
8470 |
+
dataset:
|
|
|
8471 |
name: MTEB TwitterSemEval2015 (default)
|
|
|
|
|
8472 |
type: mteb/twittersemeval2015-pairclassification
|
8473 |
+
config: default
|
8474 |
+
split: test
|
8475 |
+
revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
|
8476 |
metrics:
|
8477 |
- type: cosine_accuracy
|
8478 |
value: 87.96566728258925
|
|
|
8556 |
value: 68.30357142857143
|
8557 |
- type: similarity_recall
|
8558 |
value: 76.7018469656992
|
8559 |
+
- task:
|
8560 |
type: PairClassification
|
8561 |
+
dataset:
|
|
|
8562 |
name: MTEB TwitterURLCorpus (default)
|
|
|
|
|
8563 |
type: mteb/twitterurlcorpus-pairclassification
|
8564 |
+
config: default
|
8565 |
+
split: test
|
8566 |
+
revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
|
8567 |
metrics:
|
8568 |
- type: cosine_accuracy
|
8569 |
value: 89.48073116777273
|
|
|
8647 |
value: 75.27245137260311
|
8648 |
- type: similarity_recall
|
8649 |
value: 84.02371419772098
|
|
|
|
|
8650 |
---
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/projects/0/prjs0835/ACL25/reps-llm-2/huggingface_models/wrap_model/model_lens_8000",
|
3 |
+
"architectures": [
|
4 |
+
"MistralModel"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 1,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"head_dim": 128,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 4096,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 14336,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "mistral",
|
16 |
+
"num_attention_heads": 32,
|
17 |
+
"num_hidden_layers": 32,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"rms_norm_eps": 1e-05,
|
20 |
+
"rope_theta": 10000.0,
|
21 |
+
"sliding_window": 4096,
|
22 |
+
"tie_word_embeddings": false,
|
23 |
+
"torch_dtype": "float32",
|
24 |
+
"transformers_version": "4.43.1",
|
25 |
+
"use_cache": false,
|
26 |
+
"vocab_size": 32003
|
27 |
+
}
|
model-00001-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bb494b856d59521f7aa3f85d267047c8bb0989e3ef3877164d090a1b73c5250
|
3 |
+
size 4987245800
|
model-00002-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db48eac273441e1ce91b8df5df3da14cb995b37b2384c414ac2944a55530aec2
|
3 |
+
size 4899116152
|
model-00003-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62b83abd1fa64fbc428083bef0cfbb1f67e49c1d83c12aa36350df787ef32907
|
3 |
+
size 4999812808
|
model-00004-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa05808ae834fa506c16f96e60264363947fe64b9978bdc2a796333866561852
|
3 |
+
size 4999812808
|
model-00005-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01441d94a31f225bff2a4a1c3a18030697ab14cd34a24d66dab290203a150309
|
3 |
+
size 4832007216
|
model-00006-of-00006.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4044180ffe3a641d301ef30b9d7c26f8fddc1a915f509579e9710d30b5a1e51f
|
3 |
+
size 3724726552
|
model.safetensors.index.json
ADDED
@@ -0,0 +1,297 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"metadata": {
|
3 |
+
"total_size": 28442689536
|
4 |
+
},
|
5 |
+
"weight_map": {
|
6 |
+
"embed_tokens.weight": "model-00001-of-00006.safetensors",
|
7 |
+
"layers.0.input_layernorm.weight": "model-00001-of-00006.safetensors",
|
8 |
+
"layers.0.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
|
9 |
+
"layers.0.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
|
10 |
+
"layers.0.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
|
11 |
+
"layers.0.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
|
12 |
+
"layers.0.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
|
13 |
+
"layers.0.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
|
14 |
+
"layers.0.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
|
15 |
+
"layers.0.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
|
16 |
+
"layers.1.input_layernorm.weight": "model-00001-of-00006.safetensors",
|
17 |
+
"layers.1.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
|
18 |
+
"layers.1.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
|
19 |
+
"layers.1.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
|
20 |
+
"layers.1.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
|
21 |
+
"layers.1.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
|
22 |
+
"layers.1.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
|
23 |
+
"layers.1.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
|
24 |
+
"layers.1.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
|
25 |
+
"layers.10.input_layernorm.weight": "model-00003-of-00006.safetensors",
|
26 |
+
"layers.10.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
|
27 |
+
"layers.10.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
|
28 |
+
"layers.10.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
|
29 |
+
"layers.10.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
|
30 |
+
"layers.10.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
|
31 |
+
"layers.10.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
|
32 |
+
"layers.10.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
|
33 |
+
"layers.10.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
|
34 |
+
"layers.11.input_layernorm.weight": "model-00003-of-00006.safetensors",
|
35 |
+
"layers.11.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
|
36 |
+
"layers.11.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
|
37 |
+
"layers.11.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
|
38 |
+
"layers.11.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
|
39 |
+
"layers.11.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
|
40 |
+
"layers.11.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
|
41 |
+
"layers.11.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
|
42 |
+
"layers.11.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
|
43 |
+
"layers.12.input_layernorm.weight": "model-00003-of-00006.safetensors",
|
44 |
+
"layers.12.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
|
45 |
+
"layers.12.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
|
46 |
+
"layers.12.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
|
47 |
+
"layers.12.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
|
48 |
+
"layers.12.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
|
49 |
+
"layers.12.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
|
50 |
+
"layers.12.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
|
51 |
+
"layers.12.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
|
52 |
+
"layers.13.input_layernorm.weight": "model-00003-of-00006.safetensors",
|
53 |
+
"layers.13.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
|
54 |
+
"layers.13.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
|
55 |
+
"layers.13.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
|
56 |
+
"layers.13.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
|
57 |
+
"layers.13.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
|
58 |
+
"layers.13.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
|
59 |
+
"layers.13.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
|
60 |
+
"layers.13.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
|
61 |
+
"layers.14.input_layernorm.weight": "model-00003-of-00006.safetensors",
|
62 |
+
"layers.14.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
|
63 |
+
"layers.14.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
|
64 |
+
"layers.14.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
|
65 |
+
"layers.14.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
|
66 |
+
"layers.14.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
|
67 |
+
"layers.14.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
|
68 |
+
"layers.14.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
|
69 |
+
"layers.14.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
|
70 |
+
"layers.15.input_layernorm.weight": "model-00003-of-00006.safetensors",
|
71 |
+
"layers.15.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
|
72 |
+
"layers.15.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
|
73 |
+
"layers.15.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
|
74 |
+
"layers.15.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
|
75 |
+
"layers.15.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
|
76 |
+
"layers.15.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
|
77 |
+
"layers.15.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
|
78 |
+
"layers.15.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
|
79 |
+
"layers.16.input_layernorm.weight": "model-00004-of-00006.safetensors",
|
80 |
+
"layers.16.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
|
81 |
+
"layers.16.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
|
82 |
+
"layers.16.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
|
83 |
+
"layers.16.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
|
84 |
+
"layers.16.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
|
85 |
+
"layers.16.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
|
86 |
+
"layers.16.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
|
87 |
+
"layers.16.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
|
88 |
+
"layers.17.input_layernorm.weight": "model-00004-of-00006.safetensors",
|
89 |
+
"layers.17.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
|
90 |
+
"layers.17.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
|
91 |
+
"layers.17.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
|
92 |
+
"layers.17.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
|
93 |
+
"layers.17.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
|
94 |
+
"layers.17.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
|
95 |
+
"layers.17.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
|
96 |
+
"layers.17.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
|
97 |
+
"layers.18.input_layernorm.weight": "model-00004-of-00006.safetensors",
|
98 |
+
"layers.18.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
|
99 |
+
"layers.18.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
|
100 |
+
"layers.18.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
|
101 |
+
"layers.18.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
|
102 |
+
"layers.18.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
|
103 |
+
"layers.18.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
|
104 |
+
"layers.18.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
|
105 |
+
"layers.18.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
|
106 |
+
"layers.19.input_layernorm.weight": "model-00004-of-00006.safetensors",
|
107 |
+
"layers.19.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
|
108 |
+
"layers.19.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
|
109 |
+
"layers.19.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
|
110 |
+
"layers.19.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
|
111 |
+
"layers.19.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
|
112 |
+
"layers.19.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
|
113 |
+
"layers.19.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
|
114 |
+
"layers.19.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
|
115 |
+
"layers.2.input_layernorm.weight": "model-00001-of-00006.safetensors",
|
116 |
+
"layers.2.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
|
117 |
+
"layers.2.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
|
118 |
+
"layers.2.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
|
119 |
+
"layers.2.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
|
120 |
+
"layers.2.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
|
121 |
+
"layers.2.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
|
122 |
+
"layers.2.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
|
123 |
+
"layers.2.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
|
124 |
+
"layers.20.input_layernorm.weight": "model-00004-of-00006.safetensors",
|
125 |
+
"layers.20.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
|
126 |
+
"layers.20.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
|
127 |
+
"layers.20.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
|
128 |
+
"layers.20.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
|
129 |
+
"layers.20.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
|
130 |
+
"layers.20.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
|
131 |
+
"layers.20.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
|
132 |
+
"layers.20.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
|
133 |
+
"layers.21.input_layernorm.weight": "model-00004-of-00006.safetensors",
|
134 |
+
"layers.21.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
|
135 |
+
"layers.21.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
|
136 |
+
"layers.21.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
|
137 |
+
"layers.21.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
|
138 |
+
"layers.21.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
|
139 |
+
"layers.21.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
|
140 |
+
"layers.21.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
|
141 |
+
"layers.21.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
|
142 |
+
"layers.22.input_layernorm.weight": "model-00005-of-00006.safetensors",
|
143 |
+
"layers.22.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
|
144 |
+
"layers.22.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
|
145 |
+
"layers.22.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
|
146 |
+
"layers.22.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
|
147 |
+
"layers.22.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
|
148 |
+
"layers.22.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
|
149 |
+
"layers.22.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
|
150 |
+
"layers.22.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
|
151 |
+
"layers.23.input_layernorm.weight": "model-00005-of-00006.safetensors",
|
152 |
+
"layers.23.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
|
153 |
+
"layers.23.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
|
154 |
+
"layers.23.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
|
155 |
+
"layers.23.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
|
156 |
+
"layers.23.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
|
157 |
+
"layers.23.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
|
158 |
+
"layers.23.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
|
159 |
+
"layers.23.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
|
160 |
+
"layers.24.input_layernorm.weight": "model-00005-of-00006.safetensors",
|
161 |
+
"layers.24.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
|
162 |
+
"layers.24.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
|
163 |
+
"layers.24.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
|
164 |
+
"layers.24.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
|
165 |
+
"layers.24.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
|
166 |
+
"layers.24.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
|
167 |
+
"layers.24.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
|
168 |
+
"layers.24.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
|
169 |
+
"layers.25.input_layernorm.weight": "model-00005-of-00006.safetensors",
|
170 |
+
"layers.25.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
|
171 |
+
"layers.25.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
|
172 |
+
"layers.25.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
|
173 |
+
"layers.25.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
|
174 |
+
"layers.25.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
|
175 |
+
"layers.25.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
|
176 |
+
"layers.25.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
|
177 |
+
"layers.25.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
|
178 |
+
"layers.26.input_layernorm.weight": "model-00005-of-00006.safetensors",
|
179 |
+
"layers.26.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
|
180 |
+
"layers.26.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
|
181 |
+
"layers.26.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
|
182 |
+
"layers.26.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
|
183 |
+
"layers.26.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
|
184 |
+
"layers.26.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
|
185 |
+
"layers.26.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
|
186 |
+
"layers.26.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
|
187 |
+
"layers.27.input_layernorm.weight": "model-00006-of-00006.safetensors",
|
188 |
+
"layers.27.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
|
189 |
+
"layers.27.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
|
190 |
+
"layers.27.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
|
191 |
+
"layers.27.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
|
192 |
+
"layers.27.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
|
193 |
+
"layers.27.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
|
194 |
+
"layers.27.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
|
195 |
+
"layers.27.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
|
196 |
+
"layers.28.input_layernorm.weight": "model-00006-of-00006.safetensors",
|
197 |
+
"layers.28.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
|
198 |
+
"layers.28.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
|
199 |
+
"layers.28.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
|
200 |
+
"layers.28.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
|
201 |
+
"layers.28.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
|
202 |
+
"layers.28.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
|
203 |
+
"layers.28.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
|
204 |
+
"layers.28.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
|
205 |
+
"layers.29.input_layernorm.weight": "model-00006-of-00006.safetensors",
|
206 |
+
"layers.29.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
|
207 |
+
"layers.29.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
|
208 |
+
"layers.29.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
|
209 |
+
"layers.29.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
|
210 |
+
"layers.29.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
|
211 |
+
"layers.29.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
|
212 |
+
"layers.29.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
|
213 |
+
"layers.29.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
|
214 |
+
"layers.3.input_layernorm.weight": "model-00001-of-00006.safetensors",
|
215 |
+
"layers.3.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
|
216 |
+
"layers.3.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
|
217 |
+
"layers.3.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
|
218 |
+
"layers.3.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
|
219 |
+
"layers.3.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
|
220 |
+
"layers.3.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
|
221 |
+
"layers.3.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
|
222 |
+
"layers.3.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
|
223 |
+
"layers.30.input_layernorm.weight": "model-00006-of-00006.safetensors",
|
224 |
+
"layers.30.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
|
225 |
+
"layers.30.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
|
226 |
+
"layers.30.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
|
227 |
+
"layers.30.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
|
228 |
+
"layers.30.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
|
229 |
+
"layers.30.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
|
230 |
+
"layers.30.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
|
231 |
+
"layers.30.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
|
232 |
+
"layers.31.input_layernorm.weight": "model-00006-of-00006.safetensors",
|
233 |
+
"layers.31.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
|
234 |
+
"layers.31.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
|
235 |
+
"layers.31.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
|
236 |
+
"layers.31.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
|
237 |
+
"layers.31.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
|
238 |
+
"layers.31.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
|
239 |
+
"layers.31.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
|
240 |
+
"layers.31.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
|
241 |
+
"layers.4.input_layernorm.weight": "model-00001-of-00006.safetensors",
|
242 |
+
"layers.4.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
|
243 |
+
"layers.4.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
|
244 |
+
"layers.4.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
|
245 |
+
"layers.4.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
|
246 |
+
"layers.4.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
|
247 |
+
"layers.4.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
|
248 |
+
"layers.4.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
|
249 |
+
"layers.4.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
|
250 |
+
"layers.5.input_layernorm.weight": "model-00002-of-00006.safetensors",
|
251 |
+
"layers.5.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
|
252 |
+
"layers.5.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
|
253 |
+
"layers.5.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
|
254 |
+
"layers.5.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
|
255 |
+
"layers.5.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
|
256 |
+
"layers.5.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
|
257 |
+
"layers.5.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
|
258 |
+
"layers.5.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
|
259 |
+
"layers.6.input_layernorm.weight": "model-00002-of-00006.safetensors",
|
260 |
+
"layers.6.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
|
261 |
+
"layers.6.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
|
262 |
+
"layers.6.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
|
263 |
+
"layers.6.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
|
264 |
+
"layers.6.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
|
265 |
+
"layers.6.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
|
266 |
+
"layers.6.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
|
267 |
+
"layers.6.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
|
268 |
+
"layers.7.input_layernorm.weight": "model-00002-of-00006.safetensors",
|
269 |
+
"layers.7.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
|
270 |
+
"layers.7.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
|
271 |
+
"layers.7.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
|
272 |
+
"layers.7.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
|
273 |
+
"layers.7.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
|
274 |
+
"layers.7.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
|
275 |
+
"layers.7.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
|
276 |
+
"layers.7.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
|
277 |
+
"layers.8.input_layernorm.weight": "model-00002-of-00006.safetensors",
|
278 |
+
"layers.8.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
|
279 |
+
"layers.8.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
|
280 |
+
"layers.8.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
|
281 |
+
"layers.8.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
|
282 |
+
"layers.8.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
|
283 |
+
"layers.8.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
|
284 |
+
"layers.8.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
|
285 |
+
"layers.8.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
|
286 |
+
"layers.9.input_layernorm.weight": "model-00002-of-00006.safetensors",
|
287 |
+
"layers.9.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
|
288 |
+
"layers.9.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
|
289 |
+
"layers.9.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
|
290 |
+
"layers.9.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
|
291 |
+
"layers.9.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
|
292 |
+
"layers.9.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
|
293 |
+
"layers.9.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
|
294 |
+
"layers.9.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
|
295 |
+
"norm.weight": "model-00006-of-00006.safetensors"
|
296 |
+
}
|
297 |
+
}
|