yibinlei commited on
Commit
5082cf3
·
verified ·
1 Parent(s): 2aa2856

Upload model

Browse files
README.md CHANGED
@@ -9,12 +9,14 @@ tags:
9
  model-index:
10
  - name: Gouzi3618/LENS-8000
11
  results:
12
- - dataset:
13
- config: en
 
14
  name: MTEB AmazonCounterfactualClassification (en)
15
- revision: e8379541af4e31359cca9fbcf4b00f2671dba205
16
- split: test
17
  type: mteb/amazon_counterfactual
 
 
 
18
  metrics:
19
  - type: accuracy
20
  value: 93.6865671641791
@@ -28,14 +30,14 @@ model-index:
28
  value: 93.87207694461506
29
  - type: main_score
30
  value: 93.6865671641791
31
- task:
32
  type: Classification
33
- - dataset:
34
- config: default
35
  name: MTEB AmazonPolarityClassification (default)
36
- revision: e2d317d38cd51312af73b3d32a06d1a08b442046
37
- split: test
38
  type: mteb/amazon_polarity
 
 
 
39
  metrics:
40
  - type: accuracy
41
  value: 97.06832499999999
@@ -49,14 +51,14 @@ model-index:
49
  value: 97.06781792337515
50
  - type: main_score
51
  value: 97.06832499999999
52
- task:
53
  type: Classification
54
- - dataset:
55
- config: en
56
  name: MTEB AmazonReviewsClassification (en)
57
- revision: 1399c76144fd37290681b995c656ef9b2e06e26d
58
- split: test
59
  type: mteb/amazon_reviews_multi
 
 
 
60
  metrics:
61
  - type: accuracy
62
  value: 63.608
@@ -66,14 +68,14 @@ model-index:
66
  value: 62.41274991021244
67
  - type: main_score
68
  value: 63.608
69
- task:
70
- type: Classification
71
- - dataset:
72
- config: default
73
  name: MTEB ArguAna (default)
74
- revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
75
- split: test
76
  type: mteb/arguana
 
 
 
77
  metrics:
78
  - type: main_score
79
  value: 76.019
@@ -357,14 +359,14 @@ model-index:
357
  value: 81.57900000000001
358
  - type: recall_at_5
359
  value: 89.403
360
- task:
361
- type: Retrieval
362
- - dataset:
363
- config: default
364
  name: MTEB ArxivClusteringP2P (default)
365
- revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
366
- split: test
367
  type: mteb/arxiv-clustering-p2p
 
 
 
368
  metrics:
369
  - type: main_score
370
  value: 54.809064728970625
@@ -372,14 +374,14 @@ model-index:
372
  value: 54.809064728970625
373
  - type: v_measure_std
374
  value: 14.497861425102215
375
- task:
376
  type: Clustering
377
- - dataset:
378
- config: default
379
  name: MTEB ArxivClusteringS2S (default)
380
- revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
381
- split: test
382
  type: mteb/arxiv-clustering-s2s
 
 
 
383
  metrics:
384
  - type: main_score
385
  value: 50.144159631474416
@@ -387,14 +389,14 @@ model-index:
387
  value: 50.144159631474416
388
  - type: v_measure_std
389
  value: 14.596959041091187
390
- task:
391
- type: Clustering
392
- - dataset:
393
- config: default
394
  name: MTEB AskUbuntuDupQuestions (default)
395
- revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
396
- split: test
397
  type: mteb/askubuntudupquestions-reranking
 
 
 
398
  metrics:
399
  - type: main_score
400
  value: 65.74396432331054
@@ -414,14 +416,14 @@ model-index:
414
  value: 34.51981156443003
415
  - type: nAUC_mrr_std
416
  value: 28.863440464092747
417
- task:
418
- type: Reranking
419
- - dataset:
420
- config: default
421
  name: MTEB BIOSSES (default)
422
- revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
423
- split: test
424
  type: mteb/biosses-sts
 
 
 
425
  metrics:
426
  - type: cosine_pearson
427
  value: 86.59612727828603
@@ -441,14 +443,14 @@ model-index:
441
  value: 86.59612727828603
442
  - type: spearman
443
  value: 85.83087137728063
444
- task:
445
- type: STS
446
- - dataset:
447
- config: default
448
  name: MTEB Banking77Classification (default)
449
- revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
450
- split: test
451
  type: mteb/banking77
 
 
 
452
  metrics:
453
  - type: accuracy
454
  value: 90.19155844155846
@@ -458,14 +460,14 @@ model-index:
458
  value: 90.05716678902826
459
  - type: main_score
460
  value: 90.19155844155846
461
- task:
462
- type: Classification
463
- - dataset:
464
- config: default
465
  name: MTEB BiorxivClusteringP2P (default)
466
- revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
467
- split: test
468
  type: mteb/biorxiv-clustering-p2p
 
 
 
469
  metrics:
470
  - type: main_score
471
  value: 52.480294793961924
@@ -473,14 +475,14 @@ model-index:
473
  value: 52.480294793961924
474
  - type: v_measure_std
475
  value: 0.5558452294416437
476
- task:
477
  type: Clustering
478
- - dataset:
479
- config: default
480
  name: MTEB BiorxivClusteringS2S (default)
481
- revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
482
- split: test
483
  type: mteb/biorxiv-clustering-s2s
 
 
 
484
  metrics:
485
  - type: main_score
486
  value: 48.51901581759115
@@ -488,14 +490,14 @@ model-index:
488
  value: 48.51901581759115
489
  - type: v_measure_std
490
  value: 1.1094735884191569
491
- task:
492
- type: Clustering
493
- - dataset:
494
- config: default
495
  name: MTEB CQADupstackAndroidRetrieval (default)
496
- revision: f46a197baaae43b4f621051089b82a364682dfeb
497
- split: test
498
  type: mteb/cqadupstack-android
 
 
 
499
  metrics:
500
  - type: main_score
501
  value: 57.9
@@ -779,14 +781,14 @@ model-index:
779
  value: 54.764
780
  - type: recall_at_5
781
  value: 62.089000000000006
782
- task:
783
  type: Retrieval
784
- - dataset:
785
- config: default
786
  name: MTEB CQADupstackEnglishRetrieval (default)
787
- revision: ad9991cb51e31e31e430383c75ffb2885547b5f0
788
- split: test
789
  type: mteb/cqadupstack-english
 
 
 
790
  metrics:
791
  - type: main_score
792
  value: 55.474000000000004
@@ -1070,14 +1072,14 @@ model-index:
1070
  value: 53.36300000000001
1071
  - type: recall_at_5
1072
  value: 58.987
1073
- task:
1074
  type: Retrieval
1075
- - dataset:
1076
- config: default
1077
  name: MTEB CQADupstackGamingRetrieval (default)
1078
- revision: 4885aa143210c98657558c04aaf3dc47cfb54340
1079
- split: test
1080
  type: mteb/cqadupstack-gaming
 
 
 
1081
  metrics:
1082
  - type: main_score
1083
  value: 65.236
@@ -1361,14 +1363,14 @@ model-index:
1361
  value: 65.359
1362
  - type: recall_at_5
1363
  value: 71.439
1364
- task:
1365
  type: Retrieval
1366
- - dataset:
1367
- config: default
1368
  name: MTEB CQADupstackGisRetrieval (default)
1369
- revision: 5003b3064772da1887988e05400cf3806fe491f2
1370
- split: test
1371
  type: mteb/cqadupstack-gis
 
 
 
1372
  metrics:
1373
  - type: main_score
1374
  value: 43.736999999999995
@@ -1652,14 +1654,14 @@ model-index:
1652
  value: 42.295
1653
  - type: recall_at_5
1654
  value: 49.275999999999996
1655
- task:
1656
  type: Retrieval
1657
- - dataset:
1658
- config: default
1659
  name: MTEB CQADupstackMathematicaRetrieval (default)
1660
- revision: 90fceea13679c63fe563ded68f3b6f06e50061de
1661
- split: test
1662
  type: mteb/cqadupstack-mathematica
 
 
 
1663
  metrics:
1664
  - type: main_score
1665
  value: 38.766
@@ -1943,14 +1945,14 @@ model-index:
1943
  value: 36.278
1944
  - type: recall_at_5
1945
  value: 43.38
1946
- task:
1947
  type: Retrieval
1948
- - dataset:
1949
- config: default
1950
  name: MTEB CQADupstackPhysicsRetrieval (default)
1951
- revision: 79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4
1952
- split: test
1953
  type: mteb/cqadupstack-physics
 
 
 
1954
  metrics:
1955
  - type: main_score
1956
  value: 53.893
@@ -2234,14 +2236,14 @@ model-index:
2234
  value: 52.5
2235
  - type: recall_at_5
2236
  value: 59.489000000000004
2237
- task:
2238
  type: Retrieval
2239
- - dataset:
2240
- config: default
2241
  name: MTEB CQADupstackProgrammersRetrieval (default)
2242
- revision: 6184bc1440d2dbc7612be22b50686b8826d22b32
2243
- split: test
2244
  type: mteb/cqadupstack-programmers
 
 
 
2245
  metrics:
2246
  - type: main_score
2247
  value: 51.151
@@ -2525,27 +2527,27 @@ model-index:
2525
  value: 48.254000000000005
2526
  - type: recall_at_5
2527
  value: 55.595000000000006
2528
- task:
2529
  type: Retrieval
2530
- - dataset:
2531
- config: default
2532
  name: MTEB CQADupstackRetrieval (default)
2533
- revision: CQADupstackRetrieval_is_a_combined_dataset
2534
- split: test
2535
  type: CQADupstackRetrieval_is_a_combined_dataset
 
 
 
2536
  metrics:
2537
  - type: main_score
2538
  value: 48.669000000000004
2539
  - type: ndcg_at_10
2540
  value: 48.669000000000004
2541
- task:
2542
  type: Retrieval
2543
- - dataset:
2544
- config: default
2545
  name: MTEB CQADupstackStatsRetrieval (default)
2546
- revision: 65ac3a16b8e91f9cee4c9828cc7c335575432a2a
2547
- split: test
2548
  type: mteb/cqadupstack-stats
 
 
 
2549
  metrics:
2550
  - type: main_score
2551
  value: 41.521
@@ -2829,14 +2831,14 @@ model-index:
2829
  value: 40.373
2830
  - type: recall_at_5
2831
  value: 46.421
2832
- task:
2833
  type: Retrieval
2834
- - dataset:
2835
- config: default
2836
  name: MTEB CQADupstackTexRetrieval (default)
2837
- revision: 46989137a86843e03a6195de44b09deda022eec7
2838
- split: test
2839
  type: mteb/cqadupstack-tex
 
 
 
2840
  metrics:
2841
  - type: main_score
2842
  value: 37.183
@@ -3120,14 +3122,14 @@ model-index:
3120
  value: 35.522999999999996
3121
  - type: recall_at_5
3122
  value: 41.746
3123
- task:
3124
  type: Retrieval
3125
- - dataset:
3126
- config: default
3127
  name: MTEB CQADupstackUnixRetrieval (default)
3128
- revision: 6c6430d3a6d36f8d2a829195bc5dc94d7e063e53
3129
- split: test
3130
  type: mteb/cqadupstack-unix
 
 
 
3131
  metrics:
3132
  - type: main_score
3133
  value: 51.396
@@ -3411,14 +3413,14 @@ model-index:
3411
  value: 49.833
3412
  - type: recall_at_5
3413
  value: 55.145999999999994
3414
- task:
3415
  type: Retrieval
3416
- - dataset:
3417
- config: default
3418
  name: MTEB CQADupstackWebmastersRetrieval (default)
3419
- revision: 160c094312a0e1facb97e55eeddb698c0abe3571
3420
- split: test
3421
  type: mteb/cqadupstack-webmasters
 
 
 
3422
  metrics:
3423
  - type: main_score
3424
  value: 48.229
@@ -3702,14 +3704,14 @@ model-index:
3702
  value: 45.072
3703
  - type: recall_at_5
3704
  value: 52.993
3705
- task:
3706
  type: Retrieval
3707
- - dataset:
3708
- config: default
3709
  name: MTEB CQADupstackWordpressRetrieval (default)
3710
- revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
3711
- split: test
3712
  type: mteb/cqadupstack-wordpress
 
 
 
3713
  metrics:
3714
  - type: main_score
3715
  value: 39.542
@@ -3993,14 +3995,14 @@ model-index:
3993
  value: 38.29
3994
  - type: recall_at_5
3995
  value: 43.817
3996
- task:
3997
  type: Retrieval
3998
- - dataset:
3999
- config: default
4000
  name: MTEB ClimateFEVER (default)
4001
- revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
4002
- split: test
4003
  type: mteb/climate-fever
 
 
 
4004
  metrics:
4005
  - type: main_score
4006
  value: 45.765
@@ -4284,14 +4286,14 @@ model-index:
4284
  value: 34.846
4285
  - type: recall_at_5
4286
  value: 43.504
4287
- task:
4288
  type: Retrieval
4289
- - dataset:
4290
- config: default
4291
  name: MTEB DBPedia (default)
4292
- revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
4293
- split: test
4294
  type: mteb/dbpedia
 
 
 
4295
  metrics:
4296
  - type: main_score
4297
  value: 49.747
@@ -4575,14 +4577,14 @@ model-index:
4575
  value: 17.218
4576
  - type: recall_at_5
4577
  value: 21.275
4578
- task:
4579
- type: Retrieval
4580
- - dataset:
4581
- config: default
4582
  name: MTEB EmotionClassification (default)
4583
- revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
4584
- split: test
4585
  type: mteb/emotion
 
 
 
4586
  metrics:
4587
  - type: accuracy
4588
  value: 91.86500000000001
@@ -4592,14 +4594,14 @@ model-index:
4592
  value: 92.0659899919408
4593
  - type: main_score
4594
  value: 91.86500000000001
4595
- task:
4596
- type: Classification
4597
- - dataset:
4598
- config: default
4599
  name: MTEB FEVER (default)
4600
- revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
4601
- split: test
4602
  type: mteb/fever
 
 
 
4603
  metrics:
4604
  - type: main_score
4605
  value: 92.324
@@ -4883,14 +4885,14 @@ model-index:
4883
  value: 93.806
4884
  - type: recall_at_5
4885
  value: 95.36
4886
- task:
4887
  type: Retrieval
4888
- - dataset:
4889
- config: default
4890
  name: MTEB FiQA2018 (default)
4891
- revision: 27a168819829fe9bcd655c2df245fb19452e8e06
4892
- split: test
4893
  type: mteb/fiqa
 
 
 
4894
  metrics:
4895
  - type: main_score
4896
  value: 61.565999999999995
@@ -5174,14 +5176,14 @@ model-index:
5174
  value: 51.782
5175
  - type: recall_at_5
5176
  value: 59.911
5177
- task:
5178
  type: Retrieval
5179
- - dataset:
5180
- config: default
5181
  name: MTEB HotpotQA (default)
5182
- revision: ab518f4d6fcca38d87c25209f94beba119d02014
5183
- split: test
5184
  type: mteb/hotpotqa
 
 
 
5185
  metrics:
5186
  - type: main_score
5187
  value: 85.71
@@ -5465,14 +5467,14 @@ model-index:
5465
  value: 80.891
5466
  - type: recall_at_5
5467
  value: 85.307
5468
- task:
5469
- type: Retrieval
5470
- - dataset:
5471
- config: default
5472
  name: MTEB ImdbClassification (default)
5473
- revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
5474
- split: test
5475
  type: mteb/imdb
 
 
 
5476
  metrics:
5477
  - type: accuracy
5478
  value: 96.9972
@@ -5486,14 +5488,14 @@ model-index:
5486
  value: 96.99685931130435
5487
  - type: main_score
5488
  value: 96.9972
5489
- task:
5490
- type: Classification
5491
- - dataset:
5492
- config: default
5493
  name: MTEB MSMARCO (default)
5494
- revision: c5a29a104738b98a9e76336939199e264163d4a0
5495
- split: dev
5496
  type: mteb/msmarco
 
 
 
5497
  metrics:
5498
  - type: main_score
5499
  value: 47.238
@@ -5777,14 +5779,14 @@ model-index:
5777
  value: 47.714
5778
  - type: recall_at_5
5779
  value: 57.913000000000004
5780
- task:
5781
- type: Retrieval
5782
- - dataset:
5783
- config: en
5784
  name: MTEB MTOPDomainClassification (en)
5785
- revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
5786
- split: test
5787
  type: mteb/mtop_domain
 
 
 
5788
  metrics:
5789
  - type: accuracy
5790
  value: 97.43502051983585
@@ -5794,14 +5796,14 @@ model-index:
5794
  value: 97.44797640554678
5795
  - type: main_score
5796
  value: 97.43502051983585
5797
- task:
5798
  type: Classification
5799
- - dataset:
5800
- config: en
5801
  name: MTEB MTOPIntentClassification (en)
5802
- revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
5803
- split: test
5804
  type: mteb/mtop_intent
 
 
 
5805
  metrics:
5806
  - type: accuracy
5807
  value: 92.80665754673961
@@ -5811,14 +5813,14 @@ model-index:
5811
  value: 93.45063761064331
5812
  - type: main_score
5813
  value: 92.80665754673961
5814
- task:
5815
  type: Classification
5816
- - dataset:
5817
- config: en
5818
  name: MTEB MassiveIntentClassification (en)
5819
- revision: 4672e20407010da34463acc759c162ca9734bca6
5820
- split: test
5821
  type: mteb/amazon_massive_intent
 
 
 
5822
  metrics:
5823
  - type: accuracy
5824
  value: 81.14324142568931
@@ -5828,14 +5830,14 @@ model-index:
5828
  value: 80.06102282439677
5829
  - type: main_score
5830
  value: 81.14324142568931
5831
- task:
5832
  type: Classification
5833
- - dataset:
5834
- config: en
5835
  name: MTEB MassiveScenarioClassification (en)
5836
- revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
5837
- split: test
5838
  type: mteb/amazon_massive_scenario
 
 
 
5839
  metrics:
5840
  - type: accuracy
5841
  value: 83.52723604572965
@@ -5845,14 +5847,14 @@ model-index:
5845
  value: 83.18340208761732
5846
  - type: main_score
5847
  value: 83.52723604572965
5848
- task:
5849
- type: Classification
5850
- - dataset:
5851
- config: default
5852
  name: MTEB MedrxivClusteringP2P (default)
5853
- revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
5854
- split: test
5855
  type: mteb/medrxiv-clustering-p2p
 
 
 
5856
  metrics:
5857
  - type: main_score
5858
  value: 46.38149873605036
@@ -5860,14 +5862,14 @@ model-index:
5860
  value: 46.38149873605036
5861
  - type: v_measure_std
5862
  value: 1.0749788856434186
5863
- task:
5864
  type: Clustering
5865
- - dataset:
5866
- config: default
5867
  name: MTEB MedrxivClusteringS2S (default)
5868
- revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
5869
- split: test
5870
  type: mteb/medrxiv-clustering-s2s
 
 
 
5871
  metrics:
5872
  - type: main_score
5873
  value: 44.8945524407664
@@ -5875,14 +5877,14 @@ model-index:
5875
  value: 44.8945524407664
5876
  - type: v_measure_std
5877
  value: 1.2389193370528488
5878
- task:
5879
- type: Clustering
5880
- - dataset:
5881
- config: default
5882
  name: MTEB MindSmallReranking (default)
5883
- revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
5884
- split: test
5885
  type: mteb/mind_small
 
 
 
5886
  metrics:
5887
  - type: main_score
5888
  value: 31.464871623418794
@@ -5902,14 +5904,14 @@ model-index:
5902
  value: -19.359704641723024
5903
  - type: nAUC_mrr_std
5904
  value: 0.2553333974009825
5905
- task:
5906
- type: Reranking
5907
- - dataset:
5908
- config: default
5909
  name: MTEB NFCorpus (default)
5910
- revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
5911
- split: test
5912
  type: mteb/nfcorpus
 
 
 
5913
  metrics:
5914
  - type: main_score
5915
  value: 40.608
@@ -6193,14 +6195,14 @@ model-index:
6193
  value: 12.592999999999998
6194
  - type: recall_at_5
6195
  value: 15.847
6196
- task:
6197
  type: Retrieval
6198
- - dataset:
6199
- config: default
6200
  name: MTEB NQ (default)
6201
- revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
6202
- split: test
6203
  type: mteb/nq
 
 
 
6204
  metrics:
6205
  - type: main_score
6206
  value: 74.639
@@ -6484,14 +6486,14 @@ model-index:
6484
  value: 76.32
6485
  - type: recall_at_5
6486
  value: 83.992
6487
- task:
6488
  type: Retrieval
6489
- - dataset:
6490
- config: default
6491
  name: MTEB QuoraRetrieval (default)
6492
- revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
6493
- split: test
6494
  type: mteb/quora
 
 
 
6495
  metrics:
6496
  - type: main_score
6497
  value: 90.78500000000001
@@ -6775,14 +6777,14 @@ model-index:
6775
  value: 89.85499999999999
6776
  - type: recall_at_5
6777
  value: 93.758
6778
- task:
6779
- type: Retrieval
6780
- - dataset:
6781
- config: default
6782
  name: MTEB RedditClustering (default)
6783
- revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
6784
- split: test
6785
  type: mteb/reddit-clustering
 
 
 
6786
  metrics:
6787
  - type: main_score
6788
  value: 72.36527124460562
@@ -6790,14 +6792,14 @@ model-index:
6790
  value: 72.36527124460562
6791
  - type: v_measure_std
6792
  value: 2.7778891945364195
6793
- task:
6794
  type: Clustering
6795
- - dataset:
6796
- config: default
6797
  name: MTEB RedditClusteringP2P (default)
6798
- revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
6799
- split: test
6800
  type: mteb/reddit-clustering-p2p
 
 
 
6801
  metrics:
6802
  - type: main_score
6803
  value: 73.89142551084535
@@ -6805,14 +6807,14 @@ model-index:
6805
  value: 73.89142551084535
6806
  - type: v_measure_std
6807
  value: 11.258242813412751
6808
- task:
6809
- type: Clustering
6810
- - dataset:
6811
- config: default
6812
  name: MTEB SCIDOCS (default)
6813
- revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
6814
- split: test
6815
  type: mteb/scidocs
 
 
 
6816
  metrics:
6817
  - type: main_score
6818
  value: 28.538000000000004
@@ -7096,14 +7098,14 @@ model-index:
7096
  value: 15.573
7097
  - type: recall_at_5
7098
  value: 20.948
7099
- task:
7100
- type: Retrieval
7101
- - dataset:
7102
- config: default
7103
  name: MTEB SICK-R (default)
7104
- revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
7105
- split: test
7106
  type: mteb/sickr-sts
 
 
 
7107
  metrics:
7108
  - type: cosine_pearson
7109
  value: 84.37281363343187
@@ -7123,14 +7125,14 @@ model-index:
7123
  value: 84.37281363343187
7124
  - type: spearman
7125
  value: 83.30200195593044
7126
- task:
7127
  type: STS
7128
- - dataset:
7129
- config: default
7130
  name: MTEB STS12 (default)
7131
- revision: a0d554a64d88156834ff5ae9920b964011b16384
7132
- split: test
7133
  type: mteb/sts12-sts
 
 
 
7134
  metrics:
7135
  - type: cosine_pearson
7136
  value: 86.82824905521925
@@ -7150,14 +7152,14 @@ model-index:
7150
  value: 86.82824905521925
7151
  - type: spearman
7152
  value: 80.98590815911939
7153
- task:
7154
  type: STS
7155
- - dataset:
7156
- config: default
7157
  name: MTEB STS13 (default)
7158
- revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
7159
- split: test
7160
  type: mteb/sts13-sts
 
 
 
7161
  metrics:
7162
  - type: cosine_pearson
7163
  value: 87.19722316157294
@@ -7177,14 +7179,14 @@ model-index:
7177
  value: 87.19722316157294
7178
  - type: spearman
7179
  value: 87.34287142701457
7180
- task:
7181
  type: STS
7182
- - dataset:
7183
- config: default
7184
  name: MTEB STS14 (default)
7185
- revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
7186
- split: test
7187
  type: mteb/sts14-sts
 
 
 
7188
  metrics:
7189
  - type: cosine_pearson
7190
  value: 84.82646675904164
@@ -7204,14 +7206,14 @@ model-index:
7204
  value: 84.82646675904164
7205
  - type: spearman
7206
  value: 84.38843815801556
7207
- task:
7208
  type: STS
7209
- - dataset:
7210
- config: default
7211
  name: MTEB STS15 (default)
7212
- revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
7213
- split: test
7214
  type: mteb/sts15-sts
 
 
 
7215
  metrics:
7216
  - type: cosine_pearson
7217
  value: 89.69909533656704
@@ -7231,14 +7233,14 @@ model-index:
7231
  value: 89.69909533656704
7232
  - type: spearman
7233
  value: 89.74723322749233
7234
- task:
7235
  type: STS
7236
- - dataset:
7237
- config: default
7238
  name: MTEB STS16 (default)
7239
- revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
7240
- split: test
7241
  type: mteb/sts16-sts
 
 
 
7242
  metrics:
7243
  - type: cosine_pearson
7244
  value: 86.84947603401746
@@ -7258,14 +7260,14 @@ model-index:
7258
  value: 86.84947603401746
7259
  - type: spearman
7260
  value: 87.63022743056388
7261
- task:
7262
  type: STS
7263
- - dataset:
7264
- config: en-en
7265
  name: MTEB STS17 (en-en)
7266
- revision: faeb762787bd10488a50c8b5be4a3b82e411949c
7267
- split: test
7268
  type: mteb/sts17-crosslingual-sts
 
 
 
7269
  metrics:
7270
  - type: cosine_pearson
7271
  value: 91.43391567649913
@@ -7285,14 +7287,14 @@ model-index:
7285
  value: 91.43391567649913
7286
  - type: spearman
7287
  value: 90.86953801008369
7288
- task:
7289
  type: STS
7290
- - dataset:
7291
- config: en
7292
  name: MTEB STS22 (en)
7293
- revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
7294
- split: test
7295
  type: mteb/sts22-crosslingual-sts
 
 
 
7296
  metrics:
7297
  - type: cosine_pearson
7298
  value: 68.81338409687908
@@ -7312,14 +7314,14 @@ model-index:
7312
  value: 68.81338409687908
7313
  - type: spearman
7314
  value: 68.09215270009086
7315
- task:
7316
  type: STS
7317
- - dataset:
7318
- config: default
7319
  name: MTEB STSBenchmark (default)
7320
- revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
7321
- split: test
7322
  type: mteb/stsbenchmark-sts
 
 
 
7323
  metrics:
7324
  - type: cosine_pearson
7325
  value: 87.93191595794555
@@ -7339,14 +7341,14 @@ model-index:
7339
  value: 87.93191595794555
7340
  - type: spearman
7341
  value: 88.46646307403641
7342
- task:
7343
- type: STS
7344
- - dataset:
7345
- config: default
7346
  name: MTEB SciDocsRR (default)
7347
- revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
7348
- split: test
7349
  type: mteb/scidocs-reranking
 
 
 
7350
  metrics:
7351
  - type: main_score
7352
  value: 87.62672056519489
@@ -7366,14 +7368,14 @@ model-index:
7366
  value: 82.4844792677926
7367
  - type: nAUC_mrr_std
7368
  value: 82.0357865297397
7369
- task:
7370
- type: Reranking
7371
- - dataset:
7372
- config: default
7373
  name: MTEB SciFact (default)
7374
- revision: 0228b52cf27578f30900b9e5271d331663a030d7
7375
- split: test
7376
  type: mteb/scifact
 
 
 
7377
  metrics:
7378
  - type: main_score
7379
  value: 79.745
@@ -7657,14 +7659,14 @@ model-index:
7657
  value: 81.072
7658
  - type: recall_at_5
7659
  value: 87.339
7660
- task:
7661
- type: Retrieval
7662
- - dataset:
7663
- config: default
7664
  name: MTEB SprintDuplicateQuestions (default)
7665
- revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
7666
- split: test
7667
  type: mteb/sprintduplicatequestions-pairclassification
 
 
 
7668
  metrics:
7669
  - type: cosine_accuracy
7670
  value: 99.86039603960396
@@ -7748,14 +7750,14 @@ model-index:
7748
  value: 93.69277721261444
7749
  - type: similarity_recall
7750
  value: 92.10000000000001
7751
- task:
7752
- type: PairClassification
7753
- - dataset:
7754
- config: default
7755
  name: MTEB StackExchangeClustering (default)
7756
- revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
7757
- split: test
7758
  type: mteb/stackexchange-clustering
 
 
 
7759
  metrics:
7760
  - type: main_score
7761
  value: 81.5950420419382
@@ -7763,14 +7765,14 @@ model-index:
7763
  value: 81.5950420419382
7764
  - type: v_measure_std
7765
  value: 2.3518861207789126
7766
- task:
7767
  type: Clustering
7768
- - dataset:
7769
- config: default
7770
  name: MTEB StackExchangeClusteringP2P (default)
7771
- revision: 815ca46b2622cec33ccafc3735d572c266efdb44
7772
- split: test
7773
  type: mteb/stackexchange-clustering-p2p
 
 
 
7774
  metrics:
7775
  - type: main_score
7776
  value: 44.40836435329055
@@ -7778,14 +7780,14 @@ model-index:
7778
  value: 44.40836435329055
7779
  - type: v_measure_std
7780
  value: 1.3850659888959282
7781
- task:
7782
- type: Clustering
7783
- - dataset:
7784
- config: default
7785
  name: MTEB StackOverflowDupQuestions (default)
7786
- revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
7787
- split: test
7788
  type: mteb/stackoverflowdupquestions-reranking
 
 
 
7789
  metrics:
7790
  - type: main_score
7791
  value: 58.792345747482436
@@ -7805,14 +7807,14 @@ model-index:
7805
  value: 14.587424770057197
7806
  - type: nAUC_mrr_std
7807
  value: 6.683981115477786
7808
- task:
7809
- type: Reranking
7810
- - dataset:
7811
- config: default
7812
  name: MTEB SummEval (default)
7813
- revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
7814
- split: test
7815
  type: mteb/summeval
 
 
 
7816
  metrics:
7817
  - type: cosine_pearson
7818
  value: 29.605378173647523
@@ -7828,14 +7830,14 @@ model-index:
7828
  value: 29.605378173647523
7829
  - type: spearman
7830
  value: 29.538937618105475
7831
- task:
7832
- type: Summarization
7833
- - dataset:
7834
- config: default
7835
  name: MTEB TRECCOVID (default)
7836
- revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
7837
- split: test
7838
  type: mteb/trec-covid
 
 
 
7839
  metrics:
7840
  - type: main_score
7841
  value: 77.17500000000001
@@ -8119,14 +8121,14 @@ model-index:
8119
  value: 0.677
8120
  - type: recall_at_5
8121
  value: 1.087
8122
- task:
8123
  type: Retrieval
8124
- - dataset:
8125
- config: default
8126
  name: MTEB Touche2020 (default)
8127
- revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
8128
- split: test
8129
  type: mteb/touche2020
 
 
 
8130
  metrics:
8131
  - type: main_score
8132
  value: 29.343000000000004
@@ -8410,14 +8412,14 @@ model-index:
8410
  value: 7.868
8411
  - type: recall_at_5
8412
  value: 11.413
8413
- task:
8414
- type: Retrieval
8415
- - dataset:
8416
- config: default
8417
  name: MTEB ToxicConversationsClassification (default)
8418
- revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
8419
- split: test
8420
  type: mteb/toxic_conversations_50k
 
 
 
8421
  metrics:
8422
  - type: accuracy
8423
  value: 92.3681640625
@@ -8431,14 +8433,14 @@ model-index:
8431
  value: 93.14474638528736
8432
  - type: main_score
8433
  value: 92.3681640625
8434
- task:
8435
  type: Classification
8436
- - dataset:
8437
- config: default
8438
  name: MTEB TweetSentimentExtractionClassification (default)
8439
- revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
8440
- split: test
8441
  type: mteb/tweet_sentiment_extraction
 
 
 
8442
  metrics:
8443
  - type: accuracy
8444
  value: 80.42161856253539
@@ -8448,14 +8450,14 @@ model-index:
8448
  value: 80.3228654725881
8449
  - type: main_score
8450
  value: 80.42161856253539
8451
- task:
8452
- type: Classification
8453
- - dataset:
8454
- config: default
8455
  name: MTEB TwentyNewsgroupsClustering (default)
8456
- revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
8457
- split: test
8458
  type: mteb/twentynewsgroups-clustering
 
 
 
8459
  metrics:
8460
  - type: main_score
8461
  value: 68.78385330772423
@@ -8463,14 +8465,14 @@ model-index:
8463
  value: 68.78385330772423
8464
  - type: v_measure_std
8465
  value: 1.4814035017480702
8466
- task:
8467
- type: Clustering
8468
- - dataset:
8469
- config: default
8470
  name: MTEB TwitterSemEval2015 (default)
8471
- revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
8472
- split: test
8473
  type: mteb/twittersemeval2015-pairclassification
 
 
 
8474
  metrics:
8475
  - type: cosine_accuracy
8476
  value: 87.96566728258925
@@ -8554,14 +8556,14 @@ model-index:
8554
  value: 68.30357142857143
8555
  - type: similarity_recall
8556
  value: 76.7018469656992
8557
- task:
8558
  type: PairClassification
8559
- - dataset:
8560
- config: default
8561
  name: MTEB TwitterURLCorpus (default)
8562
- revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
8563
- split: test
8564
  type: mteb/twitterurlcorpus-pairclassification
 
 
 
8565
  metrics:
8566
  - type: cosine_accuracy
8567
  value: 89.48073116777273
@@ -8645,6 +8647,4 @@ model-index:
8645
  value: 75.27245137260311
8646
  - type: similarity_recall
8647
  value: 84.02371419772098
8648
- task:
8649
- type: PairClassification
8650
  ---
 
9
  model-index:
10
  - name: Gouzi3618/LENS-8000
11
  results:
12
+ - task:
13
+ type: Classification
14
+ dataset:
15
  name: MTEB AmazonCounterfactualClassification (en)
 
 
16
  type: mteb/amazon_counterfactual
17
+ config: en
18
+ split: test
19
+ revision: e8379541af4e31359cca9fbcf4b00f2671dba205
20
  metrics:
21
  - type: accuracy
22
  value: 93.6865671641791
 
30
  value: 93.87207694461506
31
  - type: main_score
32
  value: 93.6865671641791
33
+ - task:
34
  type: Classification
35
+ dataset:
 
36
  name: MTEB AmazonPolarityClassification (default)
 
 
37
  type: mteb/amazon_polarity
38
+ config: default
39
+ split: test
40
+ revision: e2d317d38cd51312af73b3d32a06d1a08b442046
41
  metrics:
42
  - type: accuracy
43
  value: 97.06832499999999
 
51
  value: 97.06781792337515
52
  - type: main_score
53
  value: 97.06832499999999
54
+ - task:
55
  type: Classification
56
+ dataset:
 
57
  name: MTEB AmazonReviewsClassification (en)
 
 
58
  type: mteb/amazon_reviews_multi
59
+ config: en
60
+ split: test
61
+ revision: 1399c76144fd37290681b995c656ef9b2e06e26d
62
  metrics:
63
  - type: accuracy
64
  value: 63.608
 
68
  value: 62.41274991021244
69
  - type: main_score
70
  value: 63.608
71
+ - task:
72
+ type: Retrieval
73
+ dataset:
 
74
  name: MTEB ArguAna (default)
 
 
75
  type: mteb/arguana
76
+ config: default
77
+ split: test
78
+ revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
79
  metrics:
80
  - type: main_score
81
  value: 76.019
 
359
  value: 81.57900000000001
360
  - type: recall_at_5
361
  value: 89.403
362
+ - task:
363
+ type: Clustering
364
+ dataset:
 
365
  name: MTEB ArxivClusteringP2P (default)
 
 
366
  type: mteb/arxiv-clustering-p2p
367
+ config: default
368
+ split: test
369
+ revision: a122ad7f3f0291bf49cc6f4d32aa80929df69d5d
370
  metrics:
371
  - type: main_score
372
  value: 54.809064728970625
 
374
  value: 54.809064728970625
375
  - type: v_measure_std
376
  value: 14.497861425102215
377
+ - task:
378
  type: Clustering
379
+ dataset:
 
380
  name: MTEB ArxivClusteringS2S (default)
 
 
381
  type: mteb/arxiv-clustering-s2s
382
+ config: default
383
+ split: test
384
+ revision: f910caf1a6075f7329cdf8c1a6135696f37dbd53
385
  metrics:
386
  - type: main_score
387
  value: 50.144159631474416
 
389
  value: 50.144159631474416
390
  - type: v_measure_std
391
  value: 14.596959041091187
392
+ - task:
393
+ type: Reranking
394
+ dataset:
 
395
  name: MTEB AskUbuntuDupQuestions (default)
 
 
396
  type: mteb/askubuntudupquestions-reranking
397
+ config: default
398
+ split: test
399
+ revision: 2000358ca161889fa9c082cb41daa8dcfb161a54
400
  metrics:
401
  - type: main_score
402
  value: 65.74396432331054
 
416
  value: 34.51981156443003
417
  - type: nAUC_mrr_std
418
  value: 28.863440464092747
419
+ - task:
420
+ type: STS
421
+ dataset:
 
422
  name: MTEB BIOSSES (default)
 
 
423
  type: mteb/biosses-sts
424
+ config: default
425
+ split: test
426
+ revision: d3fb88f8f02e40887cd149695127462bbcf29b4a
427
  metrics:
428
  - type: cosine_pearson
429
  value: 86.59612727828603
 
443
  value: 86.59612727828603
444
  - type: spearman
445
  value: 85.83087137728063
446
+ - task:
447
+ type: Classification
448
+ dataset:
 
449
  name: MTEB Banking77Classification (default)
 
 
450
  type: mteb/banking77
451
+ config: default
452
+ split: test
453
+ revision: 0fd18e25b25c072e09e0d92ab615fda904d66300
454
  metrics:
455
  - type: accuracy
456
  value: 90.19155844155846
 
460
  value: 90.05716678902826
461
  - type: main_score
462
  value: 90.19155844155846
463
+ - task:
464
+ type: Clustering
465
+ dataset:
 
466
  name: MTEB BiorxivClusteringP2P (default)
 
 
467
  type: mteb/biorxiv-clustering-p2p
468
+ config: default
469
+ split: test
470
+ revision: 65b79d1d13f80053f67aca9498d9402c2d9f1f40
471
  metrics:
472
  - type: main_score
473
  value: 52.480294793961924
 
475
  value: 52.480294793961924
476
  - type: v_measure_std
477
  value: 0.5558452294416437
478
+ - task:
479
  type: Clustering
480
+ dataset:
 
481
  name: MTEB BiorxivClusteringS2S (default)
 
 
482
  type: mteb/biorxiv-clustering-s2s
483
+ config: default
484
+ split: test
485
+ revision: 258694dd0231531bc1fd9de6ceb52a0853c6d908
486
  metrics:
487
  - type: main_score
488
  value: 48.51901581759115
 
490
  value: 48.51901581759115
491
  - type: v_measure_std
492
  value: 1.1094735884191569
493
+ - task:
494
+ type: Retrieval
495
+ dataset:
 
496
  name: MTEB CQADupstackAndroidRetrieval (default)
 
 
497
  type: mteb/cqadupstack-android
498
+ config: default
499
+ split: test
500
+ revision: f46a197baaae43b4f621051089b82a364682dfeb
501
  metrics:
502
  - type: main_score
503
  value: 57.9
 
781
  value: 54.764
782
  - type: recall_at_5
783
  value: 62.089000000000006
784
+ - task:
785
  type: Retrieval
786
+ dataset:
 
787
  name: MTEB CQADupstackEnglishRetrieval (default)
 
 
788
  type: mteb/cqadupstack-english
789
+ config: default
790
+ split: test
791
+ revision: ad9991cb51e31e31e430383c75ffb2885547b5f0
792
  metrics:
793
  - type: main_score
794
  value: 55.474000000000004
 
1072
  value: 53.36300000000001
1073
  - type: recall_at_5
1074
  value: 58.987
1075
+ - task:
1076
  type: Retrieval
1077
+ dataset:
 
1078
  name: MTEB CQADupstackGamingRetrieval (default)
 
 
1079
  type: mteb/cqadupstack-gaming
1080
+ config: default
1081
+ split: test
1082
+ revision: 4885aa143210c98657558c04aaf3dc47cfb54340
1083
  metrics:
1084
  - type: main_score
1085
  value: 65.236
 
1363
  value: 65.359
1364
  - type: recall_at_5
1365
  value: 71.439
1366
+ - task:
1367
  type: Retrieval
1368
+ dataset:
 
1369
  name: MTEB CQADupstackGisRetrieval (default)
 
 
1370
  type: mteb/cqadupstack-gis
1371
+ config: default
1372
+ split: test
1373
+ revision: 5003b3064772da1887988e05400cf3806fe491f2
1374
  metrics:
1375
  - type: main_score
1376
  value: 43.736999999999995
 
1654
  value: 42.295
1655
  - type: recall_at_5
1656
  value: 49.275999999999996
1657
+ - task:
1658
  type: Retrieval
1659
+ dataset:
 
1660
  name: MTEB CQADupstackMathematicaRetrieval (default)
 
 
1661
  type: mteb/cqadupstack-mathematica
1662
+ config: default
1663
+ split: test
1664
+ revision: 90fceea13679c63fe563ded68f3b6f06e50061de
1665
  metrics:
1666
  - type: main_score
1667
  value: 38.766
 
1945
  value: 36.278
1946
  - type: recall_at_5
1947
  value: 43.38
1948
+ - task:
1949
  type: Retrieval
1950
+ dataset:
 
1951
  name: MTEB CQADupstackPhysicsRetrieval (default)
 
 
1952
  type: mteb/cqadupstack-physics
1953
+ config: default
1954
+ split: test
1955
+ revision: 79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4
1956
  metrics:
1957
  - type: main_score
1958
  value: 53.893
 
2236
  value: 52.5
2237
  - type: recall_at_5
2238
  value: 59.489000000000004
2239
+ - task:
2240
  type: Retrieval
2241
+ dataset:
 
2242
  name: MTEB CQADupstackProgrammersRetrieval (default)
 
 
2243
  type: mteb/cqadupstack-programmers
2244
+ config: default
2245
+ split: test
2246
+ revision: 6184bc1440d2dbc7612be22b50686b8826d22b32
2247
  metrics:
2248
  - type: main_score
2249
  value: 51.151
 
2527
  value: 48.254000000000005
2528
  - type: recall_at_5
2529
  value: 55.595000000000006
2530
+ - task:
2531
  type: Retrieval
2532
+ dataset:
 
2533
  name: MTEB CQADupstackRetrieval (default)
 
 
2534
  type: CQADupstackRetrieval_is_a_combined_dataset
2535
+ config: default
2536
+ split: test
2537
+ revision: CQADupstackRetrieval_is_a_combined_dataset
2538
  metrics:
2539
  - type: main_score
2540
  value: 48.669000000000004
2541
  - type: ndcg_at_10
2542
  value: 48.669000000000004
2543
+ - task:
2544
  type: Retrieval
2545
+ dataset:
 
2546
  name: MTEB CQADupstackStatsRetrieval (default)
 
 
2547
  type: mteb/cqadupstack-stats
2548
+ config: default
2549
+ split: test
2550
+ revision: 65ac3a16b8e91f9cee4c9828cc7c335575432a2a
2551
  metrics:
2552
  - type: main_score
2553
  value: 41.521
 
2831
  value: 40.373
2832
  - type: recall_at_5
2833
  value: 46.421
2834
+ - task:
2835
  type: Retrieval
2836
+ dataset:
 
2837
  name: MTEB CQADupstackTexRetrieval (default)
 
 
2838
  type: mteb/cqadupstack-tex
2839
+ config: default
2840
+ split: test
2841
+ revision: 46989137a86843e03a6195de44b09deda022eec7
2842
  metrics:
2843
  - type: main_score
2844
  value: 37.183
 
3122
  value: 35.522999999999996
3123
  - type: recall_at_5
3124
  value: 41.746
3125
+ - task:
3126
  type: Retrieval
3127
+ dataset:
 
3128
  name: MTEB CQADupstackUnixRetrieval (default)
 
 
3129
  type: mteb/cqadupstack-unix
3130
+ config: default
3131
+ split: test
3132
+ revision: 6c6430d3a6d36f8d2a829195bc5dc94d7e063e53
3133
  metrics:
3134
  - type: main_score
3135
  value: 51.396
 
3413
  value: 49.833
3414
  - type: recall_at_5
3415
  value: 55.145999999999994
3416
+ - task:
3417
  type: Retrieval
3418
+ dataset:
 
3419
  name: MTEB CQADupstackWebmastersRetrieval (default)
 
 
3420
  type: mteb/cqadupstack-webmasters
3421
+ config: default
3422
+ split: test
3423
+ revision: 160c094312a0e1facb97e55eeddb698c0abe3571
3424
  metrics:
3425
  - type: main_score
3426
  value: 48.229
 
3704
  value: 45.072
3705
  - type: recall_at_5
3706
  value: 52.993
3707
+ - task:
3708
  type: Retrieval
3709
+ dataset:
 
3710
  name: MTEB CQADupstackWordpressRetrieval (default)
 
 
3711
  type: mteb/cqadupstack-wordpress
3712
+ config: default
3713
+ split: test
3714
+ revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
3715
  metrics:
3716
  - type: main_score
3717
  value: 39.542
 
3995
  value: 38.29
3996
  - type: recall_at_5
3997
  value: 43.817
3998
+ - task:
3999
  type: Retrieval
4000
+ dataset:
 
4001
  name: MTEB ClimateFEVER (default)
 
 
4002
  type: mteb/climate-fever
4003
+ config: default
4004
+ split: test
4005
+ revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
4006
  metrics:
4007
  - type: main_score
4008
  value: 45.765
 
4286
  value: 34.846
4287
  - type: recall_at_5
4288
  value: 43.504
4289
+ - task:
4290
  type: Retrieval
4291
+ dataset:
 
4292
  name: MTEB DBPedia (default)
 
 
4293
  type: mteb/dbpedia
4294
+ config: default
4295
+ split: test
4296
+ revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
4297
  metrics:
4298
  - type: main_score
4299
  value: 49.747
 
4577
  value: 17.218
4578
  - type: recall_at_5
4579
  value: 21.275
4580
+ - task:
4581
+ type: Classification
4582
+ dataset:
 
4583
  name: MTEB EmotionClassification (default)
 
 
4584
  type: mteb/emotion
4585
+ config: default
4586
+ split: test
4587
+ revision: 4f58c6b202a23cf9a4da393831edf4f9183cad37
4588
  metrics:
4589
  - type: accuracy
4590
  value: 91.86500000000001
 
4594
  value: 92.0659899919408
4595
  - type: main_score
4596
  value: 91.86500000000001
4597
+ - task:
4598
+ type: Retrieval
4599
+ dataset:
 
4600
  name: MTEB FEVER (default)
 
 
4601
  type: mteb/fever
4602
+ config: default
4603
+ split: test
4604
+ revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
4605
  metrics:
4606
  - type: main_score
4607
  value: 92.324
 
4885
  value: 93.806
4886
  - type: recall_at_5
4887
  value: 95.36
4888
+ - task:
4889
  type: Retrieval
4890
+ dataset:
 
4891
  name: MTEB FiQA2018 (default)
 
 
4892
  type: mteb/fiqa
4893
+ config: default
4894
+ split: test
4895
+ revision: 27a168819829fe9bcd655c2df245fb19452e8e06
4896
  metrics:
4897
  - type: main_score
4898
  value: 61.565999999999995
 
5176
  value: 51.782
5177
  - type: recall_at_5
5178
  value: 59.911
5179
+ - task:
5180
  type: Retrieval
5181
+ dataset:
 
5182
  name: MTEB HotpotQA (default)
 
 
5183
  type: mteb/hotpotqa
5184
+ config: default
5185
+ split: test
5186
+ revision: ab518f4d6fcca38d87c25209f94beba119d02014
5187
  metrics:
5188
  - type: main_score
5189
  value: 85.71
 
5467
  value: 80.891
5468
  - type: recall_at_5
5469
  value: 85.307
5470
+ - task:
5471
+ type: Classification
5472
+ dataset:
 
5473
  name: MTEB ImdbClassification (default)
 
 
5474
  type: mteb/imdb
5475
+ config: default
5476
+ split: test
5477
+ revision: 3d86128a09e091d6018b6d26cad27f2739fc2db7
5478
  metrics:
5479
  - type: accuracy
5480
  value: 96.9972
 
5488
  value: 96.99685931130435
5489
  - type: main_score
5490
  value: 96.9972
5491
+ - task:
5492
+ type: Retrieval
5493
+ dataset:
 
5494
  name: MTEB MSMARCO (default)
 
 
5495
  type: mteb/msmarco
5496
+ config: default
5497
+ split: dev
5498
+ revision: c5a29a104738b98a9e76336939199e264163d4a0
5499
  metrics:
5500
  - type: main_score
5501
  value: 47.238
 
5779
  value: 47.714
5780
  - type: recall_at_5
5781
  value: 57.913000000000004
5782
+ - task:
5783
+ type: Classification
5784
+ dataset:
 
5785
  name: MTEB MTOPDomainClassification (en)
 
 
5786
  type: mteb/mtop_domain
5787
+ config: en
5788
+ split: test
5789
+ revision: d80d48c1eb48d3562165c59d59d0034df9fff0bf
5790
  metrics:
5791
  - type: accuracy
5792
  value: 97.43502051983585
 
5796
  value: 97.44797640554678
5797
  - type: main_score
5798
  value: 97.43502051983585
5799
+ - task:
5800
  type: Classification
5801
+ dataset:
 
5802
  name: MTEB MTOPIntentClassification (en)
 
 
5803
  type: mteb/mtop_intent
5804
+ config: en
5805
+ split: test
5806
+ revision: ae001d0e6b1228650b7bd1c2c65fb50ad11a8aba
5807
  metrics:
5808
  - type: accuracy
5809
  value: 92.80665754673961
 
5813
  value: 93.45063761064331
5814
  - type: main_score
5815
  value: 92.80665754673961
5816
+ - task:
5817
  type: Classification
5818
+ dataset:
 
5819
  name: MTEB MassiveIntentClassification (en)
 
 
5820
  type: mteb/amazon_massive_intent
5821
+ config: en
5822
+ split: test
5823
+ revision: 4672e20407010da34463acc759c162ca9734bca6
5824
  metrics:
5825
  - type: accuracy
5826
  value: 81.14324142568931
 
5830
  value: 80.06102282439677
5831
  - type: main_score
5832
  value: 81.14324142568931
5833
+ - task:
5834
  type: Classification
5835
+ dataset:
 
5836
  name: MTEB MassiveScenarioClassification (en)
 
 
5837
  type: mteb/amazon_massive_scenario
5838
+ config: en
5839
+ split: test
5840
+ revision: fad2c6e8459f9e1c45d9315f4953d921437d70f8
5841
  metrics:
5842
  - type: accuracy
5843
  value: 83.52723604572965
 
5847
  value: 83.18340208761732
5848
  - type: main_score
5849
  value: 83.52723604572965
5850
+ - task:
5851
+ type: Clustering
5852
+ dataset:
 
5853
  name: MTEB MedrxivClusteringP2P (default)
 
 
5854
  type: mteb/medrxiv-clustering-p2p
5855
+ config: default
5856
+ split: test
5857
+ revision: e7a26af6f3ae46b30dde8737f02c07b1505bcc73
5858
  metrics:
5859
  - type: main_score
5860
  value: 46.38149873605036
 
5862
  value: 46.38149873605036
5863
  - type: v_measure_std
5864
  value: 1.0749788856434186
5865
+ - task:
5866
  type: Clustering
5867
+ dataset:
 
5868
  name: MTEB MedrxivClusteringS2S (default)
 
 
5869
  type: mteb/medrxiv-clustering-s2s
5870
+ config: default
5871
+ split: test
5872
+ revision: 35191c8c0dca72d8ff3efcd72aa802307d469663
5873
  metrics:
5874
  - type: main_score
5875
  value: 44.8945524407664
 
5877
  value: 44.8945524407664
5878
  - type: v_measure_std
5879
  value: 1.2389193370528488
5880
+ - task:
5881
+ type: Reranking
5882
+ dataset:
 
5883
  name: MTEB MindSmallReranking (default)
 
 
5884
  type: mteb/mind_small
5885
+ config: default
5886
+ split: test
5887
+ revision: 59042f120c80e8afa9cdbb224f67076cec0fc9a7
5888
  metrics:
5889
  - type: main_score
5890
  value: 31.464871623418794
 
5904
  value: -19.359704641723024
5905
  - type: nAUC_mrr_std
5906
  value: 0.2553333974009825
5907
+ - task:
5908
+ type: Retrieval
5909
+ dataset:
 
5910
  name: MTEB NFCorpus (default)
 
 
5911
  type: mteb/nfcorpus
5912
+ config: default
5913
+ split: test
5914
+ revision: ec0fa4fe99da2ff19ca1214b7966684033a58814
5915
  metrics:
5916
  - type: main_score
5917
  value: 40.608
 
6195
  value: 12.592999999999998
6196
  - type: recall_at_5
6197
  value: 15.847
6198
+ - task:
6199
  type: Retrieval
6200
+ dataset:
 
6201
  name: MTEB NQ (default)
 
 
6202
  type: mteb/nq
6203
+ config: default
6204
+ split: test
6205
+ revision: b774495ed302d8c44a3a7ea25c90dbce03968f31
6206
  metrics:
6207
  - type: main_score
6208
  value: 74.639
 
6486
  value: 76.32
6487
  - type: recall_at_5
6488
  value: 83.992
6489
+ - task:
6490
  type: Retrieval
6491
+ dataset:
 
6492
  name: MTEB QuoraRetrieval (default)
 
 
6493
  type: mteb/quora
6494
+ config: default
6495
+ split: test
6496
+ revision: e4e08e0b7dbe3c8700f0daef558ff32256715259
6497
  metrics:
6498
  - type: main_score
6499
  value: 90.78500000000001
 
6777
  value: 89.85499999999999
6778
  - type: recall_at_5
6779
  value: 93.758
6780
+ - task:
6781
+ type: Clustering
6782
+ dataset:
 
6783
  name: MTEB RedditClustering (default)
 
 
6784
  type: mteb/reddit-clustering
6785
+ config: default
6786
+ split: test
6787
+ revision: 24640382cdbf8abc73003fb0fa6d111a705499eb
6788
  metrics:
6789
  - type: main_score
6790
  value: 72.36527124460562
 
6792
  value: 72.36527124460562
6793
  - type: v_measure_std
6794
  value: 2.7778891945364195
6795
+ - task:
6796
  type: Clustering
6797
+ dataset:
 
6798
  name: MTEB RedditClusteringP2P (default)
 
 
6799
  type: mteb/reddit-clustering-p2p
6800
+ config: default
6801
+ split: test
6802
+ revision: 385e3cb46b4cfa89021f56c4380204149d0efe33
6803
  metrics:
6804
  - type: main_score
6805
  value: 73.89142551084535
 
6807
  value: 73.89142551084535
6808
  - type: v_measure_std
6809
  value: 11.258242813412751
6810
+ - task:
6811
+ type: Retrieval
6812
+ dataset:
 
6813
  name: MTEB SCIDOCS (default)
 
 
6814
  type: mteb/scidocs
6815
+ config: default
6816
+ split: test
6817
+ revision: f8c2fcf00f625baaa80f62ec5bd9e1fff3b8ae88
6818
  metrics:
6819
  - type: main_score
6820
  value: 28.538000000000004
 
7098
  value: 15.573
7099
  - type: recall_at_5
7100
  value: 20.948
7101
+ - task:
7102
+ type: STS
7103
+ dataset:
 
7104
  name: MTEB SICK-R (default)
 
 
7105
  type: mteb/sickr-sts
7106
+ config: default
7107
+ split: test
7108
+ revision: 20a6d6f312dd54037fe07a32d58e5e168867909d
7109
  metrics:
7110
  - type: cosine_pearson
7111
  value: 84.37281363343187
 
7125
  value: 84.37281363343187
7126
  - type: spearman
7127
  value: 83.30200195593044
7128
+ - task:
7129
  type: STS
7130
+ dataset:
 
7131
  name: MTEB STS12 (default)
 
 
7132
  type: mteb/sts12-sts
7133
+ config: default
7134
+ split: test
7135
+ revision: a0d554a64d88156834ff5ae9920b964011b16384
7136
  metrics:
7137
  - type: cosine_pearson
7138
  value: 86.82824905521925
 
7152
  value: 86.82824905521925
7153
  - type: spearman
7154
  value: 80.98590815911939
7155
+ - task:
7156
  type: STS
7157
+ dataset:
 
7158
  name: MTEB STS13 (default)
 
 
7159
  type: mteb/sts13-sts
7160
+ config: default
7161
+ split: test
7162
+ revision: 7e90230a92c190f1bf69ae9002b8cea547a64cca
7163
  metrics:
7164
  - type: cosine_pearson
7165
  value: 87.19722316157294
 
7179
  value: 87.19722316157294
7180
  - type: spearman
7181
  value: 87.34287142701457
7182
+ - task:
7183
  type: STS
7184
+ dataset:
 
7185
  name: MTEB STS14 (default)
 
 
7186
  type: mteb/sts14-sts
7187
+ config: default
7188
+ split: test
7189
+ revision: 6031580fec1f6af667f0bd2da0a551cf4f0b2375
7190
  metrics:
7191
  - type: cosine_pearson
7192
  value: 84.82646675904164
 
7206
  value: 84.82646675904164
7207
  - type: spearman
7208
  value: 84.38843815801556
7209
+ - task:
7210
  type: STS
7211
+ dataset:
 
7212
  name: MTEB STS15 (default)
 
 
7213
  type: mteb/sts15-sts
7214
+ config: default
7215
+ split: test
7216
+ revision: ae752c7c21bf194d8b67fd573edf7ae58183cbe3
7217
  metrics:
7218
  - type: cosine_pearson
7219
  value: 89.69909533656704
 
7233
  value: 89.69909533656704
7234
  - type: spearman
7235
  value: 89.74723322749233
7236
+ - task:
7237
  type: STS
7238
+ dataset:
 
7239
  name: MTEB STS16 (default)
 
 
7240
  type: mteb/sts16-sts
7241
+ config: default
7242
+ split: test
7243
+ revision: 4d8694f8f0e0100860b497b999b3dbed754a0513
7244
  metrics:
7245
  - type: cosine_pearson
7246
  value: 86.84947603401746
 
7260
  value: 86.84947603401746
7261
  - type: spearman
7262
  value: 87.63022743056388
7263
+ - task:
7264
  type: STS
7265
+ dataset:
 
7266
  name: MTEB STS17 (en-en)
 
 
7267
  type: mteb/sts17-crosslingual-sts
7268
+ config: en-en
7269
+ split: test
7270
+ revision: faeb762787bd10488a50c8b5be4a3b82e411949c
7271
  metrics:
7272
  - type: cosine_pearson
7273
  value: 91.43391567649913
 
7287
  value: 91.43391567649913
7288
  - type: spearman
7289
  value: 90.86953801008369
7290
+ - task:
7291
  type: STS
7292
+ dataset:
 
7293
  name: MTEB STS22 (en)
 
 
7294
  type: mteb/sts22-crosslingual-sts
7295
+ config: en
7296
+ split: test
7297
+ revision: de9d86b3b84231dc21f76c7b7af1f28e2f57f6e3
7298
  metrics:
7299
  - type: cosine_pearson
7300
  value: 68.81338409687908
 
7314
  value: 68.81338409687908
7315
  - type: spearman
7316
  value: 68.09215270009086
7317
+ - task:
7318
  type: STS
7319
+ dataset:
 
7320
  name: MTEB STSBenchmark (default)
 
 
7321
  type: mteb/stsbenchmark-sts
7322
+ config: default
7323
+ split: test
7324
+ revision: b0fddb56ed78048fa8b90373c8a3cfc37b684831
7325
  metrics:
7326
  - type: cosine_pearson
7327
  value: 87.93191595794555
 
7341
  value: 87.93191595794555
7342
  - type: spearman
7343
  value: 88.46646307403641
7344
+ - task:
7345
+ type: Reranking
7346
+ dataset:
 
7347
  name: MTEB SciDocsRR (default)
 
 
7348
  type: mteb/scidocs-reranking
7349
+ config: default
7350
+ split: test
7351
+ revision: d3c5e1fc0b855ab6097bf1cda04dd73947d7caab
7352
  metrics:
7353
  - type: main_score
7354
  value: 87.62672056519489
 
7368
  value: 82.4844792677926
7369
  - type: nAUC_mrr_std
7370
  value: 82.0357865297397
7371
+ - task:
7372
+ type: Retrieval
7373
+ dataset:
 
7374
  name: MTEB SciFact (default)
 
 
7375
  type: mteb/scifact
7376
+ config: default
7377
+ split: test
7378
+ revision: 0228b52cf27578f30900b9e5271d331663a030d7
7379
  metrics:
7380
  - type: main_score
7381
  value: 79.745
 
7659
  value: 81.072
7660
  - type: recall_at_5
7661
  value: 87.339
7662
+ - task:
7663
+ type: PairClassification
7664
+ dataset:
 
7665
  name: MTEB SprintDuplicateQuestions (default)
 
 
7666
  type: mteb/sprintduplicatequestions-pairclassification
7667
+ config: default
7668
+ split: test
7669
+ revision: d66bd1f72af766a5cc4b0ca5e00c162f89e8cc46
7670
  metrics:
7671
  - type: cosine_accuracy
7672
  value: 99.86039603960396
 
7750
  value: 93.69277721261444
7751
  - type: similarity_recall
7752
  value: 92.10000000000001
7753
+ - task:
7754
+ type: Clustering
7755
+ dataset:
 
7756
  name: MTEB StackExchangeClustering (default)
 
 
7757
  type: mteb/stackexchange-clustering
7758
+ config: default
7759
+ split: test
7760
+ revision: 6cbc1f7b2bc0622f2e39d2c77fa502909748c259
7761
  metrics:
7762
  - type: main_score
7763
  value: 81.5950420419382
 
7765
  value: 81.5950420419382
7766
  - type: v_measure_std
7767
  value: 2.3518861207789126
7768
+ - task:
7769
  type: Clustering
7770
+ dataset:
 
7771
  name: MTEB StackExchangeClusteringP2P (default)
 
 
7772
  type: mteb/stackexchange-clustering-p2p
7773
+ config: default
7774
+ split: test
7775
+ revision: 815ca46b2622cec33ccafc3735d572c266efdb44
7776
  metrics:
7777
  - type: main_score
7778
  value: 44.40836435329055
 
7780
  value: 44.40836435329055
7781
  - type: v_measure_std
7782
  value: 1.3850659888959282
7783
+ - task:
7784
+ type: Reranking
7785
+ dataset:
 
7786
  name: MTEB StackOverflowDupQuestions (default)
 
 
7787
  type: mteb/stackoverflowdupquestions-reranking
7788
+ config: default
7789
+ split: test
7790
+ revision: e185fbe320c72810689fc5848eb6114e1ef5ec69
7791
  metrics:
7792
  - type: main_score
7793
  value: 58.792345747482436
 
7807
  value: 14.587424770057197
7808
  - type: nAUC_mrr_std
7809
  value: 6.683981115477786
7810
+ - task:
7811
+ type: Summarization
7812
+ dataset:
 
7813
  name: MTEB SummEval (default)
 
 
7814
  type: mteb/summeval
7815
+ config: default
7816
+ split: test
7817
+ revision: cda12ad7615edc362dbf25a00fdd61d3b1eaf93c
7818
  metrics:
7819
  - type: cosine_pearson
7820
  value: 29.605378173647523
 
7830
  value: 29.605378173647523
7831
  - type: spearman
7832
  value: 29.538937618105475
7833
+ - task:
7834
+ type: Retrieval
7835
+ dataset:
 
7836
  name: MTEB TRECCOVID (default)
 
 
7837
  type: mteb/trec-covid
7838
+ config: default
7839
+ split: test
7840
+ revision: bb9466bac8153a0349341eb1b22e06409e78ef4e
7841
  metrics:
7842
  - type: main_score
7843
  value: 77.17500000000001
 
8121
  value: 0.677
8122
  - type: recall_at_5
8123
  value: 1.087
8124
+ - task:
8125
  type: Retrieval
8126
+ dataset:
 
8127
  name: MTEB Touche2020 (default)
 
 
8128
  type: mteb/touche2020
8129
+ config: default
8130
+ split: test
8131
+ revision: a34f9a33db75fa0cbb21bb5cfc3dae8dc8bec93f
8132
  metrics:
8133
  - type: main_score
8134
  value: 29.343000000000004
 
8412
  value: 7.868
8413
  - type: recall_at_5
8414
  value: 11.413
8415
+ - task:
8416
+ type: Classification
8417
+ dataset:
 
8418
  name: MTEB ToxicConversationsClassification (default)
 
 
8419
  type: mteb/toxic_conversations_50k
8420
+ config: default
8421
+ split: test
8422
+ revision: edfaf9da55d3dd50d43143d90c1ac476895ae6de
8423
  metrics:
8424
  - type: accuracy
8425
  value: 92.3681640625
 
8433
  value: 93.14474638528736
8434
  - type: main_score
8435
  value: 92.3681640625
8436
+ - task:
8437
  type: Classification
8438
+ dataset:
 
8439
  name: MTEB TweetSentimentExtractionClassification (default)
 
 
8440
  type: mteb/tweet_sentiment_extraction
8441
+ config: default
8442
+ split: test
8443
+ revision: d604517c81ca91fe16a244d1248fc021f9ecee7a
8444
  metrics:
8445
  - type: accuracy
8446
  value: 80.42161856253539
 
8450
  value: 80.3228654725881
8451
  - type: main_score
8452
  value: 80.42161856253539
8453
+ - task:
8454
+ type: Clustering
8455
+ dataset:
 
8456
  name: MTEB TwentyNewsgroupsClustering (default)
 
 
8457
  type: mteb/twentynewsgroups-clustering
8458
+ config: default
8459
+ split: test
8460
+ revision: 6125ec4e24fa026cec8a478383ee943acfbd5449
8461
  metrics:
8462
  - type: main_score
8463
  value: 68.78385330772423
 
8465
  value: 68.78385330772423
8466
  - type: v_measure_std
8467
  value: 1.4814035017480702
8468
+ - task:
8469
+ type: PairClassification
8470
+ dataset:
 
8471
  name: MTEB TwitterSemEval2015 (default)
 
 
8472
  type: mteb/twittersemeval2015-pairclassification
8473
+ config: default
8474
+ split: test
8475
+ revision: 70970daeab8776df92f5ea462b6173c0b46fd2d1
8476
  metrics:
8477
  - type: cosine_accuracy
8478
  value: 87.96566728258925
 
8556
  value: 68.30357142857143
8557
  - type: similarity_recall
8558
  value: 76.7018469656992
8559
+ - task:
8560
  type: PairClassification
8561
+ dataset:
 
8562
  name: MTEB TwitterURLCorpus (default)
 
 
8563
  type: mteb/twitterurlcorpus-pairclassification
8564
+ config: default
8565
+ split: test
8566
+ revision: 8b6510b0b1fa4e4c4f879467980e9be563ec1cdf
8567
  metrics:
8568
  - type: cosine_accuracy
8569
  value: 89.48073116777273
 
8647
  value: 75.27245137260311
8648
  - type: similarity_recall
8649
  value: 84.02371419772098
 
 
8650
  ---
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/projects/0/prjs0835/ACL25/reps-llm-2/huggingface_models/wrap_model/model_lens_8000",
3
+ "architectures": [
4
+ "MistralModel"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 2,
9
+ "head_dim": 128,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 4096,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 14336,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "mistral",
16
+ "num_attention_heads": 32,
17
+ "num_hidden_layers": 32,
18
+ "num_key_value_heads": 8,
19
+ "rms_norm_eps": 1e-05,
20
+ "rope_theta": 10000.0,
21
+ "sliding_window": 4096,
22
+ "tie_word_embeddings": false,
23
+ "torch_dtype": "float32",
24
+ "transformers_version": "4.43.1",
25
+ "use_cache": false,
26
+ "vocab_size": 32003
27
+ }
model-00001-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bb494b856d59521f7aa3f85d267047c8bb0989e3ef3877164d090a1b73c5250
3
+ size 4987245800
model-00002-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db48eac273441e1ce91b8df5df3da14cb995b37b2384c414ac2944a55530aec2
3
+ size 4899116152
model-00003-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62b83abd1fa64fbc428083bef0cfbb1f67e49c1d83c12aa36350df787ef32907
3
+ size 4999812808
model-00004-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa05808ae834fa506c16f96e60264363947fe64b9978bdc2a796333866561852
3
+ size 4999812808
model-00005-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01441d94a31f225bff2a4a1c3a18030697ab14cd34a24d66dab290203a150309
3
+ size 4832007216
model-00006-of-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4044180ffe3a641d301ef30b9d7c26f8fddc1a915f509579e9710d30b5a1e51f
3
+ size 3724726552
model.safetensors.index.json ADDED
@@ -0,0 +1,297 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "total_size": 28442689536
4
+ },
5
+ "weight_map": {
6
+ "embed_tokens.weight": "model-00001-of-00006.safetensors",
7
+ "layers.0.input_layernorm.weight": "model-00001-of-00006.safetensors",
8
+ "layers.0.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
9
+ "layers.0.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
10
+ "layers.0.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
11
+ "layers.0.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
12
+ "layers.0.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
13
+ "layers.0.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
14
+ "layers.0.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
15
+ "layers.0.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
16
+ "layers.1.input_layernorm.weight": "model-00001-of-00006.safetensors",
17
+ "layers.1.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
18
+ "layers.1.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
19
+ "layers.1.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
20
+ "layers.1.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
21
+ "layers.1.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
22
+ "layers.1.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
23
+ "layers.1.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
24
+ "layers.1.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
25
+ "layers.10.input_layernorm.weight": "model-00003-of-00006.safetensors",
26
+ "layers.10.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
27
+ "layers.10.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
28
+ "layers.10.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
29
+ "layers.10.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
30
+ "layers.10.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
31
+ "layers.10.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
32
+ "layers.10.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
33
+ "layers.10.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
34
+ "layers.11.input_layernorm.weight": "model-00003-of-00006.safetensors",
35
+ "layers.11.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
36
+ "layers.11.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
37
+ "layers.11.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
38
+ "layers.11.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
39
+ "layers.11.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
40
+ "layers.11.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
41
+ "layers.11.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
42
+ "layers.11.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
43
+ "layers.12.input_layernorm.weight": "model-00003-of-00006.safetensors",
44
+ "layers.12.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
45
+ "layers.12.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
46
+ "layers.12.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
47
+ "layers.12.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
48
+ "layers.12.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
49
+ "layers.12.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
50
+ "layers.12.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
51
+ "layers.12.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
52
+ "layers.13.input_layernorm.weight": "model-00003-of-00006.safetensors",
53
+ "layers.13.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
54
+ "layers.13.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
55
+ "layers.13.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
56
+ "layers.13.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
57
+ "layers.13.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
58
+ "layers.13.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
59
+ "layers.13.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
60
+ "layers.13.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
61
+ "layers.14.input_layernorm.weight": "model-00003-of-00006.safetensors",
62
+ "layers.14.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
63
+ "layers.14.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
64
+ "layers.14.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
65
+ "layers.14.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
66
+ "layers.14.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
67
+ "layers.14.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
68
+ "layers.14.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
69
+ "layers.14.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
70
+ "layers.15.input_layernorm.weight": "model-00003-of-00006.safetensors",
71
+ "layers.15.mlp.down_proj.weight": "model-00003-of-00006.safetensors",
72
+ "layers.15.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
73
+ "layers.15.mlp.up_proj.weight": "model-00003-of-00006.safetensors",
74
+ "layers.15.post_attention_layernorm.weight": "model-00003-of-00006.safetensors",
75
+ "layers.15.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
76
+ "layers.15.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
77
+ "layers.15.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
78
+ "layers.15.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
79
+ "layers.16.input_layernorm.weight": "model-00004-of-00006.safetensors",
80
+ "layers.16.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
81
+ "layers.16.mlp.gate_proj.weight": "model-00003-of-00006.safetensors",
82
+ "layers.16.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
83
+ "layers.16.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
84
+ "layers.16.self_attn.k_proj.weight": "model-00003-of-00006.safetensors",
85
+ "layers.16.self_attn.o_proj.weight": "model-00003-of-00006.safetensors",
86
+ "layers.16.self_attn.q_proj.weight": "model-00003-of-00006.safetensors",
87
+ "layers.16.self_attn.v_proj.weight": "model-00003-of-00006.safetensors",
88
+ "layers.17.input_layernorm.weight": "model-00004-of-00006.safetensors",
89
+ "layers.17.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
90
+ "layers.17.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
91
+ "layers.17.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
92
+ "layers.17.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
93
+ "layers.17.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
94
+ "layers.17.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
95
+ "layers.17.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
96
+ "layers.17.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
97
+ "layers.18.input_layernorm.weight": "model-00004-of-00006.safetensors",
98
+ "layers.18.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
99
+ "layers.18.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
100
+ "layers.18.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
101
+ "layers.18.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
102
+ "layers.18.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
103
+ "layers.18.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
104
+ "layers.18.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
105
+ "layers.18.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
106
+ "layers.19.input_layernorm.weight": "model-00004-of-00006.safetensors",
107
+ "layers.19.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
108
+ "layers.19.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
109
+ "layers.19.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
110
+ "layers.19.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
111
+ "layers.19.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
112
+ "layers.19.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
113
+ "layers.19.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
114
+ "layers.19.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
115
+ "layers.2.input_layernorm.weight": "model-00001-of-00006.safetensors",
116
+ "layers.2.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
117
+ "layers.2.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
118
+ "layers.2.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
119
+ "layers.2.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
120
+ "layers.2.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
121
+ "layers.2.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
122
+ "layers.2.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
123
+ "layers.2.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
124
+ "layers.20.input_layernorm.weight": "model-00004-of-00006.safetensors",
125
+ "layers.20.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
126
+ "layers.20.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
127
+ "layers.20.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
128
+ "layers.20.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
129
+ "layers.20.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
130
+ "layers.20.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
131
+ "layers.20.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
132
+ "layers.20.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
133
+ "layers.21.input_layernorm.weight": "model-00004-of-00006.safetensors",
134
+ "layers.21.mlp.down_proj.weight": "model-00004-of-00006.safetensors",
135
+ "layers.21.mlp.gate_proj.weight": "model-00004-of-00006.safetensors",
136
+ "layers.21.mlp.up_proj.weight": "model-00004-of-00006.safetensors",
137
+ "layers.21.post_attention_layernorm.weight": "model-00004-of-00006.safetensors",
138
+ "layers.21.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
139
+ "layers.21.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
140
+ "layers.21.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
141
+ "layers.21.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
142
+ "layers.22.input_layernorm.weight": "model-00005-of-00006.safetensors",
143
+ "layers.22.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
144
+ "layers.22.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
145
+ "layers.22.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
146
+ "layers.22.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
147
+ "layers.22.self_attn.k_proj.weight": "model-00004-of-00006.safetensors",
148
+ "layers.22.self_attn.o_proj.weight": "model-00004-of-00006.safetensors",
149
+ "layers.22.self_attn.q_proj.weight": "model-00004-of-00006.safetensors",
150
+ "layers.22.self_attn.v_proj.weight": "model-00004-of-00006.safetensors",
151
+ "layers.23.input_layernorm.weight": "model-00005-of-00006.safetensors",
152
+ "layers.23.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
153
+ "layers.23.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
154
+ "layers.23.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
155
+ "layers.23.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
156
+ "layers.23.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
157
+ "layers.23.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
158
+ "layers.23.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
159
+ "layers.23.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
160
+ "layers.24.input_layernorm.weight": "model-00005-of-00006.safetensors",
161
+ "layers.24.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
162
+ "layers.24.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
163
+ "layers.24.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
164
+ "layers.24.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
165
+ "layers.24.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
166
+ "layers.24.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
167
+ "layers.24.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
168
+ "layers.24.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
169
+ "layers.25.input_layernorm.weight": "model-00005-of-00006.safetensors",
170
+ "layers.25.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
171
+ "layers.25.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
172
+ "layers.25.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
173
+ "layers.25.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
174
+ "layers.25.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
175
+ "layers.25.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
176
+ "layers.25.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
177
+ "layers.25.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
178
+ "layers.26.input_layernorm.weight": "model-00005-of-00006.safetensors",
179
+ "layers.26.mlp.down_proj.weight": "model-00005-of-00006.safetensors",
180
+ "layers.26.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
181
+ "layers.26.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
182
+ "layers.26.post_attention_layernorm.weight": "model-00005-of-00006.safetensors",
183
+ "layers.26.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
184
+ "layers.26.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
185
+ "layers.26.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
186
+ "layers.26.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
187
+ "layers.27.input_layernorm.weight": "model-00006-of-00006.safetensors",
188
+ "layers.27.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
189
+ "layers.27.mlp.gate_proj.weight": "model-00005-of-00006.safetensors",
190
+ "layers.27.mlp.up_proj.weight": "model-00005-of-00006.safetensors",
191
+ "layers.27.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
192
+ "layers.27.self_attn.k_proj.weight": "model-00005-of-00006.safetensors",
193
+ "layers.27.self_attn.o_proj.weight": "model-00005-of-00006.safetensors",
194
+ "layers.27.self_attn.q_proj.weight": "model-00005-of-00006.safetensors",
195
+ "layers.27.self_attn.v_proj.weight": "model-00005-of-00006.safetensors",
196
+ "layers.28.input_layernorm.weight": "model-00006-of-00006.safetensors",
197
+ "layers.28.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
198
+ "layers.28.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
199
+ "layers.28.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
200
+ "layers.28.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
201
+ "layers.28.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
202
+ "layers.28.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
203
+ "layers.28.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
204
+ "layers.28.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
205
+ "layers.29.input_layernorm.weight": "model-00006-of-00006.safetensors",
206
+ "layers.29.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
207
+ "layers.29.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
208
+ "layers.29.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
209
+ "layers.29.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
210
+ "layers.29.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
211
+ "layers.29.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
212
+ "layers.29.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
213
+ "layers.29.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
214
+ "layers.3.input_layernorm.weight": "model-00001-of-00006.safetensors",
215
+ "layers.3.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
216
+ "layers.3.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
217
+ "layers.3.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
218
+ "layers.3.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
219
+ "layers.3.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
220
+ "layers.3.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
221
+ "layers.3.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
222
+ "layers.3.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
223
+ "layers.30.input_layernorm.weight": "model-00006-of-00006.safetensors",
224
+ "layers.30.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
225
+ "layers.30.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
226
+ "layers.30.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
227
+ "layers.30.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
228
+ "layers.30.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
229
+ "layers.30.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
230
+ "layers.30.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
231
+ "layers.30.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
232
+ "layers.31.input_layernorm.weight": "model-00006-of-00006.safetensors",
233
+ "layers.31.mlp.down_proj.weight": "model-00006-of-00006.safetensors",
234
+ "layers.31.mlp.gate_proj.weight": "model-00006-of-00006.safetensors",
235
+ "layers.31.mlp.up_proj.weight": "model-00006-of-00006.safetensors",
236
+ "layers.31.post_attention_layernorm.weight": "model-00006-of-00006.safetensors",
237
+ "layers.31.self_attn.k_proj.weight": "model-00006-of-00006.safetensors",
238
+ "layers.31.self_attn.o_proj.weight": "model-00006-of-00006.safetensors",
239
+ "layers.31.self_attn.q_proj.weight": "model-00006-of-00006.safetensors",
240
+ "layers.31.self_attn.v_proj.weight": "model-00006-of-00006.safetensors",
241
+ "layers.4.input_layernorm.weight": "model-00001-of-00006.safetensors",
242
+ "layers.4.mlp.down_proj.weight": "model-00001-of-00006.safetensors",
243
+ "layers.4.mlp.gate_proj.weight": "model-00001-of-00006.safetensors",
244
+ "layers.4.mlp.up_proj.weight": "model-00001-of-00006.safetensors",
245
+ "layers.4.post_attention_layernorm.weight": "model-00001-of-00006.safetensors",
246
+ "layers.4.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
247
+ "layers.4.self_attn.o_proj.weight": "model-00001-of-00006.safetensors",
248
+ "layers.4.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
249
+ "layers.4.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
250
+ "layers.5.input_layernorm.weight": "model-00002-of-00006.safetensors",
251
+ "layers.5.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
252
+ "layers.5.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
253
+ "layers.5.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
254
+ "layers.5.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
255
+ "layers.5.self_attn.k_proj.weight": "model-00001-of-00006.safetensors",
256
+ "layers.5.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
257
+ "layers.5.self_attn.q_proj.weight": "model-00001-of-00006.safetensors",
258
+ "layers.5.self_attn.v_proj.weight": "model-00001-of-00006.safetensors",
259
+ "layers.6.input_layernorm.weight": "model-00002-of-00006.safetensors",
260
+ "layers.6.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
261
+ "layers.6.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
262
+ "layers.6.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
263
+ "layers.6.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
264
+ "layers.6.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
265
+ "layers.6.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
266
+ "layers.6.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
267
+ "layers.6.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
268
+ "layers.7.input_layernorm.weight": "model-00002-of-00006.safetensors",
269
+ "layers.7.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
270
+ "layers.7.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
271
+ "layers.7.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
272
+ "layers.7.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
273
+ "layers.7.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
274
+ "layers.7.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
275
+ "layers.7.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
276
+ "layers.7.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
277
+ "layers.8.input_layernorm.weight": "model-00002-of-00006.safetensors",
278
+ "layers.8.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
279
+ "layers.8.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
280
+ "layers.8.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
281
+ "layers.8.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
282
+ "layers.8.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
283
+ "layers.8.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
284
+ "layers.8.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
285
+ "layers.8.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
286
+ "layers.9.input_layernorm.weight": "model-00002-of-00006.safetensors",
287
+ "layers.9.mlp.down_proj.weight": "model-00002-of-00006.safetensors",
288
+ "layers.9.mlp.gate_proj.weight": "model-00002-of-00006.safetensors",
289
+ "layers.9.mlp.up_proj.weight": "model-00002-of-00006.safetensors",
290
+ "layers.9.post_attention_layernorm.weight": "model-00002-of-00006.safetensors",
291
+ "layers.9.self_attn.k_proj.weight": "model-00002-of-00006.safetensors",
292
+ "layers.9.self_attn.o_proj.weight": "model-00002-of-00006.safetensors",
293
+ "layers.9.self_attn.q_proj.weight": "model-00002-of-00006.safetensors",
294
+ "layers.9.self_attn.v_proj.weight": "model-00002-of-00006.safetensors",
295
+ "norm.weight": "model-00006-of-00006.safetensors"
296
+ }
297
+ }