anudit
/

finetuned-gte-base

@@ -1,6 +1,5 @@
 ---
 base_model: Alibaba-NLP/gte-base-en-v1.5
-datasets: []
 language:
 - en
 library_name: sentence-transformers
@@ -75,7 +74,7 @@ widget:
   - What lessons can be learned from the historical context of employee relations
     in large corporations?
 model-index:
-- name: Custom Embedding Test - Anudit Nagar
   results:
   - task:
       type: information-retrieval
@@ -85,49 +84,49 @@ model-index:
       type: dim_768
     metrics:
     - type: cosine_accuracy@1
-      value: 0.7683027145599123
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
-      value: 0.8755141211955032
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
-      value: 0.9097888675623801
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
-      value: 0.9465313956676721
       name: Cosine Accuracy@10
     - type: cosine_precision@1
-      value: 0.7683027145599123
       name: Cosine Precision@1
     - type: cosine_precision@3
-      value: 0.29183804039850103
       name: Cosine Precision@3
     - type: cosine_precision@5
-      value: 0.18195777351247602
       name: Cosine Precision@5
     - type: cosine_precision@10
-      value: 0.09465313956676721
       name: Cosine Precision@10
     - type: cosine_recall@1
-      value: 0.7683027145599123
       name: Cosine Recall@1
     - type: cosine_recall@3
-      value: 0.8755141211955032
       name: Cosine Recall@3
     - type: cosine_recall@5
-      value: 0.9097888675623801
       name: Cosine Recall@5
     - type: cosine_recall@10
-      value: 0.9465313956676721
       name: Cosine Recall@10
     - type: cosine_ndcg@10
-      value: 0.8566925927271383
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
-      value: 0.8279207524340517
       name: Cosine Mrr@10
     - type: cosine_map@100
-      value: 0.8302321946792381
       name: Cosine Map@100
   - task:
       type: information-retrieval
@@ -137,49 +136,49 @@ model-index:
       type: dim_512
     metrics:
     - type: cosine_accuracy@1
-      value: 0.762818755141212
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
-      value: 0.8700301617768028
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
-      value: 0.9062242939402249
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
-      value: 0.946257197696737
       name: Cosine Accuracy@10
     - type: cosine_precision@1
-      value: 0.762818755141212
       name: Cosine Precision@1
     - type: cosine_precision@3
-      value: 0.2900100539256009
       name: Cosine Precision@3
     - type: cosine_precision@5
-      value: 0.18124485878804497
       name: Cosine Precision@5
     - type: cosine_precision@10
-      value: 0.09462571976967371
       name: Cosine Precision@10
     - type: cosine_recall@1
-      value: 0.762818755141212
       name: Cosine Recall@1
     - type: cosine_recall@3
-      value: 0.8700301617768028
       name: Cosine Recall@3
     - type: cosine_recall@5
-      value: 0.9062242939402249
       name: Cosine Recall@5
     - type: cosine_recall@10
-      value: 0.946257197696737
       name: Cosine Recall@10
     - type: cosine_ndcg@10
-      value: 0.8529743473843932
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
-      value: 0.8231949721667308
       name: Cosine Mrr@10
     - type: cosine_map@100
-      value: 0.825407004380477
       name: Cosine Map@100
   - task:
       type: information-retrieval
@@ -189,49 +188,49 @@ model-index:
       type: dim_256
     metrics:
     - type: cosine_accuracy@1
-      value: 0.762818755141212
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
-      value: 0.8683849739511927
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
-      value: 0.9015629284343296
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
-      value: 0.9418700301617768
       name: Cosine Accuracy@10
     - type: cosine_precision@1
-      value: 0.762818755141212
       name: Cosine Precision@1
     - type: cosine_precision@3
-      value: 0.28946165798373086
       name: Cosine Precision@3
     - type: cosine_precision@5
-      value: 0.18031258568686592
       name: Cosine Precision@5
     - type: cosine_precision@10
-      value: 0.09418700301617768
       name: Cosine Precision@10
     - type: cosine_recall@1
-      value: 0.762818755141212
       name: Cosine Recall@1
     - type: cosine_recall@3
-      value: 0.8683849739511927
       name: Cosine Recall@3
     - type: cosine_recall@5
-      value: 0.9015629284343296
       name: Cosine Recall@5
     - type: cosine_recall@10
-      value: 0.9418700301617768
       name: Cosine Recall@10
     - type: cosine_ndcg@10
-      value: 0.850685453111757
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
-      value: 0.8215859088357048
       name: Cosine Mrr@10
     - type: cosine_map@100
-      value: 0.8239714751253995
       name: Cosine Map@100
   - task:
       type: information-retrieval
@@ -241,49 +240,49 @@ model-index:
       type: dim_128
     metrics:
     - type: cosine_accuracy@1
-      value: 0.7573347957225116
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
-      value: 0.8634494104743625
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
-      value: 0.8952563751028242
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
-      value: 0.9347408829174664
       name: Cosine Accuracy@10
     - type: cosine_precision@1
-      value: 0.7573347957225116
       name: Cosine Precision@1
     - type: cosine_precision@3
-      value: 0.2878164701581208
       name: Cosine Precision@3
     - type: cosine_precision@5
-      value: 0.17905127502056484
       name: Cosine Precision@5
     - type: cosine_precision@10
-      value: 0.09347408829174664
       name: Cosine Precision@10
     - type: cosine_recall@1
-      value: 0.7573347957225116
       name: Cosine Recall@1
     - type: cosine_recall@3
-      value: 0.8634494104743625
       name: Cosine Recall@3
     - type: cosine_recall@5
-      value: 0.8952563751028242
       name: Cosine Recall@5
     - type: cosine_recall@10
-      value: 0.9347408829174664
       name: Cosine Recall@10
     - type: cosine_ndcg@10
-      value: 0.8445055968214926
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
-      value: 0.8157123053956075
       name: Cosine Mrr@10
     - type: cosine_map@100
-      value: 0.8184088689781863
       name: Cosine Map@100
   - task:
       type: information-retrieval
@@ -293,55 +292,55 @@ model-index:
       type: dim_64
     metrics:
     - type: cosine_accuracy@1
-      value: 0.7419797093501508
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
-      value: 0.8530298875788319
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
-      value: 0.8859336440910337
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
-      value: 0.9284343295859611
       name: Cosine Accuracy@10
     - type: cosine_precision@1
-      value: 0.7419797093501508
       name: Cosine Precision@1
     - type: cosine_precision@3
-      value: 0.28434329585961066
       name: Cosine Precision@3
     - type: cosine_precision@5
-      value: 0.17718672881820677
       name: Cosine Precision@5
     - type: cosine_precision@10
-      value: 0.09284343295859611
       name: Cosine Precision@10
     - type: cosine_recall@1
-      value: 0.7419797093501508
       name: Cosine Recall@1
     - type: cosine_recall@3
-      value: 0.8530298875788319
       name: Cosine Recall@3
     - type: cosine_recall@5
-      value: 0.8859336440910337
       name: Cosine Recall@5
     - type: cosine_recall@10
-      value: 0.9284343295859611
       name: Cosine Recall@10
     - type: cosine_ndcg@10
-      value: 0.8334906130922063
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
-      value: 0.8032139919307455
       name: Cosine Mrr@10
     - type: cosine_map@100
-      value: 0.8057146368194794
       name: Cosine Map@100
 ---
-# Custom Embedding Test - Anudit Nagar
-This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [Alibaba-NLP/gte-base-en-v1.5](https://huggingface.co/Alibaba-NLP/gte-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
 ## Model Details
@@ -351,7 +350,8 @@ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [A
 - **Maximum Sequence Length:** 8192 tokens
 - **Output Dimensionality:** 768 dimensions
 - **Similarity Function:** Cosine Similarity
-<!-- - **Training Dataset:** Unknown -->
 - **Language:** en
 - **License:** apache-2.0
@@ -436,21 +436,21 @@ You can finetune this model on your own dataset.
 | Metric              | Value      |
 |:--------------------|:-----------|
-| cosine_accuracy@1   | 0.7683     |
-| cosine_accuracy@3   | 0.8755     |
-| cosine_accuracy@5   | 0.9098     |
-| cosine_accuracy@10  | 0.9465     |
-| cosine_precision@1  | 0.7683     |
-| cosine_precision@3  | 0.2918     |
-| cosine_precision@5  | 0.182      |
-| cosine_precision@10 | 0.0947     |
-| cosine_recall@1     | 0.7683     |
-| cosine_recall@3     | 0.8755     |
-| cosine_recall@5     | 0.9098     |
-| cosine_recall@10    | 0.9465     |
-| cosine_ndcg@10      | 0.8567     |
-| cosine_mrr@10       | 0.8279     |
-| **cosine_map@100**  | **0.8302** |
 #### Information Retrieval
 * Dataset: `dim_512`
@@ -458,43 +458,43 @@ You can finetune this model on your own dataset.
 | Metric              | Value      |
 |:--------------------|:-----------|
-| cosine_accuracy@1   | 0.7628     |
-| cosine_accuracy@3   | 0.87       |
-| cosine_accuracy@5   | 0.9062     |
-| cosine_accuracy@10  | 0.9463     |
-| cosine_precision@1  | 0.7628     |
-| cosine_precision@3  | 0.29       |
-| cosine_precision@5  | 0.1812     |
-| cosine_precision@10 | 0.0946     |
-| cosine_recall@1     | 0.7628     |
-| cosine_recall@3     | 0.87       |
-| cosine_recall@5     | 0.9062     |
-| cosine_recall@10    | 0.9463     |
-| cosine_ndcg@10      | 0.853      |
-| cosine_mrr@10       | 0.8232     |
-| **cosine_map@100**  | **0.8254** |
 #### Information Retrieval
 * Dataset: `dim_256`
 * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator)
-| Metric              | Value     |
-|:--------------------|:----------|
-| cosine_accuracy@1   | 0.7628    |
-| cosine_accuracy@3   | 0.8684    |
-| cosine_accuracy@5   | 0.9016    |
-| cosine_accuracy@10  | 0.9419    |
-| cosine_precision@1  | 0.7628    |
-| cosine_precision@3  | 0.2895    |
-| cosine_precision@5  | 0.1803    |
-| cosine_precision@10 | 0.0942    |
-| cosine_recall@1     | 0.7628    |
-| cosine_recall@3     | 0.8684    |
-| cosine_recall@5     | 0.9016    |
-| cosine_recall@10    | 0.9419    |
-| cosine_ndcg@10      | 0.8507    |
-| cosine_mrr@10       | 0.8216    |
-| **cosine_map@100**  | **0.824** |
 #### Information Retrieval
 * Dataset: `dim_128`
@@ -502,21 +502,21 @@ You can finetune this model on your own dataset.
 | Metric              | Value      |
 |:--------------------|:-----------|
-| cosine_accuracy@1   | 0.7573     |
-| cosine_accuracy@3   | 0.8634     |
-| cosine_accuracy@5   | 0.8953     |
-| cosine_accuracy@10  | 0.9347     |
-| cosine_precision@1  | 0.7573     |
-| cosine_precision@3  | 0.2878     |
-| cosine_precision@5  | 0.1791     |
-| cosine_precision@10 | 0.0935     |
-| cosine_recall@1     | 0.7573     |
-| cosine_recall@3     | 0.8634     |
-| cosine_recall@5     | 0.8953     |
-| cosine_recall@10    | 0.9347     |
-| cosine_ndcg@10      | 0.8445     |
-| cosine_mrr@10       | 0.8157     |
-| **cosine_map@100**  | **0.8184** |
 #### Information Retrieval
 * Dataset: `dim_64`
@@ -524,21 +524,21 @@ You can finetune this model on your own dataset.
 | Metric              | Value      |
 |:--------------------|:-----------|
-| cosine_accuracy@1   | 0.742      |
-| cosine_accuracy@3   | 0.853      |
-| cosine_accuracy@5   | 0.8859     |
-| cosine_accuracy@10  | 0.9284     |
-| cosine_precision@1  | 0.742      |
-| cosine_precision@3  | 0.2843     |
-| cosine_precision@5  | 0.1772     |
-| cosine_precision@10 | 0.0928     |
-| cosine_recall@1     | 0.742      |
-| cosine_recall@3     | 0.853      |
-| cosine_recall@5     | 0.8859     |
-| cosine_recall@10    | 0.9284     |
-| cosine_ndcg@10      | 0.8335     |
-| cosine_mrr@10       | 0.8032     |
-| **cosine_map@100**  | **0.8057** |
 <!--
 ## Bias, Risks and Limitations
@@ -556,9 +556,9 @@ You can finetune this model on your own dataset.
 ### Training Dataset
-#### Unnamed Dataset
 * Size: 32,833 training samples
 * Columns: <code>positive</code> and <code>anchor</code>
 * Approximate statistics based on the first 1000 samples:
@@ -598,11 +598,11 @@ You can finetune this model on your own dataset.
 #### Non-Default Hyperparameters
 - `eval_strategy`: epoch
-- `per_device_train_batch_size`: 32
-- `per_device_eval_batch_size`: 16
-- `gradient_accumulation_steps`: 16
-- `learning_rate`: 0.0002
-- `num_train_epochs`: 5
 - `lr_scheduler_type`: cosine
 - `warmup_ratio`: 0.1
 - `bf16`: True
@@ -616,20 +616,20 @@ You can finetune this model on your own dataset.
 - `do_predict`: False
 - `eval_strategy`: epoch
 - `prediction_loss_only`: True
-- `per_device_train_batch_size`: 32
-- `per_device_eval_batch_size`: 16
 - `per_gpu_train_batch_size`: None
 - `per_gpu_eval_batch_size`: None
-- `gradient_accumulation_steps`: 16
 - `eval_accumulation_steps`: None
 - `torch_empty_cache_steps`: None
-- `learning_rate`: 0.0002
 - `weight_decay`: 0.0
 - `adam_beta1`: 0.9
 - `adam_beta2`: 0.999
 - `adam_epsilon`: 1e-08
 - `max_grad_norm`: 1.0
-- `num_train_epochs`: 5
 - `max_steps`: -1
 - `lr_scheduler_type`: cosine
 - `lr_scheduler_kwargs`: {}
@@ -727,52 +727,88 @@ You can finetune this model on your own dataset.
 </details>
 ### Training Logs
-| Epoch      | Step   | Training Loss | dim_128_cosine_map@100 | dim_256_cosine_map@100 | dim_512_cosine_map@100 | dim_64_cosine_map@100 | dim_768_cosine_map@100 |
-|:----------:|:------:|:-------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|:----------------------:|
-| 0.1558     | 10     | 0.7195        | -                      | -                      | -                      | -                     | -                      |
-| 0.3116     | 20     | 0.324         | -                      | -                      | -                      | -                     | -                      |
-| 0.4674     | 30     | 0.238         | -                      | -                      | -                      | -                     | -                      |
-| 0.6232     | 40     | 0.2265        | -                      | -                      | -                      | -                     | -                      |
-| 0.7790     | 50     | 0.1825        | -                      | -                      | -                      | -                     | -                      |
-| 0.9348     | 60     | 0.1938        | -                      | -                      | -                      | -                     | -                      |
-| **0.9971** | **64** | **-**         | **0.8054**             | **0.8198**             | **0.8276**             | **0.7796**            | **0.8329**             |
-| 1.0906     | 70     | 0.1397        | -                      | -                      | -                      | -                     | -                      |
-| 1.2463     | 80     | 0.0611        | -                      | -                      | -                      | -                     | -                      |
-| 1.4021     | 90     | 0.0506        | -                      | -                      | -                      | -                     | -                      |
-| 1.5579     | 100    | 0.047         | -                      | -                      | -                      | -                     | -                      |
-| 1.7137     | 110    | 0.0327        | -                      | -                      | -                      | -                     | -                      |
-| 1.8695     | 120    | 0.034         | -                      | -                      | -                      | -                     | -                      |
-| 1.9942     | 128    | -             | 0.8036                 | 0.8135                 | 0.8187                 | 0.7861                | 0.8243                 |
-| 2.0253     | 130    | 0.0319        | -                      | -                      | -                      | -                     | -                      |
-| 2.1811     | 140    | 0.0347        | -                      | -                      | -                      | -                     | -                      |
-| 2.3369     | 150    | 0.021         | -                      | -                      | -                      | -                     | -                      |
-| 2.4927     | 160    | 0.0169        | -                      | -                      | -                      | -                     | -                      |
-| 2.6485     | 170    | 0.0135        | -                      | -                      | -                      | -                     | -                      |
-| 2.8043     | 180    | 0.0123        | -                      | -                      | -                      | -                     | -                      |
-| 2.9601     | 190    | 0.0111        | -                      | -                      | -                      | -                     | -                      |
-| 2.9912     | 192    | -             | 0.8109                 | 0.8179                 | 0.8213                 | 0.7973                | 0.8264                 |
-| 3.1159     | 200    | 0.0083        | -                      | -                      | -                      | -                     | -                      |
-| 3.2717     | 210    | 0.0088        | -                      | -                      | -                      | -                     | -                      |
-| 3.4275     | 220    | 0.005         | -                      | -                      | -                      | -                     | -                      |
-| 3.5833     | 230    | 0.005         | -                      | -                      | -                      | -                     | -                      |
-| 3.7390     | 240    | 0.0043        | -                      | -                      | -                      | -                     | -                      |
-| 3.8948     | 250    | 0.0058        | -                      | -                      | -                      | -                     | -                      |
-| 3.9883     | 256    | -             | 0.8163                 | 0.8244                 | 0.8260                 | 0.8045                | 0.8287                 |
-| 4.0506     | 260    | 0.0057        | -                      | -                      | -                      | -                     | -                      |
-| 4.2064     | 270    | 0.0035        | -                      | -                      | -                      | -                     | -                      |
-| 4.3622     | 280    | 0.0033        | -                      | -                      | -                      | -                     | -                      |
-| 4.5180     | 290    | 0.0032        | -                      | -                      | -                      | -                     | -                      |
-| 4.6738     | 300    | 0.0031        | -                      | -                      | -                      | -                     | -                      |
-| 4.8296     | 310    | 0.0038        | -                      | -                      | -                      | -                     | -                      |
-| 4.9854     | 320    | 0.0042        | 0.8184                 | 0.8240                 | 0.8254                 | 0.8057                | 0.8302                 |
 * The bold row denotes the saved checkpoint.
 ### Framework Versions
 - Python: 3.12.5
-- Sentence Transformers: 3.0.1
 - Transformers: 4.44.2
-- PyTorch: 2.4.0
 - Accelerate: 0.33.0
 - Datasets: 2.21.0
 - Tokenizers: 0.19.1
@@ -797,7 +833,7 @@ You can finetune this model on your own dataset.
 #### MatryoshkaLoss
 ```bibtex
 @misc{kusupati2024matryoshka,
-    title={Matryoshka Representation Learning},
     author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
     year={2024},
     eprint={2205.13147},
@@ -809,7 +845,7 @@ You can finetune this model on your own dataset.
 #### MultipleNegativesRankingLoss
 ```bibtex
 @misc{henderson2017efficient,
-    title={Efficient Natural Language Response Suggestion for Smart Reply},
     author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
     year={2017},
     eprint={1705.00652},

 ---
 base_model: Alibaba-NLP/gte-base-en-v1.5
 language:
 - en
 library_name: sentence-transformers
   - What lessons can be learned from the historical context of employee relations
     in large corporations?
 model-index:
+- name: Alchemy Embedding - Anudit Nagar
   results:
   - task:
       type: information-retrieval
       type: dim_768
     metrics:
     - type: cosine_accuracy@1
+      value: 0.782012613106663
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
+      value: 0.8889498217713189
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
+      value: 0.9248697559638058
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
+      value: 0.9520153550863724
       name: Cosine Accuracy@10
     - type: cosine_precision@1
+      value: 0.782012613106663
       name: Cosine Precision@1
     - type: cosine_precision@3
+      value: 0.29631660725710623
       name: Cosine Precision@3
     - type: cosine_precision@5
+      value: 0.1849739511927612
       name: Cosine Precision@5
     - type: cosine_precision@10
+      value: 0.09520153550863725
       name: Cosine Precision@10
     - type: cosine_recall@1
+      value: 0.782012613106663
       name: Cosine Recall@1
     - type: cosine_recall@3
+      value: 0.8889498217713189
       name: Cosine Recall@3
     - type: cosine_recall@5
+      value: 0.9248697559638058
       name: Cosine Recall@5
     - type: cosine_recall@10
+      value: 0.9520153550863724
       name: Cosine Recall@10
     - type: cosine_ndcg@10
+      value: 0.867555587052628
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
+      value: 0.8402608580220322
       name: Cosine Mrr@10
     - type: cosine_map@100
+      value: 0.8422322227138224
       name: Cosine Map@100
   - task:
       type: information-retrieval
       type: dim_512
     metrics:
     - type: cosine_accuracy@1
+      value: 0.780367425281053
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
+      value: 0.8848368522072937
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
+      value: 0.9221277762544557
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
+      value: 0.9514669591445023
       name: Cosine Accuracy@10
     - type: cosine_precision@1
+      value: 0.780367425281053
       name: Cosine Precision@1
     - type: cosine_precision@3
+      value: 0.2949456174024312
       name: Cosine Precision@3
     - type: cosine_precision@5
+      value: 0.1844255552508912
       name: Cosine Precision@5
     - type: cosine_precision@10
+      value: 0.09514669591445023
       name: Cosine Precision@10
     - type: cosine_recall@1
+      value: 0.780367425281053
       name: Cosine Recall@1
     - type: cosine_recall@3
+      value: 0.8848368522072937
       name: Cosine Recall@3
     - type: cosine_recall@5
+      value: 0.9221277762544557
       name: Cosine Recall@5
     - type: cosine_recall@10
+      value: 0.9514669591445023
       name: Cosine Recall@10
     - type: cosine_ndcg@10
+      value: 0.8661558392165704
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
+      value: 0.838656038231032
       name: Cosine Mrr@10
     - type: cosine_map@100
+      value: 0.8405372438205077
       name: Cosine Map@100
   - task:
       type: information-retrieval
       type: dim_256
     metrics:
     - type: cosine_accuracy@1
+      value: 0.7754318618042226
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
+      value: 0.8804496846723334
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
+      value: 0.9169180148066904
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
+      value: 0.9468055936386071
       name: Cosine Accuracy@10
     - type: cosine_precision@1
+      value: 0.7754318618042226
       name: Cosine Precision@1
     - type: cosine_precision@3
+      value: 0.2934832282241111
       name: Cosine Precision@3
     - type: cosine_precision@5
+      value: 0.18338360296133807
       name: Cosine Precision@5
     - type: cosine_precision@10
+      value: 0.09468055936386072
       name: Cosine Precision@10
     - type: cosine_recall@1
+      value: 0.7754318618042226
       name: Cosine Recall@1
     - type: cosine_recall@3
+      value: 0.8804496846723334
       name: Cosine Recall@3
     - type: cosine_recall@5
+      value: 0.9169180148066904
       name: Cosine Recall@5
     - type: cosine_recall@10
+      value: 0.9468055936386071
       name: Cosine Recall@10
     - type: cosine_ndcg@10
+      value: 0.8613819477350178
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
+      value: 0.8338379881703168
       name: Cosine Mrr@10
     - type: cosine_map@100
+      value: 0.8360735900013385
       name: Cosine Map@100
   - task:
       type: information-retrieval
       type: dim_128
     metrics:
     - type: cosine_accuracy@1
+      value: 0.7617219632574719
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
+      value: 0.871675349602413
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
+      value: 0.9117082533589251
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
+      value: 0.9418700301617768
       name: Cosine Accuracy@10
     - type: cosine_precision@1
+      value: 0.7617219632574719
       name: Cosine Precision@1
     - type: cosine_precision@3
+      value: 0.2905584498674709
       name: Cosine Precision@3
     - type: cosine_precision@5
+      value: 0.18234165067178504
       name: Cosine Precision@5
     - type: cosine_precision@10
+      value: 0.09418700301617768
       name: Cosine Precision@10
     - type: cosine_recall@1
+      value: 0.7617219632574719
       name: Cosine Recall@1
     - type: cosine_recall@3
+      value: 0.871675349602413
       name: Cosine Recall@3
     - type: cosine_recall@5
+      value: 0.9117082533589251
       name: Cosine Recall@5
     - type: cosine_recall@10
+      value: 0.9418700301617768
       name: Cosine Recall@10
     - type: cosine_ndcg@10
+      value: 0.851649908463093
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
+      value: 0.8225671458602635
       name: Cosine Mrr@10
     - type: cosine_map@100
+      value: 0.8248455884524328
       name: Cosine Map@100
   - task:
       type: information-retrieval
       type: dim_64
     metrics:
     - type: cosine_accuracy@1
+      value: 0.7408829174664108
       name: Cosine Accuracy@1
     - type: cosine_accuracy@3
+      value: 0.853852481491637
       name: Cosine Accuracy@3
     - type: cosine_accuracy@5
+      value: 0.8936111872772141
       name: Cosine Accuracy@5
     - type: cosine_accuracy@10
+      value: 0.9292569234987661
       name: Cosine Accuracy@10
     - type: cosine_precision@1
+      value: 0.7408829174664108
       name: Cosine Precision@1
     - type: cosine_precision@3
+      value: 0.28461749383054563
       name: Cosine Precision@3
     - type: cosine_precision@5
+      value: 0.17872223745544283
       name: Cosine Precision@5
     - type: cosine_precision@10
+      value: 0.0929256923498766
       name: Cosine Precision@10
     - type: cosine_recall@1
+      value: 0.7408829174664108
       name: Cosine Recall@1
     - type: cosine_recall@3
+      value: 0.853852481491637
       name: Cosine Recall@3
     - type: cosine_recall@5
+      value: 0.8936111872772141
       name: Cosine Recall@5
     - type: cosine_recall@10
+      value: 0.9292569234987661
       name: Cosine Recall@10
     - type: cosine_ndcg@10
+      value: 0.8338956659320366
       name: Cosine Ndcg@10
     - type: cosine_mrr@10
+      value: 0.8033378162525404
       name: Cosine Mrr@10
     - type: cosine_map@100
+      value: 0.8057702637208689
       name: Cosine Map@100
 ---
+# Alchemy Embedding - Anudit Nagar
+This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [Alibaba-NLP/gte-base-en-v1.5](https://huggingface.co/Alibaba-NLP/gte-base-en-v1.5) on the json dataset. It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
 ## Model Details
 - **Maximum Sequence Length:** 8192 tokens
 - **Output Dimensionality:** 768 dimensions
 - **Similarity Function:** Cosine Similarity
+- **Training Dataset:**
+    - json
 - **Language:** en
 - **License:** apache-2.0
 | Metric              | Value      |
 |:--------------------|:-----------|
+| cosine_accuracy@1   | 0.782      |
+| cosine_accuracy@3   | 0.8889     |
+| cosine_accuracy@5   | 0.9249     |
+| cosine_accuracy@10  | 0.952      |
+| cosine_precision@1  | 0.782      |
+| cosine_precision@3  | 0.2963     |
+| cosine_precision@5  | 0.185      |
+| cosine_precision@10 | 0.0952     |
+| cosine_recall@1     | 0.782      |
+| cosine_recall@3     | 0.8889     |
+| cosine_recall@5     | 0.9249     |
+| cosine_recall@10    | 0.952      |
+| cosine_ndcg@10      | 0.8676     |
+| cosine_mrr@10       | 0.8403     |
+| **cosine_map@100**  | **0.8422** |
 #### Information Retrieval
 * Dataset: `dim_512`
 | Metric              | Value      |
 |:--------------------|:-----------|
+| cosine_accuracy@1   | 0.7804     |
+| cosine_accuracy@3   | 0.8848     |
+| cosine_accuracy@5   | 0.9221     |
+| cosine_accuracy@10  | 0.9515     |
+| cosine_precision@1  | 0.7804     |
+| cosine_precision@3  | 0.2949     |
+| cosine_precision@5  | 0.1844     |
+| cosine_precision@10 | 0.0951     |
+| cosine_recall@1     | 0.7804     |
+| cosine_recall@3     | 0.8848     |
+| cosine_recall@5     | 0.9221     |
+| cosine_recall@10    | 0.9515     |
+| cosine_ndcg@10      | 0.8662     |
+| cosine_mrr@10       | 0.8387     |
+| **cosine_map@100**  | **0.8405** |
 #### Information Retrieval
 * Dataset: `dim_256`
 * Evaluated with [<code>InformationRetrievalEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.InformationRetrievalEvaluator)
+| Metric              | Value      |
+|:--------------------|:-----------|
+| cosine_accuracy@1   | 0.7754     |
+| cosine_accuracy@3   | 0.8804     |
+| cosine_accuracy@5   | 0.9169     |
+| cosine_accuracy@10  | 0.9468     |
+| cosine_precision@1  | 0.7754     |
+| cosine_precision@3  | 0.2935     |
+| cosine_precision@5  | 0.1834     |
+| cosine_precision@10 | 0.0947     |
+| cosine_recall@1     | 0.7754     |
+| cosine_recall@3     | 0.8804     |
+| cosine_recall@5     | 0.9169     |
+| cosine_recall@10    | 0.9468     |
+| cosine_ndcg@10      | 0.8614     |
+| cosine_mrr@10       | 0.8338     |
+| **cosine_map@100**  | **0.8361** |
 #### Information Retrieval
 * Dataset: `dim_128`
 | Metric              | Value      |
 |:--------------------|:-----------|
+| cosine_accuracy@1   | 0.7617     |
+| cosine_accuracy@3   | 0.8717     |
+| cosine_accuracy@5   | 0.9117     |
+| cosine_accuracy@10  | 0.9419     |
+| cosine_precision@1  | 0.7617     |
+| cosine_precision@3  | 0.2906     |
+| cosine_precision@5  | 0.1823     |
+| cosine_precision@10 | 0.0942     |
+| cosine_recall@1     | 0.7617     |
+| cosine_recall@3     | 0.8717     |
+| cosine_recall@5     | 0.9117     |
+| cosine_recall@10    | 0.9419     |
+| cosine_ndcg@10      | 0.8516     |
+| cosine_mrr@10       | 0.8226     |
+| **cosine_map@100**  | **0.8248** |
 #### Information Retrieval
 * Dataset: `dim_64`
 | Metric              | Value      |
 |:--------------------|:-----------|
+| cosine_accuracy@1   | 0.7409     |
+| cosine_accuracy@3   | 0.8539     |
+| cosine_accuracy@5   | 0.8936     |
+| cosine_accuracy@10  | 0.9293     |
+| cosine_precision@1  | 0.7409     |
+| cosine_precision@3  | 0.2846     |
+| cosine_precision@5  | 0.1787     |
+| cosine_precision@10 | 0.0929     |
+| cosine_recall@1     | 0.7409     |
+| cosine_recall@3     | 0.8539     |
+| cosine_recall@5     | 0.8936     |
+| cosine_recall@10    | 0.9293     |
+| cosine_ndcg@10      | 0.8339     |
+| cosine_mrr@10       | 0.8033     |
+| **cosine_map@100**  | **0.8058** |
 <!--
 ## Bias, Risks and Limitations
 ### Training Dataset
+#### json
+* Dataset: json
 * Size: 32,833 training samples
 * Columns: <code>positive</code> and <code>anchor</code>
 * Approximate statistics based on the first 1000 samples:
 #### Non-Default Hyperparameters
 - `eval_strategy`: epoch
+- `per_device_train_batch_size`: 24
+- `per_device_eval_batch_size`: 24
+- `gradient_accumulation_steps`: 8
+- `learning_rate`: 2e-05
+- `num_train_epochs`: 4
 - `lr_scheduler_type`: cosine
 - `warmup_ratio`: 0.1
 - `bf16`: True
 - `do_predict`: False
 - `eval_strategy`: epoch
 - `prediction_loss_only`: True
+- `per_device_train_batch_size`: 24
+- `per_device_eval_batch_size`: 24
 - `per_gpu_train_batch_size`: None
 - `per_gpu_eval_batch_size`: None
+- `gradient_accumulation_steps`: 8
 - `eval_accumulation_steps`: None
 - `torch_empty_cache_steps`: None
+- `learning_rate`: 2e-05
 - `weight_decay`: 0.0
 - `adam_beta1`: 0.9
 - `adam_beta2`: 0.999
 - `adam_epsilon`: 1e-08
 - `max_grad_norm`: 1.0
+- `num_train_epochs`: 4
 - `max_steps`: -1
 - `lr_scheduler_type`: cosine
 - `lr_scheduler_kwargs`: {}
 </details>
 ### Training Logs
+| Epoch      | Step    | Training Loss | dim_128_cosine_map@100 | dim_256_cosine_map@100 | dim_512_cosine_map@100 | dim_64_cosine_map@100 | dim_768_cosine_map@100 |
+|:----------:|:-------:|:-------------:|:----------------------:|:----------------------:|:----------------------:|:---------------------:|:----------------------:|
+| 0.0584     | 10      | 0.8567        | -                      | -                      | -                      | -                     | -                      |
+| 0.1169     | 20      | 0.6549        | -                      | -                      | -                      | -                     | -                      |
+| 0.1753     | 30      | 0.5407        | -                      | -                      | -                      | -                     | -                      |
+| 0.2337     | 40      | 0.4586        | -                      | -                      | -                      | -                     | -                      |
+| 0.2922     | 50      | 0.3914        | -                      | -                      | -                      | -                     | -                      |
+| 0.3506     | 60      | 0.4104        | -                      | -                      | -                      | -                     | -                      |
+| 0.4091     | 70      | 0.299         | -                      | -                      | -                      | -                     | -                      |
+| 0.4675     | 80      | 0.2444        | -                      | -                      | -                      | -                     | -                      |
+| 0.5259     | 90      | 0.2367        | -                      | -                      | -                      | -                     | -                      |
+| 0.5844     | 100     | 0.2302        | -                      | -                      | -                      | -                     | -                      |
+| 0.6428     | 110     | 0.2356        | -                      | -                      | -                      | -                     | -                      |
+| 0.7012     | 120     | 0.1537        | -                      | -                      | -                      | -                     | -                      |
+| 0.7597     | 130     | 0.2043        | -                      | -                      | -                      | -                     | -                      |
+| 0.8181     | 140     | 0.1606        | -                      | -                      | -                      | -                     | -                      |
+| 0.8766     | 150     | 0.1896        | -                      | -                      | -                      | -                     | -                      |
+| 0.9350     | 160     | 0.1766        | -                      | -                      | -                      | -                     | -                      |
+| 0.9934     | 170     | 0.1259        | -                      | -                      | -                      | -                     | -                      |
+| 0.9993     | 171     | -             | 0.8115                 | 0.8233                 | 0.8321                 | 0.7829                | 0.8340                 |
+| 1.0519     | 180     | 0.1661        | -                      | -                      | -                      | -                     | -                      |
+| 1.1103     | 190     | 0.1632        | -                      | -                      | -                      | -                     | -                      |
+| 1.1687     | 200     | 0.1032        | -                      | -                      | -                      | -                     | -                      |
+| 1.2272     | 210     | 0.1037        | -                      | -                      | -                      | -                     | -                      |
+| 1.2856     | 220     | 0.0708        | -                      | -                      | -                      | -                     | -                      |
+| 1.3440     | 230     | 0.0827        | -                      | -                      | -                      | -                     | -                      |
+| 1.4025     | 240     | 0.0505        | -                      | -                      | -                      | -                     | -                      |
+| 1.4609     | 250     | 0.0468        | -                      | -                      | -                      | -                     | -                      |
+| 1.5194     | 260     | 0.0371        | -                      | -                      | -                      | -                     | -                      |
+| 1.5778     | 270     | 0.049         | -                      | -                      | -                      | -                     | -                      |
+| 1.6362     | 280     | 0.0527        | -                      | -                      | -                      | -                     | -                      |
+| 1.6947     | 290     | 0.0316        | -                      | -                      | -                      | -                     | -                      |
+| 1.7531     | 300     | 0.052         | -                      | -                      | -                      | -                     | -                      |
+| 1.8115     | 310     | 0.0298        | -                      | -                      | -                      | -                     | -                      |
+| 1.8700     | 320     | 0.0334        | -                      | -                      | -                      | -                     | -                      |
+| 1.9284     | 330     | 0.0431        | -                      | -                      | -                      | -                     | -                      |
+| 1.9869     | 340     | 0.0316        | -                      | -                      | -                      | -                     | -                      |
+| 1.9985     | 342     | -             | 0.8216                 | 0.8342                 | 0.8397                 | 0.8006                | 0.8408                 |
+| 2.0453     | 350     | 0.0275        | -                      | -                      | -                      | -                     | -                      |
+| 2.1037     | 360     | 0.0461        | -                      | -                      | -                      | -                     | -                      |
+| 2.1622     | 370     | 0.0341        | -                      | -                      | -                      | -                     | -                      |
+| 2.2206     | 380     | 0.0323        | -                      | -                      | -                      | -                     | -                      |
+| 2.2790     | 390     | 0.0205        | -                      | -                      | -                      | -                     | -                      |
+| 2.3375     | 400     | 0.0223        | -                      | -                      | -                      | -                     | -                      |
+| 2.3959     | 410     | 0.0189        | -                      | -                      | -                      | -                     | -                      |
+| 2.4543     | 420     | 0.0181        | -                      | -                      | -                      | -                     | -                      |
+| 2.5128     | 430     | 0.0144        | -                      | -                      | -                      | -                     | -                      |
+| 2.5712     | 440     | 0.0179        | -                      | -                      | -                      | -                     | -                      |
+| 2.6297     | 450     | 0.0217        | -                      | -                      | -                      | -                     | -                      |
+| 2.6881     | 460     | 0.016         | -                      | -                      | -                      | -                     | -                      |
+| 2.7465     | 470     | 0.0143        | -                      | -                      | -                      | -                     | -                      |
+| 2.8050     | 480     | 0.0193        | -                      | -                      | -                      | -                     | -                      |
+| 2.8634     | 490     | 0.0183        | -                      | -                      | -                      | -                     | -                      |
+| 2.9218     | 500     | 0.0171        | -                      | -                      | -                      | -                     | -                      |
+| 2.9803     | 510     | 0.0195        | -                      | -                      | -                      | -                     | -                      |
+| 2.9978     | 513     | -             | 0.8242                 | 0.8350                 | 0.8409                 | 0.8051                | 0.8413                 |
+| 3.0387     | 520     | 0.0127        | -                      | -                      | -                      | -                     | -                      |
+| 3.0972     | 530     | 0.0261        | -                      | -                      | -                      | -                     | -                      |
+| 3.1556     | 540     | 0.017         | -                      | -                      | -                      | -                     | -                      |
+| 3.2140     | 550     | 0.0198        | -                      | -                      | -                      | -                     | -                      |
+| 3.2725     | 560     | 0.0131        | -                      | -                      | -                      | -                     | -                      |
+| 3.3309     | 570     | 0.0156        | -                      | -                      | -                      | -                     | -                      |
+| 3.3893     | 580     | 0.0107        | -                      | -                      | -                      | -                     | -                      |
+| 3.4478     | 590     | 0.0123        | -                      | -                      | -                      | -                     | -                      |
+| 3.5062     | 600     | 0.0111        | -                      | -                      | -                      | -                     | -                      |
+| 3.5646     | 610     | 0.0112        | -                      | -                      | -                      | -                     | -                      |
+| 3.6231     | 620     | 0.0143        | -                      | -                      | -                      | -                     | -                      |
+| 3.6815     | 630     | 0.013         | -                      | -                      | -                      | -                     | -                      |
+| 3.7400     | 640     | 0.0105        | -                      | -                      | -                      | -                     | -                      |
+| 3.7984     | 650     | 0.0126        | -                      | -                      | -                      | -                     | -                      |
+| 3.8568     | 660     | 0.0118        | -                      | -                      | -                      | -                     | -                      |
+| 3.9153     | 670     | 0.0163        | -                      | -                      | -                      | -                     | -                      |
+| 3.9737     | 680     | 0.0187        | -                      | -                      | -                      | -                     | -                      |
+| **3.9971** | **684** | **-**         | **0.8248**             | **0.8361**             | **0.8405**             | **0.8058**            | **0.8422**             |
 * The bold row denotes the saved checkpoint.
 ### Framework Versions
 - Python: 3.12.5
+- Sentence Transformers: 3.1.1
 - Transformers: 4.44.2
+- PyTorch: 2.4.1
 - Accelerate: 0.33.0
 - Datasets: 2.21.0
 - Tokenizers: 0.19.1
 #### MatryoshkaLoss
 ```bibtex
 @misc{kusupati2024matryoshka,
+    title={Matryoshka Representation Learning},
     author={Aditya Kusupati and Gantavya Bhatt and Aniket Rege and Matthew Wallingford and Aditya Sinha and Vivek Ramanujan and William Howard-Snyder and Kaifeng Chen and Sham Kakade and Prateek Jain and Ali Farhadi},
     year={2024},
     eprint={2205.13147},
 #### MultipleNegativesRankingLoss
 ```bibtex
 @misc{henderson2017efficient,
+    title={Efficient Natural Language Response Suggestion for Smart Reply},
     author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
     year={2017},
     eprint={1705.00652},

config_sentence_transformers.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "__version__": {
-    "sentence_transformers": "3.0.1",
     "transformers": "4.44.2",
-    "pytorch": "2.4.0"
   },
   "prompts": {},
   "default_prompt_name": null,

 {
   "__version__": {
+    "sentence_transformers": "3.1.1",
     "transformers": "4.44.2",
+    "pytorch": "2.4.1"
   },
   "prompts": {},
   "default_prompt_name": null,

model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:905ef4cf9bbd19190b586e4dc4173774b01b619eb4f4ab5fa233fb5dfc725472
 size 555896347

 version https://git-lfs.github.com/spec/v1
+oid sha256:50557ba011052514c2e8d048257176d199c9b609b15d5c39dfe8a18383aadb60
 size 555896347

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aa8280e8c799e0e3acd77f0263ef9df6449c601d630fdd734bf422c5f5352daf
 size 547119128

 version https://git-lfs.github.com/spec/v1
+oid sha256:6d13bedb560025363d482eb733dc9f18a0bfe5b342490240b9e9faabccf22983
 size 547119128

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e93f7b36897bd6605d5c5db5bd2469f5e524cc3d49234bbcc23e781c26404414
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:5d2ca4f4a8289d13a34ff02bc7fb1d07d6772ee0b83178f7a016e3de1e0ba45e
 size 5496