End of training

Files changed (6) hide show

README.md CHANGED Viewed

@@ -15,7 +15,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [eugenesiow/bart-paraphrase](https://huggingface.co/eugenesiow/bart-paraphrase) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.7935
 ## Model description
@@ -35,11 +35,11 @@ More information needed
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
-- train_batch_size: 16
-- eval_batch_size: 16
 - seed: 42
 - gradient_accumulation_steps: 2
-- total_train_batch_size: 32
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
@@ -47,11 +47,11 @@ The following hyperparameters were used during training:
 ### Training results
-| Training Loss | Epoch | Step | Validation Loss |
-|:-------------:|:-----:|:----:|:---------------:|
-| 4.1212        | 1.0   | 187  | 3.4982          |
-| 2.8867        | 2.0   | 374  | 2.3374          |
-| 2.2427        | 3.0   | 561  | 1.7548          |
 ### Framework versions

 This model is a fine-tuned version of [eugenesiow/bart-paraphrase](https://huggingface.co/eugenesiow/bart-paraphrase) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 3.3337
 ## Model description
 The following hyperparameters were used during training:
 - learning_rate: 2e-05
+- train_batch_size: 32
+- eval_batch_size: 32
 - seed: 42
 - gradient_accumulation_steps: 2
+- total_train_batch_size: 64
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
 ### Training results
+| Training Loss | Epoch  | Step | Validation Loss |
+|:-------------:|:------:|:----:|:---------------:|
+| 5.2622        | 0.9968 | 154  | 4.8920          |
+| 4.4409        | 2.0    | 309  | 3.8232          |
+| 3.8001        | 2.9903 | 462  | 3.2888          |
 ### Framework versions

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33c9486e8d903ee43bc2221289cfff29d979bd726dd42c0a4cc2ac767446a109
 size 1625426996

 version https://git-lfs.github.com/spec/v1
+oid sha256:5752e548c1e4f7ef8deba4be3cd81e7069c939ee0c2bf600a386c98da0120973
 size 1625426996

special_tokens_map.json CHANGED Viewed

@@ -1,7 +1,25 @@
 {
-  "bos_token": "<s>",
-  "cls_token": "<s>",
-  "eos_token": "</s>",
   "mask_token": {
     "content": "<mask>",
     "lstrip": true,
@@ -9,7 +27,25 @@
     "rstrip": false,
     "single_word": false
   },
-  "pad_token": "<pad>",
-  "sep_token": "</s>",
-  "unk_token": "<unk>"
 }

 {
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "cls_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "mask_token": {
     "content": "<mask>",
     "lstrip": true,
     "rstrip": false,
     "single_word": false
   },
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
 }

tokenizer_config.json CHANGED Viewed

@@ -48,10 +48,9 @@
   "eos_token": "</s>",
   "errors": "replace",
   "mask_token": "<mask>",
-  "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "sep_token": "</s>",
   "tokenizer_class": "BartTokenizer",
-  "trim_offsets": true,
   "unk_token": "<unk>"
 }

   "eos_token": "</s>",
   "errors": "replace",
   "mask_token": "<mask>",
+  "model_max_length": 1024,
   "pad_token": "<pad>",
   "sep_token": "</s>",
   "tokenizer_class": "BartTokenizer",
   "unk_token": "<unk>"
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2ac0b7cf3cf74e5bdfb57541f92de3816a8163161438428d48f5437117cdf4fd
 size 4920

 version https://git-lfs.github.com/spec/v1
+oid sha256:4f4a9d90b024e60cf38f5d53c1d4213acadc99707cb5b7712469951525ad4fb0
 size 4920

vocab.json CHANGED Viewed

The diff for this file is too large to render. See raw diff