Training in progress, step 39, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dfe2fb418afccaf64c1013ab63252ae75ed038bd4282a446118b3bf60fab6ea7
 size 25192496

 version https://git-lfs.github.com/spec/v1
+oid sha256:3a4b1b9f92f2c3f801f4027f95d4c80de298a5b2d3de9cb507f8ca53cd4a14b9
 size 25192496

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2969e162bbaff7f0a99ac88fe368121d9e90b20e296928c80a039efae1319837
 size 13005178

 version https://git-lfs.github.com/spec/v1
+oid sha256:33d7c08a12c11dc5458f94a3d6b41ab1d6f9cc1aedc689cdcee6f067d4e7d658
 size 13005178

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a96ec98b03d2103c39025046aa0a135811765566c4aedce7d9cac444d8384b2d
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:1c7830ee97fa51bd1d743895da89276028ce6a6b88f43103020645687fd0ef70
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:37841e69eda911caeb33edeefa0b2f140e72dcce247aeb757b2fe89c00d7887b
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c50dbaa792cda4a28fbbc2acb2a3e03c59530712bbc5107212d33064d193da4
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.0004314761879078798,
   "eval_steps": 10,
-  "global_step": 26,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -66,6 +66,28 @@
       "learning_rate": 6.91341716182545e-05,
       "loss": 0.9362,
       "step": 25
     }
   ],
   "logging_steps": 5,
@@ -85,7 +107,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 783752468889600.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.0006472142818618197,
   "eval_steps": 10,
+  "global_step": 39,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 6.91341716182545e-05,
       "loss": 0.9362,
       "step": 25
+    },
+    {
+      "epoch": 0.0004978571398937075,
+      "grad_norm": 7.281345844268799,
+      "learning_rate": 5e-05,
+      "loss": 0.5976,
+      "step": 30
+    },
+    {
+      "epoch": 0.0004978571398937075,
+      "eval_loss": 0.12552273273468018,
+      "eval_runtime": 689.2345,
+      "eval_samples_per_second": 36.812,
+      "eval_steps_per_second": 18.406,
+      "step": 30
+    },
+    {
+      "epoch": 0.0005808333298759921,
+      "grad_norm": 5.342987060546875,
+      "learning_rate": 3.086582838174551e-05,
+      "loss": 0.488,
+      "step": 35
     }
   ],
   "logging_steps": 5,
       "attributes": {}
     }
   },
+  "total_flos": 1179360857948160.0,
   "train_batch_size": 2,
   "trial_name": null,
   "trial_params": null