Training in progress, step 1000, checkpoint

Files changed (5) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ce2bcaf1ce585a953de36656872e26fe6947647ba2dce7f82249c3b5b8000d54
 size 242041896

 version https://git-lfs.github.com/spec/v1
+oid sha256:07d271253ad7eddb3db134bdc96bf72b6fb29b6eb89123849a14c7282a602b17
 size 242041896

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ace46838efb8f53b6941f219d589ae0fd1380a0a93380ddf76e4d388f0197619
 size 484163514

 version https://git-lfs.github.com/spec/v1
+oid sha256:c0be3c6f687e594da8e7c05affb0a3216e74ada978a190ce6a966734a0423ef4
 size 484163514

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:db0a075208dd3cb3b7f7fd9174ec727b26bed33bf0a8454e702c3a907c5e0811
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:eeef5a5cd399c2cfa96c423b188489f80b820a820435147acbd8127820b7b621
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b0a1a5cbb746068357eb0cf9177889b6b2d8490ed0583c85fd890df79b00500c
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c5235b2e87f9d721a92e0318f55cf82a1eb4118f0ef4f59ca28e5b517cde92c
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.0767341927562922,
   "eval_steps": 500,
-  "global_step": 500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -13,13 +13,19 @@
       "learning_rate": 0.0009846531614487416,
       "loss": 0.5762,
       "step": 500
     }
   ],
   "logging_steps": 500,
   "max_steps": 32580,
   "num_train_epochs": 5,
   "save_steps": 500,
-  "total_flos": 265536385056768.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.1534683855125844,
   "eval_steps": 500,
+  "global_step": 1000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.0009846531614487416,
       "loss": 0.5762,
       "step": 500
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 0.0009693063228974831,
+      "loss": 0.6042,
+      "step": 1000
     }
   ],
   "logging_steps": 500,
   "max_steps": 32580,
   "num_train_epochs": 5,
   "save_steps": 500,
+  "total_flos": 529584010297344.0,
   "trial_name": null,
   "trial_params": null
 }