Training in progress, step 12446, checkpoint

Files changed (5) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc17b6495b052823943dcb01863a50fe4f5d7f7748278302ad90585df253899e
 size 3055544304

 version https://git-lfs.github.com/spec/v1
+oid sha256:560a3733f4bbb77c7facbd8e1fcbec09c47c91778df2706dfaa878b1dab0a8ff
 size 3055544304

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0ab8ebd8defbea51e1f1e6049bedc94c98cdcdf84c3477f6aae01a1b0a708ed0
 size 6099375168

 version https://git-lfs.github.com/spec/v1
+oid sha256:4a221df9a99724f5892178dc1aee259955a08a1659f7a165bd00b016ef52a032
 size 6099375168

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0e3865541adb0192a23dd785d3972183d6f068ebb2ff816b3a16420ce3f5e1aa
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:0b9afb76df39f158a5e48a47e5fd99ff76fe61548f70cccfae2931dd44ced886
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a1da51795904dee109014b2c85b0e607cd48a08f83296b5cdda09bb8cdd64804
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:99cc361e445085ab266b15edad9fa18a2afe08322b075eb52cc3dd62210b622c
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 4.682127039146104,
   "best_model_checkpoint": "./whisper-medium-ur/checkpoint-11000",
-  "epoch": 0.9641264612541678,
   "eval_steps": 1000,
-  "global_step": 12000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -955,6 +955,34 @@
       "eval_steps_per_second": 0.222,
       "eval_wer": 4.687628951060494,
       "step": 12000
     }
   ],
   "logging_steps": 100,
@@ -978,12 +1006,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 1.9595614224384e+20,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": 4.682127039146104,
   "best_model_checkpoint": "./whisper-medium-ur/checkpoint-11000",
+  "epoch": 0.9999598280641144,
   "eval_steps": 1000,
+  "global_step": 12446,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.222,
       "eval_wer": 4.687628951060494,
       "step": 12000
+    },
+    {
+      "epoch": 0.9721608484312859,
+      "grad_norm": 2.960160493850708,
+      "learning_rate": 2.946593001841621e-07,
+      "loss": 0.2245,
+      "step": 12100
+    },
+    {
+      "epoch": 0.9801952356084039,
+      "grad_norm": 1.555345892906189,
+      "learning_rate": 2.109492717227524e-07,
+      "loss": 0.2078,
+      "step": 12200
+    },
+    {
+      "epoch": 0.9882296227855221,
+      "grad_norm": 6.304783821105957,
+      "learning_rate": 1.2723924326134273e-07,
+      "loss": 0.2169,
+      "step": 12300
+    },
+    {
+      "epoch": 0.9962640099626401,
+      "grad_norm": 2.4615955352783203,
+      "learning_rate": 4.352921479993303e-08,
+      "loss": 0.2152,
+      "step": 12400
     }
   ],
   "logging_steps": 100,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 2.0323917886390272e+20,
   "train_batch_size": 8,
   "trial_name": null,
   "trial_params": null