Training in progress, step 10, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1623d6b3a59c7a32c66f828a169ca71f7b735b77b2c6a27858726a06327cfc22
 size 130583912

 version https://git-lfs.github.com/spec/v1
+oid sha256:d757243f503344b7811431b04ed26faa173948ed9e56ea963ca55e8e7e4bc03b
 size 130583912

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cf789c0a027087f7c384511e444dce2b20eb558b0d64f3b76f6360736ca67bb3
 size 66578772

 version https://git-lfs.github.com/spec/v1
+oid sha256:0cfc89fc11ed4c15cb339f27a6743d01d0200f8327c89f05ae72c424ab687e25
 size 66578772

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8d63289c5d04f2383b71ba99ab7652862b29466628d679a7f2b02d0fcdcc4da0
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:8bf6413e852be2cf688208c1704f913e5832da44d4c80b17ec9583f98fb0864c
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:93154ab653dd9adc62e305cb44be3d4cf8f6f7370124d22ce262388fdd3f16b5
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:1e4e1e3668e91b54a58da1ce6f5c7e6b1553629081e2ee6e6ec89e9df4de7128
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:edad8284ff84b94ec708b9eb257b9d770d3adef066494f245cf2c51dc659164b
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:dabebd1c16ad1482a9b6ac36cbcd94d2fb8623833ce700c649442aab5592f63c
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f9c8dbb46a9a74fc09c0eb4d787c118be17c860af785749c012382f79fbc9121
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:422a5e7e7660c4a9fddfbb53556696d7909d580ade84163abb00a59311819365
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:009402242046e588b30763e69f21be1c7fde9c10c17467c4a20db57ff0c78e87
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:eb732cb1b72b02838d9caad609515135e7638548c69ee64a18f63b8eef2b048f
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1ba0c0bd9979cfe74fa236eb5a2e4c12f3ea24dd8cbe5225eb3f303941c44c3c
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb63466a5bcf657473f2d960e277d4cbcc0a9c4a1e451be5d373a79f8fc4196f
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:33bf9a4ef7c0b20ceeaa1cbd1bacae415bdb21876893a2072dc934f8a9da7b5d
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:61e5883f037f93f02b6a025b5cb7d945d09d8e29f914292c468c9e4e008a85ce
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:75a57d3dbd028d4822c84de2623c8b1fedf5f921d0a089d23fb7b9b24235a874
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:f387686327168eef8043d717153998c55445f4ab3f6ae746687ee9f06afb96ec
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8bdda546a1390be3b85a90dd4ef31050dfb7b691765ffc12ed691b6786ed6e3d
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:26a93b2a1f4b5368650119fe6e0d6eec6d19cda6badeba4d21943ab48964fa00
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.18,
   "eval_steps": 3,
-  "global_step": 9,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -102,6 +102,13 @@
       "eval_samples_per_second": 28.601,
       "eval_steps_per_second": 3.745,
       "step": 9
     }
   ],
   "logging_steps": 1,
@@ -116,12 +123,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 4.713086603545805e+16,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.2,
   "eval_steps": 3,
+  "global_step": 10,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 28.601,
       "eval_steps_per_second": 3.745,
       "step": 9
+    },
+    {
+      "epoch": 0.2,
+      "grad_norm": 48.75463104248047,
+      "learning_rate": 0.00016,
+      "loss": 8.6251,
+      "step": 10
     }
   ],
   "logging_steps": 1,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 5.236762892828672e+16,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null