Training in progress, step 6000, checkpoint

Files changed (15) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:43404aa4801c8a8f07d44770fc0ae19c928ca84485064b608bdf6cb0e8d9347a
 size 2384440

 version https://git-lfs.github.com/spec/v1
+oid sha256:85b422ee3958e189a80805f9f965a72c206d8049b9f09de490eb890e2ce1a613
 size 2384440

last-checkpoint/global_step6000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:215d9ebee4db7ada43a179c37480a4bb6ffbea5b9f9ce3b025332cd422ca8aed
+size 3621285613

last-checkpoint/global_step6000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:f9117bd105c2a585b2a71bbe1fcda5b458785ca444cd771b854037d5c59462f2
+size 3542398

last-checkpoint/global_step6000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:34be61ca15897765094e0bff9d07430873d7c70d342a48934b5c437669d8c841
+size 3621285613

last-checkpoint/global_step6000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:84aadcdf820229bbb8699d3323272ce296cd085e451274879eed9f343aaa89fb
+size 3542398

last-checkpoint/global_step6000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e4d0a486549934eb96c39e9240b40dc232e759778eb47182c4b6c7410a98d3b5
+size 3621285613

last-checkpoint/global_step6000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:49307bef2bd400cf814aa71b5ea9ae7c5f457dae70a4151a7ba191ad05beb921
+size 3542398

last-checkpoint/global_step6000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bb775385db2832cb91fd59cf72dbd16be582202bd50ed16f73a84a5e10358a2
+size 3621285613

last-checkpoint/global_step6000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:6e25d262deca190648b50b5dc7b37900e05fac39325115fc6ecf745071c968f0
+size 3542398

last-checkpoint/latest CHANGED Viewed

	@@ -1 +1 @@
1	- ~~global_step5000~~


1	+ global_step6000

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bbc46a1b44d90304fa6c2d97e45a09ff9ca39e2f158513357c6cbafadd965846
 size 17655

 version https://git-lfs.github.com/spec/v1
+oid sha256:d32349f4b48b9fb4729a79147fd7b83d66f0d4c2474b9f1e25ff4d1f056ed81b
 size 17655

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:12bd87b02d242431882456ba54feb929c619932428f827859ffa31f8595a6685
 size 17655

 version https://git-lfs.github.com/spec/v1
+oid sha256:c3b1142fca547114f3d0a445f9800567d556596ee89ff6a986d92b5245f0dd93
 size 17655

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:60503c24da7903188168982879429796e990d5059867cd1ae5b5ed86b0aa3966
 size 17655

 version https://git-lfs.github.com/spec/v1
+oid sha256:93cde37cb441ecff6612fae913672d7d9b71d9755e386684e5be26f202a20f4d
 size 17655

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5fc535ca2f5c6f4069ade15a885ef339906847e85c537ee37acb74a1c28d19da
 size 17655

 version https://git-lfs.github.com/spec/v1
+oid sha256:d5a1d857da05e0f9f6ddfb61aacc0dff2f758b31c8fb47768b2dafe568cfc92d
 size 17655

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.9093041438623923,
   "eval_steps": 500,
-  "global_step": 5000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -37,13 +37,19 @@
       "learning_rate": 0.0001,
       "loss": 0.4379,
       "step": 5000
     }
   ],
   "logging_steps": 1000,
   "max_steps": 12790,
   "num_train_epochs": 10,
   "save_steps": 1000,
-  "total_flos": 36500817838080.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 4.691164972634871,
   "eval_steps": 500,
+  "global_step": 6000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.0001,
       "loss": 0.4379,
       "step": 5000
+    },
+    {
+      "epoch": 4.69,
+      "learning_rate": 0.0001,
+      "loss": 0.4208,
+      "step": 6000
     }
   ],
   "logging_steps": 1000,
   "max_steps": 12790,
   "num_train_epochs": 10,
   "save_steps": 1000,
+  "total_flos": 43787607343104.0,
   "trial_name": null,
   "trial_params": null
 }