youdiniplays committed on
Commit
1cb5b20
·
verified ·
1 Parent(s): 52e006d

Training in progress, step 25000, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00cb98eb1da63ba4189d4b55310bd43816969d50531865b7774f8fdcf202af6a
3
  size 242041896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4a556b743de53b81786a2c97c189b8ab38eaa9b1b15213d74592f6e5df0ee9b
3
  size 242041896
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1827f3ba86066e05a7c8d0cf70bf3fefd44d3648c1da02dcd8f3c00a2aece1c
3
  size 484163514
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07f36edfb9a4f724f199b1d822cf88054f24aa8663e46816caef2402d04ec3c8
3
  size 484163514
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76200746e0093b7cc6d3809d80c9ea53532cb8fe856e4e289194263f281b138c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4466b7aec0280a011a8c4d08d66796961b3a1f1e19e62b4a4a1b3bce38987c6c
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb4ff7878a46fca2f7284f626205121313e31cd4872637223f000f97e21368d0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3237be099a38adc6de0eebdf22fb3fe78ade2edb6a766c16e20254df2789831
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.759975445058318,
5
  "eval_steps": 500,
6
- "global_step": 24500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -331,13 +331,19 @@
331
  "learning_rate": 0.0002483118477593616,
332
  "loss": 0.4896,
333
  "step": 24500
 
 
 
 
 
 
334
  }
335
  ],
336
  "logging_steps": 500,
337
  "max_steps": 32580,
338
  "num_train_epochs": 5,
339
  "save_steps": 500,
340
- "total_flos": 1.2986967867260928e+16,
341
  "trial_name": null,
342
  "trial_params": null
343
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.83670963781461,
5
  "eval_steps": 500,
6
+ "global_step": 25000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
331
  "learning_rate": 0.0002483118477593616,
332
  "loss": 0.4896,
333
  "step": 24500
334
+ },
335
+ {
336
+ "epoch": 3.84,
337
+ "learning_rate": 0.00023296500920810313,
338
+ "loss": 0.4832,
339
+ "step": 25000
340
  }
341
  ],
342
  "logging_steps": 500,
343
  "max_steps": 32580,
344
  "num_train_epochs": 5,
345
  "save_steps": 500,
346
+ "total_flos": 1.325300755464192e+16,
347
  "trial_name": null,
348
  "trial_params": null
349
  }