masatochi commited on
Commit
37d72a0
·
verified ·
1 Parent(s): fb09ce7

Training in progress, step 55, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb3562d2376c7e44e807e75a251bfe4e20a8bbb1d2473548015437b6b53b8be3
3
  size 83945296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e0b256324c77b74ce7cf35a934a1dea4cf2f1c4e901640287d88f57a3f16226
3
  size 83945296
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a568b5ae0096ae42229e78a73ab2eb0dffab5c441bf57831500fe90f81243a04
3
  size 43122580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54788bd57376a0ecc9872c34fed24cc6327e9699d90ddaa7ba48b2e34adcbf9a
3
  size 43122580
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e6a3dd563025f97e8d76541a82675dcf5abbc55aa6acc033ab4e92d8fbe7d5d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:501917edc59cb38fa8ba673663fd0069ec90987aba1d4647ea54c9fb6fe18e47
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6c6ef871b14e9c2b6e6517244b08d50c3b172209dbf2c7f2f35e5b70f657975
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61487aeef4449a4dec50f3ae9ec76bca52908878863009a40746a21c237f51ad
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.024451372333272204,
5
  "eval_steps": 34,
6
- "global_step": 50,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -373,6 +373,41 @@
373
  "learning_rate": 0.00019324722294043558,
374
  "loss": 1.0124,
375
  "step": 50
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
376
  }
377
  ],
378
  "logging_steps": 1,
@@ -392,7 +427,7 @@
392
  "attributes": {}
393
  }
394
  },
395
- "total_flos": 2.219477097775104e+17,
396
  "train_batch_size": 3,
397
  "trial_name": null,
398
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.026896509566599426,
5
  "eval_steps": 34,
6
+ "global_step": 55,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
373
  "learning_rate": 0.00019324722294043558,
374
  "loss": 1.0124,
375
  "step": 50
376
+ },
377
+ {
378
+ "epoch": 0.024940399779937648,
379
+ "grad_norm": 0.2487930953502655,
380
+ "learning_rate": 0.00019256376597815564,
381
+ "loss": 0.9894,
382
+ "step": 51
383
+ },
384
+ {
385
+ "epoch": 0.02542942722660309,
386
+ "grad_norm": 0.39657795429229736,
387
+ "learning_rate": 0.00019184869857459232,
388
+ "loss": 1.138,
389
+ "step": 52
390
+ },
391
+ {
392
+ "epoch": 0.02591845467326854,
393
+ "grad_norm": 0.5362446308135986,
394
+ "learning_rate": 0.00019110226492460885,
395
+ "loss": 1.0342,
396
+ "step": 53
397
+ },
398
+ {
399
+ "epoch": 0.026407482119933982,
400
+ "grad_norm": 0.5089200139045715,
401
+ "learning_rate": 0.0001903247199346129,
402
+ "loss": 1.1193,
403
+ "step": 54
404
+ },
405
+ {
406
+ "epoch": 0.026896509566599426,
407
+ "grad_norm": 0.28259485960006714,
408
+ "learning_rate": 0.00018951632913550626,
409
+ "loss": 0.9054,
410
+ "step": 55
411
  }
412
  ],
413
  "logging_steps": 1,
 
427
  "attributes": {}
428
  }
429
  },
430
+ "total_flos": 2.4414248075526144e+17,
431
  "train_batch_size": 3,
432
  "trial_name": null,
433
  "trial_params": null