ma2za committed on
Commit
e738a42
·
1 Parent(s): 929e3ab

Training in progress, step 1200

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aafda980146253cd7b82b0dd2e2a1211ce96ed9fccbf804597a542c6abfab59e
3
  size 2117841669
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a9981820a9caf110a2c23b1da7d2f536b1f8f699f5738297c09d21fa04033cd
3
  size 2117841669
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:925941313b310518092ca4c0ce765c6ed1e75d6a07a200cdf61def1fa48fdef8
3
  size 2268273785
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d679cbd4839c4e29030e2274bb779823a88f1e2495ada8acbb79a08c2895666c
3
  size 2268273785
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a45a08059f2351fc7b31a0c40f1b65158be9ff667b5b2468faf63f546d65222b
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47f0b09a8b590ae907b4d8a8ecfba9db2fa39c863f8584cdbf7a96552440f68a
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90b1e78b64b76d121ce0a17312e4bc1a4adeafa3fb2ee51db16618bc84d92166
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2b5a6185254ac5883361938b853934daa886e8ffec96c4edd0064efe70ce735
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.06295907660020986,
5
- "global_step": 600,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -22,11 +22,27 @@
22
  "eval_samples_per_second": 190.071,
23
  "eval_steps_per_second": 0.743,
24
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
  "max_steps": 953000,
28
  "num_train_epochs": 100,
29
- "total_flos": 2.544857570206464e+16,
30
  "trial_name": null,
31
  "trial_params": null
32
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.1259181532004197,
5
+ "global_step": 1200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
22
  "eval_samples_per_second": 190.071,
23
  "eval_steps_per_second": 0.743,
24
  "step": 600
25
+ },
26
+ {
27
+ "epoch": 0.1,
28
+ "learning_rate": 9.989517313746065e-06,
29
+ "loss": 1.5882,
30
+ "step": 1000
31
+ },
32
+ {
33
+ "epoch": 0.13,
34
+ "eval_accuracy": 0.4599964585577476,
35
+ "eval_f1": 0.38184708517142385,
36
+ "eval_loss": 1.539364218711853,
37
+ "eval_runtime": 713.8848,
38
+ "eval_samples_per_second": 189.86,
39
+ "eval_steps_per_second": 0.742,
40
+ "step": 1200
41
  }
42
  ],
43
  "max_steps": 953000,
44
  "num_train_epochs": 100,
45
+ "total_flos": 5.046794543497728e+16,
46
  "trial_name": null,
47
  "trial_params": null
48
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:925941313b310518092ca4c0ce765c6ed1e75d6a07a200cdf61def1fa48fdef8
3
  size 2268273785
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d679cbd4839c4e29030e2274bb779823a88f1e2495ada8acbb79a08c2895666c
3
  size 2268273785