besimray committed on
Commit
bfad8db
·
verified ·
1 Parent(s): 29afcdf

Training in progress, step 20, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95b67ddad24a5888e91bf681c83298eee26617a5578138ced45888ba6be330fc
3
  size 59827904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47b7ebf2902b2a07f7ea2535994bdad3615a8f0ab4563e45a903f02b32f57283
3
  size 59827904
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c73bc72debf386e2c36c561a99ca71c87d00c275123b07d8008bc462049f466
3
  size 30875540
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf786dd14b0811f274964d9a68546892677186e3507a506e1825106470480916
3
  size 30875540
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10e42003eeaa7e3634e469fed070b1b1d3ecaaf8edad837bd4893e0c7415da96
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdf01e2f573e4c0a520091ab55a625babf975c24160921fd3cf96006054217ee
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:afbddc242ced46f745f057a8ae6c242cb208cc8c07c450e2e13f98a4e78227eb
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1bd5e0b1abc9327c71d57aae52a46f7c0ab15b77158b2f2fa6d9b1a513a5267
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 9.236889839172363,
3
  "best_model_checkpoint": "miner_id_besimray/checkpoint-5",
4
- "epoch": 0.003056234718826406,
5
  "eval_steps": 5,
6
- "global_step": 15,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -144,6 +144,49 @@
144
  "eval_samples_per_second": 3.065,
145
  "eval_steps_per_second": 0.307,
146
  "step": 15
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
147
  }
148
  ],
149
  "logging_steps": 1,
@@ -158,7 +201,7 @@
158
  "early_stopping_threshold": 0.0
159
  },
160
  "attributes": {
161
- "early_stopping_patience_counter": 2
162
  }
163
  },
164
  "TrainerControl": {
@@ -167,12 +210,12 @@
167
  "should_evaluate": false,
168
  "should_log": false,
169
  "should_save": true,
170
- "should_training_stop": false
171
  },
172
  "attributes": {}
173
  }
174
  },
175
- "total_flos": 1.37779979747328e+16,
176
  "train_batch_size": 10,
177
  "trial_name": null,
178
  "trial_params": null
 
1
  {
2
  "best_metric": 9.236889839172363,
3
  "best_model_checkpoint": "miner_id_besimray/checkpoint-5",
4
+ "epoch": 0.004074979625101874,
5
  "eval_steps": 5,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
144
  "eval_samples_per_second": 3.065,
145
  "eval_steps_per_second": 0.307,
146
  "step": 15
147
+ },
148
+ {
149
+ "epoch": 0.0032599837000814994,
150
+ "grad_norm": 1.3874351302323995e+19,
151
+ "learning_rate": 1.9999982199133416e-05,
152
+ "loss": 8.5286,
153
+ "step": 16
154
+ },
155
+ {
156
+ "epoch": 0.0034637326813365932,
157
+ "grad_norm": 9.607972408157798e+18,
158
+ "learning_rate": 1.9999975771045303e-05,
159
+ "loss": 7.7833,
160
+ "step": 17
161
+ },
162
+ {
163
+ "epoch": 0.003667481662591687,
164
+ "grad_norm": Infinity,
165
+ "learning_rate": 1.9999968354022266e-05,
166
+ "loss": 10.4327,
167
+ "step": 18
168
+ },
169
+ {
170
+ "epoch": 0.003871230643846781,
171
+ "grad_norm": Infinity,
172
+ "learning_rate": 1.999995994806504e-05,
173
+ "loss": 8.3376,
174
+ "step": 19
175
+ },
176
+ {
177
+ "epoch": 0.004074979625101874,
178
+ "grad_norm": Infinity,
179
+ "learning_rate": 1.999995055317446e-05,
180
+ "loss": 9.8773,
181
+ "step": 20
182
+ },
183
+ {
184
+ "epoch": 0.004074979625101874,
185
+ "eval_loss": 9.251687049865723,
186
+ "eval_runtime": 841.2776,
187
+ "eval_samples_per_second": 3.07,
188
+ "eval_steps_per_second": 0.308,
189
+ "step": 20
190
  }
191
  ],
192
  "logging_steps": 1,
 
201
  "early_stopping_threshold": 0.0
202
  },
203
  "attributes": {
204
+ "early_stopping_patience_counter": 3
205
  }
206
  },
207
  "TrainerControl": {
 
210
  "should_evaluate": false,
211
  "should_log": false,
212
  "should_save": true,
213
+ "should_training_stop": true
214
  },
215
  "attributes": {}
216
  }
217
  },
218
+ "total_flos": 1.83706639663104e+16,
219
  "train_batch_size": 10,
220
  "trial_name": null,
221
  "trial_params": null