arshsin commited on
Commit
8e20d4d
·
verified ·
1 Parent(s): 0ed365d

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b948a914e39fad4e65020c5a428e98d9ef510b3c5699b312791549222200834
3
  size 344814656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5c64c281a4cde322ef3eb6901f5acc80b324755fe3573a877fca65b6fdaa614
3
  size 344814656
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:370a3783788e3426f46911174c6ecf5ee6c66358da5df6ada20646ce9f2ad264
3
  size 689741690
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fb4798e31a0c379f8d2aea2f62c93a4ebb0f2223f0b6871e830c00610a07c83
3
  size 689741690
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9196a1e708bf24d6abba41cce3f8558820acc3e50f9394c5955e29eb41ffea3d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c062f7f375beded48b5337f5a3f3a5cb38807fa3e85dbf3e294c0ab6b627bfc2
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1556c40535abe1ed34e2654d4ee34ba195375d3a724579fc6d1e890cfd9ace7
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08b0fce6ed4085eabc1083cc6543ed01efa76540d9e0ff5ac4e32bdd796f6655
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.83,
3
- "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-113",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 113,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -148,13 +148,160 @@
148
  "eval_samples_per_second": 6.377,
149
  "eval_steps_per_second": 0.829,
150
  "step": 113
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
151
  }
152
  ],
153
  "logging_steps": 5,
154
  "max_steps": 1130,
155
  "num_train_epochs": 10,
156
  "save_steps": 500,
157
- "total_flos": 6.094112254328832e+16,
158
  "trial_name": null,
159
  "trial_params": null
160
  }
 
1
  {
2
+ "best_metric": 0.87,
3
+ "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-226",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 226,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
148
  "eval_samples_per_second": 6.377,
149
  "eval_steps_per_second": 0.829,
150
  "step": 113
151
+ },
152
+ {
153
+ "epoch": 1.02,
154
+ "learning_rate": 4.990167158308752e-05,
155
+ "loss": 0.5449,
156
+ "step": 115
157
+ },
158
+ {
159
+ "epoch": 1.06,
160
+ "learning_rate": 4.9655850540806295e-05,
161
+ "loss": 0.5122,
162
+ "step": 120
163
+ },
164
+ {
165
+ "epoch": 1.11,
166
+ "learning_rate": 4.941002949852507e-05,
167
+ "loss": 0.5462,
168
+ "step": 125
169
+ },
170
+ {
171
+ "epoch": 1.15,
172
+ "learning_rate": 4.9164208456243856e-05,
173
+ "loss": 0.5006,
174
+ "step": 130
175
+ },
176
+ {
177
+ "epoch": 1.19,
178
+ "learning_rate": 4.891838741396263e-05,
179
+ "loss": 0.4551,
180
+ "step": 135
181
+ },
182
+ {
183
+ "epoch": 1.24,
184
+ "learning_rate": 4.867256637168142e-05,
185
+ "loss": 0.7397,
186
+ "step": 140
187
+ },
188
+ {
189
+ "epoch": 1.28,
190
+ "learning_rate": 4.8426745329400195e-05,
191
+ "loss": 0.4615,
192
+ "step": 145
193
+ },
194
+ {
195
+ "epoch": 1.33,
196
+ "learning_rate": 4.818092428711898e-05,
197
+ "loss": 0.3942,
198
+ "step": 150
199
+ },
200
+ {
201
+ "epoch": 1.37,
202
+ "learning_rate": 4.7935103244837756e-05,
203
+ "loss": 0.4799,
204
+ "step": 155
205
+ },
206
+ {
207
+ "epoch": 1.42,
208
+ "learning_rate": 4.768928220255654e-05,
209
+ "loss": 0.421,
210
+ "step": 160
211
+ },
212
+ {
213
+ "epoch": 1.46,
214
+ "learning_rate": 4.7443461160275324e-05,
215
+ "loss": 0.694,
216
+ "step": 165
217
+ },
218
+ {
219
+ "epoch": 1.5,
220
+ "learning_rate": 4.71976401179941e-05,
221
+ "loss": 0.3993,
222
+ "step": 170
223
+ },
224
+ {
225
+ "epoch": 1.55,
226
+ "learning_rate": 4.6951819075712886e-05,
227
+ "loss": 0.5977,
228
+ "step": 175
229
+ },
230
+ {
231
+ "epoch": 1.59,
232
+ "learning_rate": 4.670599803343166e-05,
233
+ "loss": 0.974,
234
+ "step": 180
235
+ },
236
+ {
237
+ "epoch": 1.64,
238
+ "learning_rate": 4.646017699115045e-05,
239
+ "loss": 0.5518,
240
+ "step": 185
241
+ },
242
+ {
243
+ "epoch": 1.68,
244
+ "learning_rate": 4.6214355948869224e-05,
245
+ "loss": 0.5082,
246
+ "step": 190
247
+ },
248
+ {
249
+ "epoch": 1.73,
250
+ "learning_rate": 4.596853490658801e-05,
251
+ "loss": 0.5166,
252
+ "step": 195
253
+ },
254
+ {
255
+ "epoch": 1.77,
256
+ "learning_rate": 4.5722713864306786e-05,
257
+ "loss": 0.6408,
258
+ "step": 200
259
+ },
260
+ {
261
+ "epoch": 1.81,
262
+ "learning_rate": 4.547689282202557e-05,
263
+ "loss": 0.6056,
264
+ "step": 205
265
+ },
266
+ {
267
+ "epoch": 1.86,
268
+ "learning_rate": 4.523107177974435e-05,
269
+ "loss": 0.6339,
270
+ "step": 210
271
+ },
272
+ {
273
+ "epoch": 1.9,
274
+ "learning_rate": 4.498525073746313e-05,
275
+ "loss": 0.7673,
276
+ "step": 215
277
+ },
278
+ {
279
+ "epoch": 1.95,
280
+ "learning_rate": 4.473942969518191e-05,
281
+ "loss": 0.2352,
282
+ "step": 220
283
+ },
284
+ {
285
+ "epoch": 1.99,
286
+ "learning_rate": 4.449360865290069e-05,
287
+ "loss": 0.3513,
288
+ "step": 225
289
+ },
290
+ {
291
+ "epoch": 2.0,
292
+ "eval_accuracy": 0.87,
293
+ "eval_loss": 0.5030723810195923,
294
+ "eval_runtime": 15.1706,
295
+ "eval_samples_per_second": 6.592,
296
+ "eval_steps_per_second": 0.857,
297
+ "step": 226
298
  }
299
  ],
300
  "logging_steps": 5,
301
  "max_steps": 1130,
302
  "num_train_epochs": 10,
303
  "save_steps": 500,
304
+ "total_flos": 1.2188224508657664e+17,
305
  "trial_name": null,
306
  "trial_params": null
307
  }