arshsin committed on
Commit
a275002
·
verified ·
1 Parent(s): 898b6ee

Training in progress, epoch 9, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49ca587b4d5d8717421a4af485723139a27d619ab5d250bb505543ea18c0b00a
3
  size 344814656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8c4bc197ae6609e636c1acebdecb4450fae4cfd794e2f8bc9b54c75e3ce752e
3
  size 344814656
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:791bb2165d16b628931f25c79f6a6cea9bbb548ffc869eac87e243fc4d9d753c
3
  size 689741690
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbb5b73e896c076b7857396e5c3157c071638b325ea0b1351b027ca98c90c9fa
3
  size 689741690
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5f38f6446ba43bb9ae0be4911c150b41c5adfbe2712844ea3cb854b62ee2432
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3bd3cafcd141485c5526689e7070ba65dab1e4639fbae44141ae41439003c1f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65919f7fd01ea36c70a3abe58dbd434dcf13cb0b65cf9d41cba6fbb9678b20df
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bb119f3746a9da47b87642d601b53ab62f9c42621fd5116cb0fdc3c05776476
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.89,
3
  "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-339",
4
- "epoch": 8.0,
5
  "eval_steps": 500,
6
- "global_step": 904,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1159,13 +1159,160 @@
1159
  "eval_samples_per_second": 6.564,
1160
  "eval_steps_per_second": 0.853,
1161
  "step": 904
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1162
  }
1163
  ],
1164
  "logging_steps": 5,
1165
  "max_steps": 1130,
1166
  "num_train_epochs": 10,
1167
  "save_steps": 500,
1168
- "total_flos": 4.8752898034630656e+17,
1169
  "trial_name": null,
1170
  "trial_params": null
1171
  }
 
1
  {
2
  "best_metric": 0.89,
3
  "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-339",
4
+ "epoch": 9.0,
5
  "eval_steps": 500,
6
+ "global_step": 1017,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1159
  "eval_samples_per_second": 6.564,
1160
  "eval_steps_per_second": 0.853,
1161
  "step": 904
1162
+ },
1163
+ {
1164
+ "epoch": 8.01,
1165
+ "learning_rate": 1.1061946902654869e-05,
1166
+ "loss": 0.0,
1167
+ "step": 905
1168
+ },
1169
+ {
1170
+ "epoch": 8.05,
1171
+ "learning_rate": 1.0816125860373648e-05,
1172
+ "loss": 0.0,
1173
+ "step": 910
1174
+ },
1175
+ {
1176
+ "epoch": 8.1,
1177
+ "learning_rate": 1.0570304818092429e-05,
1178
+ "loss": 0.0,
1179
+ "step": 915
1180
+ },
1181
+ {
1182
+ "epoch": 8.14,
1183
+ "learning_rate": 1.032448377581121e-05,
1184
+ "loss": 0.0,
1185
+ "step": 920
1186
+ },
1187
+ {
1188
+ "epoch": 8.19,
1189
+ "learning_rate": 1.007866273352999e-05,
1190
+ "loss": 0.0,
1191
+ "step": 925
1192
+ },
1193
+ {
1194
+ "epoch": 8.23,
1195
+ "learning_rate": 9.832841691248771e-06,
1196
+ "loss": 0.4195,
1197
+ "step": 930
1198
+ },
1199
+ {
1200
+ "epoch": 8.27,
1201
+ "learning_rate": 9.587020648967553e-06,
1202
+ "loss": 0.0,
1203
+ "step": 935
1204
+ },
1205
+ {
1206
+ "epoch": 8.32,
1207
+ "learning_rate": 9.341199606686332e-06,
1208
+ "loss": 0.0,
1209
+ "step": 940
1210
+ },
1211
+ {
1212
+ "epoch": 8.36,
1213
+ "learning_rate": 9.095378564405113e-06,
1214
+ "loss": 0.0,
1215
+ "step": 945
1216
+ },
1217
+ {
1218
+ "epoch": 8.41,
1219
+ "learning_rate": 8.849557522123894e-06,
1220
+ "loss": 0.0,
1221
+ "step": 950
1222
+ },
1223
+ {
1224
+ "epoch": 8.45,
1225
+ "learning_rate": 8.603736479842674e-06,
1226
+ "loss": 0.0,
1227
+ "step": 955
1228
+ },
1229
+ {
1230
+ "epoch": 8.5,
1231
+ "learning_rate": 8.357915437561457e-06,
1232
+ "loss": 0.0,
1233
+ "step": 960
1234
+ },
1235
+ {
1236
+ "epoch": 8.54,
1237
+ "learning_rate": 8.112094395280237e-06,
1238
+ "loss": 0.0,
1239
+ "step": 965
1240
+ },
1241
+ {
1242
+ "epoch": 8.58,
1243
+ "learning_rate": 7.866273352999016e-06,
1244
+ "loss": 0.0,
1245
+ "step": 970
1246
+ },
1247
+ {
1248
+ "epoch": 8.63,
1249
+ "learning_rate": 7.620452310717798e-06,
1250
+ "loss": 0.0,
1251
+ "step": 975
1252
+ },
1253
+ {
1254
+ "epoch": 8.67,
1255
+ "learning_rate": 7.374631268436579e-06,
1256
+ "loss": 0.0,
1257
+ "step": 980
1258
+ },
1259
+ {
1260
+ "epoch": 8.72,
1261
+ "learning_rate": 7.128810226155359e-06,
1262
+ "loss": 0.0,
1263
+ "step": 985
1264
+ },
1265
+ {
1266
+ "epoch": 8.76,
1267
+ "learning_rate": 6.88298918387414e-06,
1268
+ "loss": 0.0,
1269
+ "step": 990
1270
+ },
1271
+ {
1272
+ "epoch": 8.81,
1273
+ "learning_rate": 6.6371681415929215e-06,
1274
+ "loss": 0.0,
1275
+ "step": 995
1276
+ },
1277
+ {
1278
+ "epoch": 8.85,
1279
+ "learning_rate": 6.3913470993117005e-06,
1280
+ "loss": 0.0,
1281
+ "step": 1000
1282
+ },
1283
+ {
1284
+ "epoch": 8.89,
1285
+ "learning_rate": 6.145526057030482e-06,
1286
+ "loss": 0.0,
1287
+ "step": 1005
1288
+ },
1289
+ {
1290
+ "epoch": 8.94,
1291
+ "learning_rate": 5.899705014749263e-06,
1292
+ "loss": 0.2103,
1293
+ "step": 1010
1294
+ },
1295
+ {
1296
+ "epoch": 8.98,
1297
+ "learning_rate": 5.653883972468043e-06,
1298
+ "loss": 0.0,
1299
+ "step": 1015
1300
+ },
1301
+ {
1302
+ "epoch": 9.0,
1303
+ "eval_accuracy": 0.89,
1304
+ "eval_loss": 0.7874658107757568,
1305
+ "eval_runtime": 14.9655,
1306
+ "eval_samples_per_second": 6.682,
1307
+ "eval_steps_per_second": 0.869,
1308
+ "step": 1017
1309
  }
1310
  ],
1311
  "logging_steps": 5,
1312
  "max_steps": 1130,
1313
  "num_train_epochs": 10,
1314
  "save_steps": 500,
1315
+ "total_flos": 5.484701028895949e+17,
1316
  "trial_name": null,
1317
  "trial_params": null
1318
  }