arshsin commited on
Commit
a5dc4b5
·
verified ·
1 Parent(s): cf6f59b

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a464be9fec0b1c828e8a3be4ac1fb7168b03c5ed4d2dbaa87a5f47702a4b740
3
  size 344814656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:557a7b887efea43f30540591296b172670f833eb24b7fcde5d38500396cd2120
3
  size 344814656
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0adda3532a4298fb3546704495979338b3071ea44e0487623379f887c7621f51
3
  size 689741690
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cfe7ba32285d8aca52e368728864045e3b3198f2b05634e71e6db69fa512bc6
3
  size 689741690
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48ee9b73399c28d7e668360bf1d5a4d11095c4738bf96c13f7bb6fbff59f8ccb
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3e5d946241df2516b06d7074d8779088eae7607173ad780df56583910a9589b
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62c39630ef971dd09b3fe4dd100706148d6dbc710ecd4f44ada87a34fe07ca75
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8e927e0c71d62c9d3968420452b731232314f4117cc838742af50f1ba552059
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.89,
3
  "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-339",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 339,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -436,13 +436,160 @@
436
  "eval_samples_per_second": 6.583,
437
  "eval_steps_per_second": 0.856,
438
  "step": 339
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
439
  }
440
  ],
441
  "logging_steps": 5,
442
  "max_steps": 1130,
443
  "num_train_epochs": 10,
444
  "save_steps": 500,
445
- "total_flos": 1.8282336762986496e+17,
446
  "trial_name": null,
447
  "trial_params": null
448
  }
 
1
  {
2
  "best_metric": 0.89,
3
  "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-339",
4
+ "epoch": 4.0,
5
  "eval_steps": 500,
6
+ "global_step": 452,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
436
  "eval_samples_per_second": 6.583,
437
  "eval_steps_per_second": 0.856,
438
  "step": 339
439
+ },
440
+ {
441
+ "epoch": 3.01,
442
+ "learning_rate": 3.883972468043265e-05,
443
+ "loss": 0.2607,
444
+ "step": 340
445
+ },
446
+ {
447
+ "epoch": 3.05,
448
+ "learning_rate": 3.859390363815143e-05,
449
+ "loss": 0.2316,
450
+ "step": 345
451
+ },
452
+ {
453
+ "epoch": 3.1,
454
+ "learning_rate": 3.834808259587021e-05,
455
+ "loss": 0.0272,
456
+ "step": 350
457
+ },
458
+ {
459
+ "epoch": 3.14,
460
+ "learning_rate": 3.810226155358899e-05,
461
+ "loss": 0.1928,
462
+ "step": 355
463
+ },
464
+ {
465
+ "epoch": 3.19,
466
+ "learning_rate": 3.7856440511307774e-05,
467
+ "loss": 0.0225,
468
+ "step": 360
469
+ },
470
+ {
471
+ "epoch": 3.23,
472
+ "learning_rate": 3.7610619469026545e-05,
473
+ "loss": 0.0359,
474
+ "step": 365
475
+ },
476
+ {
477
+ "epoch": 3.27,
478
+ "learning_rate": 3.736479842674533e-05,
479
+ "loss": 0.0208,
480
+ "step": 370
481
+ },
482
+ {
483
+ "epoch": 3.32,
484
+ "learning_rate": 3.711897738446411e-05,
485
+ "loss": 0.0131,
486
+ "step": 375
487
+ },
488
+ {
489
+ "epoch": 3.36,
490
+ "learning_rate": 3.687315634218289e-05,
491
+ "loss": 0.0209,
492
+ "step": 380
493
+ },
494
+ {
495
+ "epoch": 3.41,
496
+ "learning_rate": 3.6627335299901674e-05,
497
+ "loss": 0.1438,
498
+ "step": 385
499
+ },
500
+ {
501
+ "epoch": 3.45,
502
+ "learning_rate": 3.638151425762045e-05,
503
+ "loss": 0.4599,
504
+ "step": 390
505
+ },
506
+ {
507
+ "epoch": 3.5,
508
+ "learning_rate": 3.6135693215339236e-05,
509
+ "loss": 0.0166,
510
+ "step": 395
511
+ },
512
+ {
513
+ "epoch": 3.54,
514
+ "learning_rate": 3.588987217305801e-05,
515
+ "loss": 0.0156,
516
+ "step": 400
517
+ },
518
+ {
519
+ "epoch": 3.58,
520
+ "learning_rate": 3.56440511307768e-05,
521
+ "loss": 0.0039,
522
+ "step": 405
523
+ },
524
+ {
525
+ "epoch": 3.63,
526
+ "learning_rate": 3.5398230088495574e-05,
527
+ "loss": 0.0753,
528
+ "step": 410
529
+ },
530
+ {
531
+ "epoch": 3.67,
532
+ "learning_rate": 3.515240904621436e-05,
533
+ "loss": 0.0047,
534
+ "step": 415
535
+ },
536
+ {
537
+ "epoch": 3.72,
538
+ "learning_rate": 3.4906588003933136e-05,
539
+ "loss": 0.1596,
540
+ "step": 420
541
+ },
542
+ {
543
+ "epoch": 3.76,
544
+ "learning_rate": 3.466076696165192e-05,
545
+ "loss": 0.409,
546
+ "step": 425
547
+ },
548
+ {
549
+ "epoch": 3.81,
550
+ "learning_rate": 3.44149459193707e-05,
551
+ "loss": 0.0616,
552
+ "step": 430
553
+ },
554
+ {
555
+ "epoch": 3.85,
556
+ "learning_rate": 3.416912487708948e-05,
557
+ "loss": 0.0113,
558
+ "step": 435
559
+ },
560
+ {
561
+ "epoch": 3.89,
562
+ "learning_rate": 3.3923303834808265e-05,
563
+ "loss": 0.107,
564
+ "step": 440
565
+ },
566
+ {
567
+ "epoch": 3.94,
568
+ "learning_rate": 3.367748279252704e-05,
569
+ "loss": 0.0516,
570
+ "step": 445
571
+ },
572
+ {
573
+ "epoch": 3.98,
574
+ "learning_rate": 3.343166175024583e-05,
575
+ "loss": 0.0142,
576
+ "step": 450
577
+ },
578
+ {
579
+ "epoch": 4.0,
580
+ "eval_accuracy": 0.89,
581
+ "eval_loss": 0.6147953271865845,
582
+ "eval_runtime": 15.3899,
583
+ "eval_samples_per_second": 6.498,
584
+ "eval_steps_per_second": 0.845,
585
+ "step": 452
586
  }
587
  ],
588
  "logging_steps": 5,
589
  "max_steps": 1130,
590
  "num_train_epochs": 10,
591
  "save_steps": 500,
592
+ "total_flos": 2.4376449017315328e+17,
593
  "trial_name": null,
594
  "trial_params": null
595
  }