arshsin commited on
Commit
65a739a
·
verified ·
1 Parent(s): 4e068d9

Training in progress, epoch 5, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:557a7b887efea43f30540591296b172670f833eb24b7fcde5d38500396cd2120
3
  size 344814656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:053ddaffaa3db7a607dcf27230a9b13bc087cce0f3db3f08d1e8741b7b623d93
3
  size 344814656
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cfe7ba32285d8aca52e368728864045e3b3198f2b05634e71e6db69fa512bc6
3
  size 689741690
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:773e1f541dd330034fd9d01db68892d5dfe39f756e2702b5ecf8302a69810ab4
3
  size 689741690
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3e5d946241df2516b06d7074d8779088eae7607173ad780df56583910a9589b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5328f04f222a66b45931d6bc246721e0747decf9d78d167903d0547a248f78f0
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8e927e0c71d62c9d3968420452b731232314f4117cc838742af50f1ba552059
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcb0fd9ecc07788eea0cda082ff0eb7a870dddfb1340a536b8e8db94ebdced55
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.89,
3
  "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-339",
4
- "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 452,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -583,13 +583,160 @@
583
  "eval_samples_per_second": 6.498,
584
  "eval_steps_per_second": 0.845,
585
  "step": 452
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
586
  }
587
  ],
588
  "logging_steps": 5,
589
  "max_steps": 1130,
590
  "num_train_epochs": 10,
591
  "save_steps": 500,
592
- "total_flos": 2.4376449017315328e+17,
593
  "trial_name": null,
594
  "trial_params": null
595
  }
 
1
  {
2
  "best_metric": 0.89,
3
  "best_model_checkpoint": "ast-finetuned-audioset-10-10-0.4593-finetuned-gtzan/checkpoint-339",
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 565,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
583
  "eval_samples_per_second": 6.498,
584
  "eval_steps_per_second": 0.845,
585
  "step": 452
586
+ },
587
+ {
588
+ "epoch": 4.03,
589
+ "learning_rate": 3.3185840707964604e-05,
590
+ "loss": 0.0107,
591
+ "step": 455
592
+ },
593
+ {
594
+ "epoch": 4.07,
595
+ "learning_rate": 3.294001966568339e-05,
596
+ "loss": 0.0747,
597
+ "step": 460
598
+ },
599
+ {
600
+ "epoch": 4.12,
601
+ "learning_rate": 3.2694198623402165e-05,
602
+ "loss": 0.0063,
603
+ "step": 465
604
+ },
605
+ {
606
+ "epoch": 4.16,
607
+ "learning_rate": 3.244837758112095e-05,
608
+ "loss": 0.0002,
609
+ "step": 470
610
+ },
611
+ {
612
+ "epoch": 4.2,
613
+ "learning_rate": 3.220255653883973e-05,
614
+ "loss": 0.0011,
615
+ "step": 475
616
+ },
617
+ {
618
+ "epoch": 4.25,
619
+ "learning_rate": 3.1956735496558504e-05,
620
+ "loss": 0.0488,
621
+ "step": 480
622
+ },
623
+ {
624
+ "epoch": 4.29,
625
+ "learning_rate": 3.171091445427729e-05,
626
+ "loss": 0.0013,
627
+ "step": 485
628
+ },
629
+ {
630
+ "epoch": 4.34,
631
+ "learning_rate": 3.1465093411996065e-05,
632
+ "loss": 0.0015,
633
+ "step": 490
634
+ },
635
+ {
636
+ "epoch": 4.38,
637
+ "learning_rate": 3.121927236971485e-05,
638
+ "loss": 0.1122,
639
+ "step": 495
640
+ },
641
+ {
642
+ "epoch": 4.42,
643
+ "learning_rate": 3.097345132743363e-05,
644
+ "loss": 0.1653,
645
+ "step": 500
646
+ },
647
+ {
648
+ "epoch": 4.47,
649
+ "learning_rate": 3.072763028515241e-05,
650
+ "loss": 0.0001,
651
+ "step": 505
652
+ },
653
+ {
654
+ "epoch": 4.51,
655
+ "learning_rate": 3.048180924287119e-05,
656
+ "loss": 0.0118,
657
+ "step": 510
658
+ },
659
+ {
660
+ "epoch": 4.56,
661
+ "learning_rate": 3.0235988200589972e-05,
662
+ "loss": 0.161,
663
+ "step": 515
664
+ },
665
+ {
666
+ "epoch": 4.6,
667
+ "learning_rate": 2.9990167158308753e-05,
668
+ "loss": 0.1282,
669
+ "step": 520
670
+ },
671
+ {
672
+ "epoch": 4.65,
673
+ "learning_rate": 2.9744346116027534e-05,
674
+ "loss": 0.0003,
675
+ "step": 525
676
+ },
677
+ {
678
+ "epoch": 4.69,
679
+ "learning_rate": 2.9498525073746314e-05,
680
+ "loss": 0.0003,
681
+ "step": 530
682
+ },
683
+ {
684
+ "epoch": 4.73,
685
+ "learning_rate": 2.9252704031465095e-05,
686
+ "loss": 0.0023,
687
+ "step": 535
688
+ },
689
+ {
690
+ "epoch": 4.78,
691
+ "learning_rate": 2.9006882989183876e-05,
692
+ "loss": 0.0124,
693
+ "step": 540
694
+ },
695
+ {
696
+ "epoch": 4.82,
697
+ "learning_rate": 2.8761061946902656e-05,
698
+ "loss": 0.0002,
699
+ "step": 545
700
+ },
701
+ {
702
+ "epoch": 4.87,
703
+ "learning_rate": 2.8515240904621437e-05,
704
+ "loss": 0.0012,
705
+ "step": 550
706
+ },
707
+ {
708
+ "epoch": 4.91,
709
+ "learning_rate": 2.8269419862340218e-05,
710
+ "loss": 0.0,
711
+ "step": 555
712
+ },
713
+ {
714
+ "epoch": 4.96,
715
+ "learning_rate": 2.8023598820059e-05,
716
+ "loss": 0.3903,
717
+ "step": 560
718
+ },
719
+ {
720
+ "epoch": 5.0,
721
+ "learning_rate": 2.777777777777778e-05,
722
+ "loss": 0.188,
723
+ "step": 565
724
+ },
725
+ {
726
+ "epoch": 5.0,
727
+ "eval_accuracy": 0.88,
728
+ "eval_loss": 0.8578123450279236,
729
+ "eval_runtime": 15.4617,
730
+ "eval_samples_per_second": 6.468,
731
+ "eval_steps_per_second": 0.841,
732
+ "step": 565
733
  }
734
  ],
735
  "logging_steps": 5,
736
  "max_steps": 1130,
737
  "num_train_epochs": 10,
738
  "save_steps": 500,
739
+ "total_flos": 3.047056127164416e+17,
740
  "trial_name": null,
741
  "trial_params": null
742
  }