pere committed on
Commit
62b0686
·
1 Parent(s): 084062b

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +4 -4
  2. train_results.json +4 -4
  3. trainer_state.json +12 -3
all_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 1.7381801103855406e-06,
4
- "train_runtime": 64.0295,
5
- "train_samples_per_second": 29986.165,
6
- "train_steps_per_second": 312.356
7
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 5.53145265653126e-07,
4
+ "train_runtime": 51.8572,
5
+ "train_samples_per_second": 37024.777,
6
+ "train_steps_per_second": 385.675
7
  }
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 1.7381801103855406e-06,
4
- "train_runtime": 64.0295,
5
- "train_samples_per_second": 29986.165,
6
- "train_steps_per_second": 312.356
7
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 5.53145265653126e-07,
4
+ "train_runtime": 51.8572,
5
+ "train_samples_per_second": 37024.777,
6
+ "train_steps_per_second": 385.675
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 7.411630558722919,
3
  "best_model_checkpoint": "../whisper-NST2-unfreeze-constanti-low-lr/checkpoint-14000",
4
- "epoch": 1.00005,
5
- "global_step": 20001,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -684,11 +684,20 @@
684
  "train_runtime": 64.0295,
685
  "train_samples_per_second": 29986.165,
686
  "train_steps_per_second": 312.356
 
 
 
 
 
 
 
 
 
687
  }
688
  ],
689
  "max_steps": 20000,
690
  "num_train_epochs": 9223372036854775807,
691
- "total_flos": 2.7702640069558272e+20,
692
  "trial_name": null,
693
  "trial_params": null
694
  }
 
1
  {
2
  "best_metric": 7.411630558722919,
3
  "best_model_checkpoint": "../whisper-NST2-unfreeze-constanti-low-lr/checkpoint-14000",
4
+ "epoch": 1.0001,
5
+ "global_step": 20002,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
684
  "train_runtime": 64.0295,
685
  "train_samples_per_second": 29986.165,
686
  "train_steps_per_second": 312.356
687
+ },
688
+ {
689
+ "epoch": 1.0,
690
+ "step": 20002,
691
+ "total_flos": 2.7704025279479808e+20,
692
+ "train_loss": 5.53145265653126e-07,
693
+ "train_runtime": 51.8572,
694
+ "train_samples_per_second": 37024.777,
695
+ "train_steps_per_second": 385.675
696
  }
697
  ],
698
  "max_steps": 20000,
699
  "num_train_epochs": 9223372036854775807,
700
+ "total_flos": 2.7704025279479808e+20,
701
  "trial_name": null,
702
  "trial_params": null
703
  }