ales committed on
Commit
6484e0e
·
1 Parent(s): 7956c2a

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.05,
3
+ "eval_loss": 0.974454939365387,
4
+ "eval_runtime": 20.3472,
5
+ "eval_samples": 64,
6
+ "eval_samples_per_second": 3.145,
7
+ "eval_steps_per_second": 0.098,
8
+ "eval_wer": 75.27472527472527,
9
+ "train_loss": 0.041942973931630455,
10
+ "train_runtime": 33.8193,
11
+ "train_samples_per_second": 18.924,
12
+ "train_steps_per_second": 0.591
13
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.05,
3
+ "eval_loss": 0.974454939365387,
4
+ "eval_runtime": 20.3472,
5
+ "eval_samples": 64,
6
+ "eval_samples_per_second": 3.145,
7
+ "eval_steps_per_second": 0.098,
8
+ "eval_wer": 75.27472527472527
9
+ }
runs/Dec12_19-20-12_13ea4557542f/events.out.tfevents.1670872941.13ea4557542f.7255.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14d37370fa62b290fb860bc578e906fe2a5176b5967438a4cf0f699cee3d39aa
3
+ size 352
train.log CHANGED
@@ -2,3 +2,9 @@
2
  {'eval_loss': 1.3674653768539429, 'eval_wer': 95.42124542124543, 'eval_runtime': 44.1027, 'eval_samples_per_second': 1.451, 'eval_steps_per_second': 0.045, 'epoch': 0.5}
3
  {'loss': 1.256, 'learning_rate': 2e-05, 'epoch': 1.0}
4
  {'train_runtime': 33.8193, 'train_samples_per_second': 18.924, 'train_steps_per_second': 0.591, 'train_loss': 0.041942973931630455, 'epoch': 1.05}
 
 
 
 
 
 
 
2
  {'eval_loss': 1.3674653768539429, 'eval_wer': 95.42124542124543, 'eval_runtime': 44.1027, 'eval_samples_per_second': 1.451, 'eval_steps_per_second': 0.045, 'epoch': 0.5}
3
  {'loss': 1.256, 'learning_rate': 2e-05, 'epoch': 1.0}
4
  {'train_runtime': 33.8193, 'train_samples_per_second': 18.924, 'train_steps_per_second': 0.591, 'train_loss': 0.041942973931630455, 'epoch': 1.05}
5
+ ***** train metrics *****
6
+ epoch = 1.05
7
+ train_loss = 0.0419
8
+ train_runtime = 0:00:33.81
9
+ train_samples_per_second = 18.924
10
+ train_steps_per_second = 0.591
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.05,
3
+ "train_loss": 0.041942973931630455,
4
+ "train_runtime": 33.8193,
5
+ "train_samples_per_second": 18.924,
6
+ "train_steps_per_second": 0.591
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 75.27472527472527,
3
+ "best_model_checkpoint": "./checkpoint-20",
4
+ "epoch": 1.05,
5
+ "global_step": 21,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.5,
12
+ "learning_rate": 8.666666666666667e-05,
13
+ "loss": 2.4473,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.5,
18
+ "eval_loss": 1.3674653768539429,
19
+ "eval_runtime": 44.1027,
20
+ "eval_samples_per_second": 1.451,
21
+ "eval_steps_per_second": 0.045,
22
+ "eval_wer": 95.42124542124543,
23
+ "step": 10
24
+ },
25
+ {
26
+ "epoch": 1.0,
27
+ "learning_rate": 2e-05,
28
+ "loss": 1.256,
29
+ "step": 20
30
+ },
31
+ {
32
+ "epoch": 1.0,
33
+ "eval_loss": 0.974454939365387,
34
+ "eval_runtime": 19.7011,
35
+ "eval_samples_per_second": 3.249,
36
+ "eval_steps_per_second": 0.102,
37
+ "eval_wer": 75.27472527472527,
38
+ "step": 20
39
+ },
40
+ {
41
+ "epoch": 1.05,
42
+ "step": 21,
43
+ "total_flos": 1.654389080064e+16,
44
+ "train_loss": 0.041942973931630455,
45
+ "train_runtime": 33.8193,
46
+ "train_samples_per_second": 18.924,
47
+ "train_steps_per_second": 0.591
48
+ }
49
+ ],
50
+ "max_steps": 20,
51
+ "num_train_epochs": 9223372036854775807,
52
+ "total_flos": 1.654389080064e+16,
53
+ "trial_name": null,
54
+ "trial_params": null
55
+ }