SushantGautam committed on
Commit
b754ece
·
1 Parent(s): e7df46f

End of training

Browse files
all_results.json CHANGED
@@ -1,17 +1,17 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_accuracy": 0.6093189964157706,
4
  "eval_gen_len": 1.0,
5
- "eval_loss": 1.8930710554122925,
6
  "eval_rouge1": 0.0,
7
  "eval_rouge2": 0.0,
8
  "eval_rougeL": 0.0,
9
  "eval_rougeLsum": 0.0,
10
- "eval_runtime": 0.1102,
11
- "eval_samples": 3,
12
- "eval_samples_per_second": 27.23,
13
- "eval_steps_per_second": 9.077,
14
- "perplexity": 6.639728375930875,
15
  "predict_gen_len": 1.0,
16
  "predict_loss": 5.266044616699219,
17
  "predict_rouge1": 0.0,
@@ -22,9 +22,9 @@
22
  "predict_samples": 3527,
23
  "predict_samples_per_second": 237.858,
24
  "predict_steps_per_second": 14.904,
25
- "train_loss": 2.381487710135324,
26
- "train_runtime": 18.165,
27
- "train_samples": 49,
28
- "train_samples_per_second": 26.975,
29
- "train_steps_per_second": 3.854
30
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_accuracy": 0.4444444444444444,
4
  "eval_gen_len": 1.0,
5
+ "eval_loss": 3.502009630203247,
6
  "eval_rouge1": 0.0,
7
  "eval_rouge2": 0.0,
8
  "eval_rougeL": 0.0,
9
  "eval_rougeLsum": 0.0,
10
+ "eval_runtime": 0.2824,
11
+ "eval_samples": 176,
12
+ "eval_samples_per_second": 623.144,
13
+ "eval_steps_per_second": 77.893,
14
+ "perplexity": 33.18206868621658,
15
  "predict_gen_len": 1.0,
16
  "predict_loss": 5.266044616699219,
17
  "predict_rouge1": 0.0,
 
22
  "predict_samples": 3527,
23
  "predict_samples_per_second": 237.858,
24
  "predict_steps_per_second": 14.904,
25
+ "train_loss": 3.5042898788946366,
26
+ "train_runtime": 613.1863,
27
+ "train_samples": 3507,
28
+ "train_samples_per_second": 57.193,
29
+ "train_steps_per_second": 7.159
30
  }
eval_results.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "epoch": 10.0,
3
- "eval_accuracy": 0.6093189964157706,
4
- "eval_loss": 1.8930710554122925,
5
- "eval_runtime": 0.1102,
6
- "eval_samples": 3,
7
- "eval_samples_per_second": 27.23,
8
- "eval_steps_per_second": 9.077,
9
- "perplexity": 6.639728375930875
10
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "eval_accuracy": 0.4444444444444444,
4
+ "eval_loss": 3.502009630203247,
5
+ "eval_runtime": 0.2824,
6
+ "eval_samples": 176,
7
+ "eval_samples_per_second": 623.144,
8
+ "eval_steps_per_second": 77.893,
9
+ "perplexity": 33.18206868621658
10
  }
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 10.0,
3
- "train_loss": 2.381487710135324,
4
- "train_runtime": 18.165,
5
- "train_samples": 49,
6
- "train_samples_per_second": 26.975,
7
- "train_steps_per_second": 3.854
8
  }
 
1
  {
2
  "epoch": 10.0,
3
+ "train_loss": 3.5042898788946366,
4
+ "train_runtime": 613.1863,
5
+ "train_samples": 3507,
6
+ "train_samples_per_second": 57.193,
7
+ "train_steps_per_second": 7.159
8
  }
trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff