{
  "epoch": 25.0,
  "eval_accuracy": 0.6765868602733887,
  "eval_loss": 4.952412128448486,
  "eval_runtime": 130.2782,
  "eval_samples": 120706,
  "eval_samples_per_second": 926.525,
  "eval_steps_per_second": 5.795,
  "perplexity": 141.51590710222774,
  "total_flos": 3.046251597339341e+18,
  "train_loss": 5.746741898249789,
  "train_runtime": 91431.3002,
  "train_samples": 2277342,
  "train_samples_per_second": 622.692,
  "train_steps_per_second": 3.892
}