{
  "epoch": 20.0,
  "eval_accuracy": 0.2462286333254075,
  "eval_loss": 5.426878929138184,
  "eval_runtime": 8.9817,
  "eval_samples": 37,
  "eval_samples_per_second": 4.119,
  "eval_steps_per_second": 2.115,
  "perplexity": 227.43828551721677,
  "total_flos": 3.670508706988032e+16,
  "train_loss": 3.2965724309285482,
  "train_runtime": 9164.1975,
  "train_samples": 767,
  "train_samples_per_second": 1.674,
  "train_steps_per_second": 0.21
}