{
  "epoch": 2.0,
  "eval_accuracy": 0.47740403110973484,
  "eval_loss": 2.567959785461426,
  "eval_runtime": 4355.6296,
  "eval_samples": 41158,
  "eval_samples_per_second": 9.449,
  "eval_steps_per_second": 2.362,
  "perplexity": 13.03919453055406,
  "total_flos": 1.502524253059154e+17,
  "train_loss": 2.352252098808129,
  "train_runtime": 164976.46,
  "train_samples": 287513,
  "train_samples_per_second": 3.486,
  "train_steps_per_second": 0.871
}