{ "epoch": 1.0, "eval_loss": 1.7731051445007324, "eval_runtime": 1215.8742, "eval_samples_per_second": 78.599, "eval_steps_per_second": 9.825, "perplexity": 5.889111541886369, "total_flos": 5.824755462670647e+18, "train_loss": 2.213516155517568, "train_runtime": 14249.5377, "train_samples_per_second": 26.934, "train_steps_per_second": 3.367 }