{ "epoch": 2.0, "eval_accuracy": 0.47740403110973484, "eval_loss": 2.567959785461426, "eval_runtime": 4355.6296, "eval_samples": 41158, "eval_samples_per_second": 9.449, "eval_steps_per_second": 2.362, "perplexity": 13.03919453055406, "total_flos": 1.502524253059154e+17, "train_loss": 2.352252098808129, "train_runtime": 164976.46, "train_samples": 287513, "train_samples_per_second": 3.486, "train_steps_per_second": 0.871 }