{ "epoch": 25.0, "eval_accuracy": 0.6765868602733887, "eval_loss": 4.952412128448486, "eval_runtime": 130.2782, "eval_samples": 120706, "eval_samples_per_second": 926.525, "eval_steps_per_second": 5.795, "perplexity": 141.51590710222774, "total_flos": 3.046251597339341e+18, "train_loss": 5.746741898249789, "train_runtime": 91431.3002, "train_samples": 2277342, "train_samples_per_second": 622.692, "train_steps_per_second": 3.892 }