{ "epoch": 20.0, "eval_accuracy": 0.2462286333254075, "eval_loss": 5.426878929138184, "eval_runtime": 8.9817, "eval_samples": 37, "eval_samples_per_second": 4.119, "eval_steps_per_second": 2.115, "perplexity": 227.43828551721677, "total_flos": 3.670508706988032e+16, "train_loss": 3.2965724309285482, "train_runtime": 9164.1975, "train_samples": 767, "train_samples_per_second": 1.674, "train_steps_per_second": 0.21 }