{ "epoch": 2.0, "total_flos": 4998105219072.0, "train_loss": 0.08123247806327517, "train_runtime": 863.7561, "train_samples_per_second": 10.403, "train_steps_per_second": 1.301 }