{ "epoch": 40.0, "total_flos": 2.58159113404416e+18, "train_loss": 0.043670280265808104, "train_runtime": 1256.8878, "train_samples_per_second": 31.825, "train_steps_per_second": 3.978 }