epoch = 3.0
train_runtime = 2076.5315
train_samples_per_second = 1.556