gemma-2-2b-it-mt-sft-full_new / all_results.json
martimfasantos's picture
End of training
615c66b verified
raw
history blame contribute delete
418 Bytes
{
"epoch": 0.9982363315696648,
"eval_loss": 1.8862216472625732,
"eval_runtime": 61.2833,
"eval_samples": 8016,
"eval_samples_per_second": 5.434,
"eval_steps_per_second": 2.725,
"total_flos": 1.1264430584732058e+17,
"train_loss": 1.8635691063142918,
"train_runtime": 3704.3906,
"train_samples": 117404,
"train_samples_per_second": 1.224,
"train_steps_per_second": 0.076
}