|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 15.0, |
|
"global_step": 1635, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.92, |
|
"eval_loss": 3.585611343383789, |
|
"eval_runtime": 69.1996, |
|
"eval_samples_per_second": 23.801, |
|
"eval_steps_per_second": 2.977, |
|
"eval_wer": 1.0, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.83, |
|
"eval_loss": 3.0358903408050537, |
|
"eval_runtime": 70.0289, |
|
"eval_samples_per_second": 23.519, |
|
"eval_steps_per_second": 2.942, |
|
"eval_wer": 0.9998978653865795, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 2.75, |
|
"eval_loss": 0.9341107606887817, |
|
"eval_runtime": 69.5975, |
|
"eval_samples_per_second": 23.665, |
|
"eval_steps_per_second": 2.96, |
|
"eval_wer": 0.7737718312736186, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 3.67, |
|
"eval_loss": 0.5874470472335815, |
|
"eval_runtime": 69.8546, |
|
"eval_samples_per_second": 23.578, |
|
"eval_steps_per_second": 2.949, |
|
"eval_wer": 0.6386477377183127, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 4.59, |
|
"learning_rate": 0.0002988, |
|
"loss": 3.214, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.59, |
|
"eval_loss": 0.5316070914268494, |
|
"eval_runtime": 69.5825, |
|
"eval_samples_per_second": 23.67, |
|
"eval_steps_per_second": 2.961, |
|
"eval_wer": 0.5525482586048411, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 5.5, |
|
"eval_loss": 0.45860984921455383, |
|
"eval_runtime": 68.7814, |
|
"eval_samples_per_second": 23.945, |
|
"eval_steps_per_second": 2.995, |
|
"eval_wer": 0.519252374629762, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 6.42, |
|
"eval_loss": 0.45034125447273254, |
|
"eval_runtime": 67.077, |
|
"eval_samples_per_second": 24.554, |
|
"eval_steps_per_second": 3.071, |
|
"eval_wer": 0.4605249719129813, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 7.34, |
|
"eval_loss": 0.41716983914375305, |
|
"eval_runtime": 68.1176, |
|
"eval_samples_per_second": 24.179, |
|
"eval_steps_per_second": 3.024, |
|
"eval_wer": 0.4390767030946788, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 8.26, |
|
"eval_loss": 0.4093872606754303, |
|
"eval_runtime": 69.7848, |
|
"eval_samples_per_second": 23.601, |
|
"eval_steps_per_second": 2.952, |
|
"eval_wer": 0.41854764579716064, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 9.17, |
|
"learning_rate": 0.00016837004405286342, |
|
"loss": 0.2284, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 9.17, |
|
"eval_loss": 0.4091317355632782, |
|
"eval_runtime": 70.1477, |
|
"eval_samples_per_second": 23.479, |
|
"eval_steps_per_second": 2.937, |
|
"eval_wer": 0.39985701154121134, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 10.09, |
|
"eval_loss": 0.39890098571777344, |
|
"eval_runtime": 69.3262, |
|
"eval_samples_per_second": 23.757, |
|
"eval_steps_per_second": 2.971, |
|
"eval_wer": 0.40404453069145135, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 11.01, |
|
"eval_loss": 0.4066716432571411, |
|
"eval_runtime": 69.7662, |
|
"eval_samples_per_second": 23.607, |
|
"eval_steps_per_second": 2.953, |
|
"eval_wer": 0.3930139924420386, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 11.93, |
|
"eval_loss": 0.40022560954093933, |
|
"eval_runtime": 67.6908, |
|
"eval_samples_per_second": 24.331, |
|
"eval_steps_per_second": 3.043, |
|
"eval_wer": 0.3775916658155449, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 12.84, |
|
"eval_loss": 0.3982270061969757, |
|
"eval_runtime": 66.5115, |
|
"eval_samples_per_second": 24.763, |
|
"eval_steps_per_second": 3.097, |
|
"eval_wer": 0.36492697375140437, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 13.76, |
|
"learning_rate": 3.621145374449339e-05, |
|
"loss": 0.1029, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 13.76, |
|
"eval_loss": 0.38969308137893677, |
|
"eval_runtime": 65.75, |
|
"eval_samples_per_second": 25.049, |
|
"eval_steps_per_second": 3.133, |
|
"eval_wer": 0.3703401082626902, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 14.68, |
|
"eval_loss": 0.3836365342140198, |
|
"eval_runtime": 65.8183, |
|
"eval_samples_per_second": 25.023, |
|
"eval_steps_per_second": 3.13, |
|
"eval_wer": 0.3566540700643448, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"step": 1635, |
|
"total_flos": 6.429866751096261e+18, |
|
"train_loss": 1.0907053682053125, |
|
"train_runtime": 3864.236, |
|
"train_samples_per_second": 13.501, |
|
"train_steps_per_second": 0.423 |
|
} |
|
], |
|
"max_steps": 1635, |
|
"num_train_epochs": 15, |
|
"total_flos": 6.429866751096261e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|