|
{ |
|
"best_metric": 60.07326007326007, |
|
"best_model_checkpoint": "./checkpoint-70", |
|
"epoch": 1.0, |
|
"global_step": 100, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 7e-05, |
|
"loss": 2.5622, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_loss": 1.5401501655578613, |
|
"eval_runtime": 62.3188, |
|
"eval_samples_per_second": 1.027, |
|
"eval_steps_per_second": 0.032, |
|
"eval_wer": 94.5054945054945, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 9.222222222222223e-05, |
|
"loss": 1.3719, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_loss": 1.001212239265442, |
|
"eval_runtime": 18.9902, |
|
"eval_samples_per_second": 3.37, |
|
"eval_steps_per_second": 0.105, |
|
"eval_wer": 75.27472527472527, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"learning_rate": 8.111111111111112e-05, |
|
"loss": 0.9898, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_loss": 0.8217034339904785, |
|
"eval_runtime": 17.7847, |
|
"eval_samples_per_second": 3.599, |
|
"eval_steps_per_second": 0.112, |
|
"eval_wer": 72.7106227106227, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 7e-05, |
|
"loss": 0.9742, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_loss": 0.7924289107322693, |
|
"eval_runtime": 19.063, |
|
"eval_samples_per_second": 3.357, |
|
"eval_steps_per_second": 0.105, |
|
"eval_wer": 72.52747252747253, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"learning_rate": 5.8888888888888896e-05, |
|
"loss": 0.6951, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.5, |
|
"eval_loss": 0.7628086805343628, |
|
"eval_runtime": 17.8327, |
|
"eval_samples_per_second": 3.589, |
|
"eval_steps_per_second": 0.112, |
|
"eval_wer": 76.19047619047619, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"learning_rate": 4.7777777777777784e-05, |
|
"loss": 0.7824, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_loss": 0.6737741231918335, |
|
"eval_runtime": 18.8876, |
|
"eval_samples_per_second": 3.388, |
|
"eval_steps_per_second": 0.106, |
|
"eval_wer": 65.38461538461539, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"learning_rate": 3.6666666666666666e-05, |
|
"loss": 0.6818, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"eval_loss": 0.6388838291168213, |
|
"eval_runtime": 18.9502, |
|
"eval_samples_per_second": 3.377, |
|
"eval_steps_per_second": 0.106, |
|
"eval_wer": 60.07326007326007, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 2.5555555555555554e-05, |
|
"loss": 0.7823, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_loss": 0.6208388805389404, |
|
"eval_runtime": 18.1881, |
|
"eval_samples_per_second": 3.519, |
|
"eval_steps_per_second": 0.11, |
|
"eval_wer": 65.75091575091575, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"learning_rate": 1.4444444444444444e-05, |
|
"loss": 0.5994, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_loss": 0.5900620818138123, |
|
"eval_runtime": 17.489, |
|
"eval_samples_per_second": 3.659, |
|
"eval_steps_per_second": 0.114, |
|
"eval_wer": 61.904761904761905, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 3.3333333333333333e-06, |
|
"loss": 0.6647, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 0.5789934992790222, |
|
"eval_runtime": 18.4962, |
|
"eval_samples_per_second": 3.46, |
|
"eval_steps_per_second": 0.108, |
|
"eval_wer": 61.72161172161172, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"step": 100, |
|
"total_flos": 7.8780432384e+16, |
|
"train_loss": 1.0103698587417602, |
|
"train_runtime": 873.4716, |
|
"train_samples_per_second": 3.664, |
|
"train_steps_per_second": 0.114 |
|
} |
|
], |
|
"max_steps": 100, |
|
"num_train_epochs": 9223372036854775807, |
|
"total_flos": 7.8780432384e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|