|
{ |
|
"best_metric": 0.10217397660017014, |
|
"best_model_checkpoint": "/workspace/output/ka/wav2vec2-xls-r-1b-ka-2/checkpoint-4000", |
|
"epoch": 64.512, |
|
"global_step": 4000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.61, |
|
"learning_rate": 1.7678499999999997e-05, |
|
"loss": 5.1431, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 3.22, |
|
"learning_rate": 3.500349999999999e-05, |
|
"loss": 2.6801, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 4.83, |
|
"learning_rate": 5.232849999999999e-05, |
|
"loss": 1.4529, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 6.45, |
|
"learning_rate": 6.965349999999999e-05, |
|
"loss": 1.2839, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 6.45, |
|
"eval_cer": 0.05568531627678561, |
|
"eval_loss": 0.22294116020202637, |
|
"eval_runtime": 52.1848, |
|
"eval_samples_per_second": 25.774, |
|
"eval_steps_per_second": 0.422, |
|
"eval_wer": 0.3608917324802559, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 8.06, |
|
"learning_rate": 7e-05, |
|
"loss": 1.2486, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.67, |
|
"learning_rate": 7e-05, |
|
"loss": 1.139, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 11.29, |
|
"learning_rate": 7e-05, |
|
"loss": 1.0481, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 12.9, |
|
"learning_rate": 7e-05, |
|
"loss": 0.9775, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 12.9, |
|
"eval_cer": 0.03166960125528526, |
|
"eval_loss": 0.127132385969162, |
|
"eval_runtime": 50.7158, |
|
"eval_samples_per_second": 26.52, |
|
"eval_steps_per_second": 0.434, |
|
"eval_wer": 0.2202339298210537, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 14.51, |
|
"learning_rate": 7e-05, |
|
"loss": 0.9449, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 16.13, |
|
"learning_rate": 7e-05, |
|
"loss": 0.9374, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 17.74, |
|
"learning_rate": 7e-05, |
|
"loss": 0.9197, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 19.35, |
|
"learning_rate": 7e-05, |
|
"loss": 0.9045, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 19.35, |
|
"eval_cer": 0.02939379783678896, |
|
"eval_loss": 0.12676405906677246, |
|
"eval_runtime": 50.6864, |
|
"eval_samples_per_second": 26.536, |
|
"eval_steps_per_second": 0.434, |
|
"eval_wer": 0.20303908827351794, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 20.96, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8889, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 22.58, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8873, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 24.19, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8828, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 25.8, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8652, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 25.8, |
|
"eval_cer": 0.028746990549426858, |
|
"eval_loss": 0.12111534923315048, |
|
"eval_runtime": 50.502, |
|
"eval_samples_per_second": 26.633, |
|
"eval_steps_per_second": 0.436, |
|
"eval_wer": 0.19404178746376088, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 27.42, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8775, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 29.03, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8587, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 30.64, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8518, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 32.26, |
|
"learning_rate": 7e-05, |
|
"loss": 0.8505, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 32.26, |
|
"eval_cer": 0.027573155101991927, |
|
"eval_loss": 0.11918943375349045, |
|
"eval_runtime": 50.5112, |
|
"eval_samples_per_second": 26.628, |
|
"eval_steps_per_second": 0.436, |
|
"eval_wer": 0.19124262721183644, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 33.86, |
|
"learning_rate": 6.67415e-05, |
|
"loss": 0.8436, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 35.48, |
|
"learning_rate": 6.34165e-05, |
|
"loss": 0.8399, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 37.1, |
|
"learning_rate": 6.009149999999999e-05, |
|
"loss": 0.8258, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 38.7, |
|
"learning_rate": 5.679975e-05, |
|
"loss": 0.8168, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 38.7, |
|
"eval_cer": 0.025956136883586667, |
|
"eval_loss": 0.10860513150691986, |
|
"eval_runtime": 51.1919, |
|
"eval_samples_per_second": 26.274, |
|
"eval_steps_per_second": 0.43, |
|
"eval_wer": 0.17634709587123862, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 40.32, |
|
"learning_rate": 5.3474749999999995e-05, |
|
"loss": 0.8068, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 41.93, |
|
"learning_rate": 5.0149749999999995e-05, |
|
"loss": 0.7971, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 43.54, |
|
"learning_rate": 4.6824749999999996e-05, |
|
"loss": 0.7893, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 45.16, |
|
"learning_rate": 4.3499749999999996e-05, |
|
"loss": 0.7737, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 45.16, |
|
"eval_cer": 0.025620755327176687, |
|
"eval_loss": 0.10982357710599899, |
|
"eval_runtime": 50.6716, |
|
"eval_samples_per_second": 26.543, |
|
"eval_steps_per_second": 0.434, |
|
"eval_wer": 0.17534739578126562, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 46.77, |
|
"learning_rate": 4.017475e-05, |
|
"loss": 0.7748, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 48.38, |
|
"learning_rate": 3.684974999999999e-05, |
|
"loss": 0.762, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 49.99, |
|
"learning_rate": 3.352475e-05, |
|
"loss": 0.753, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 51.61, |
|
"learning_rate": 3.0199749999999995e-05, |
|
"loss": 0.744, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 51.61, |
|
"eval_cer": 0.02391989171966893, |
|
"eval_loss": 0.10541926324367523, |
|
"eval_runtime": 50.5525, |
|
"eval_samples_per_second": 26.606, |
|
"eval_steps_per_second": 0.435, |
|
"eval_wer": 0.16455063480955714, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 53.22, |
|
"learning_rate": 2.6874749999999995e-05, |
|
"loss": 0.7233, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 54.83, |
|
"learning_rate": 2.3549749999999996e-05, |
|
"loss": 0.725, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 56.45, |
|
"learning_rate": 2.0224749999999996e-05, |
|
"loss": 0.7158, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 58.06, |
|
"learning_rate": 1.6899749999999997e-05, |
|
"loss": 0.7114, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 58.06, |
|
"eval_cer": 0.022829901661336496, |
|
"eval_loss": 0.10338227450847626, |
|
"eval_runtime": 51.0232, |
|
"eval_samples_per_second": 26.361, |
|
"eval_steps_per_second": 0.431, |
|
"eval_wer": 0.15725282415275418, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 59.67, |
|
"learning_rate": 1.3574749999999999e-05, |
|
"loss": 0.696, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 61.29, |
|
"learning_rate": 1.0249750000000001e-05, |
|
"loss": 0.7046, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 62.9, |
|
"learning_rate": 6.924750000000003e-06, |
|
"loss": 0.6915, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 64.51, |
|
"learning_rate": 3.5997500000000035e-06, |
|
"loss": 0.6773, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 64.51, |
|
"eval_cer": 0.02207529315941404, |
|
"eval_loss": 0.10217397660017014, |
|
"eval_runtime": 50.9761, |
|
"eval_samples_per_second": 26.385, |
|
"eval_steps_per_second": 0.432, |
|
"eval_wer": 0.15265420373887834, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 64.51, |
|
"step": 4000, |
|
"total_flos": 3.3884437885491655e+20, |
|
"train_loss": 1.020361618041992, |
|
"train_runtime": 40092.8966, |
|
"train_samples_per_second": 12.77, |
|
"train_steps_per_second": 0.1 |
|
} |
|
], |
|
"max_steps": 4000, |
|
"num_train_epochs": 65, |
|
"total_flos": 3.3884437885491655e+20, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|