|
{ |
|
"best_metric": 0.08565760403871536, |
|
"best_model_checkpoint": "BBC_CLS_deberta_v3_large_v2/checkpoint-594", |
|
"epoch": 10.0, |
|
"eval_steps": 500, |
|
"global_step": 660, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 6.6e-06, |
|
"loss": 1.235, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.796420581655481, |
|
"eval_f1": 0.4417921999471439, |
|
"eval_loss": 0.633094072341919, |
|
"eval_precision": 0.4046829607174435, |
|
"eval_recall": 0.4873423547822885, |
|
"eval_runtime": 6.7539, |
|
"eval_samples_per_second": 66.184, |
|
"eval_steps_per_second": 2.073, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 1.32e-05, |
|
"loss": 0.4336, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.8970917225950783, |
|
"eval_f1": 0.6910171764080433, |
|
"eval_loss": 0.22008153796195984, |
|
"eval_precision": 0.6753658536585365, |
|
"eval_recall": 0.7090775277247049, |
|
"eval_runtime": 6.7716, |
|
"eval_samples_per_second": 66.011, |
|
"eval_steps_per_second": 2.067, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 1.9800000000000004e-05, |
|
"loss": 0.2133, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9776286353467561, |
|
"eval_f1": 0.9601648947616865, |
|
"eval_loss": 0.0990455150604248, |
|
"eval_precision": 0.9476303317535546, |
|
"eval_recall": 0.9785651349741774, |
|
"eval_runtime": 6.7752, |
|
"eval_samples_per_second": 65.976, |
|
"eval_steps_per_second": 2.066, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 2.64e-05, |
|
"loss": 0.1083, |
|
"step": 264 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9821029082774049, |
|
"eval_f1": 0.9653218049514888, |
|
"eval_loss": 0.10380033403635025, |
|
"eval_precision": 0.9655642046538242, |
|
"eval_recall": 0.9650874727825403, |
|
"eval_runtime": 6.7715, |
|
"eval_samples_per_second": 66.012, |
|
"eval_steps_per_second": 2.067, |
|
"step": 264 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 3.3e-05, |
|
"loss": 0.0848, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9865771812080537, |
|
"eval_f1": 0.9747350357333067, |
|
"eval_loss": 0.09066177904605865, |
|
"eval_precision": 0.9782430301452915, |
|
"eval_recall": 0.9713632225190546, |
|
"eval_runtime": 6.7664, |
|
"eval_samples_per_second": 66.062, |
|
"eval_steps_per_second": 2.069, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 3.960000000000001e-05, |
|
"loss": 0.1087, |
|
"step": 396 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9798657718120806, |
|
"eval_f1": 0.9671245324193838, |
|
"eval_loss": 0.12698371708393097, |
|
"eval_precision": 0.9672288359788359, |
|
"eval_recall": 0.9688744042217826, |
|
"eval_runtime": 6.7679, |
|
"eval_samples_per_second": 66.047, |
|
"eval_steps_per_second": 2.069, |
|
"step": 396 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 4.6200000000000005e-05, |
|
"loss": 0.1011, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9753914988814317, |
|
"eval_f1": 0.9666995780164981, |
|
"eval_loss": 0.12892137467861176, |
|
"eval_precision": 0.9676667575151919, |
|
"eval_recall": 0.9659549559260323, |
|
"eval_runtime": 6.7567, |
|
"eval_samples_per_second": 66.157, |
|
"eval_steps_per_second": 2.072, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 4.125e-05, |
|
"loss": 0.0827, |
|
"step": 528 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9798657718120806, |
|
"eval_f1": 0.9631601759286037, |
|
"eval_loss": 0.09904194623231888, |
|
"eval_precision": 0.9818050507874383, |
|
"eval_recall": 0.9479257225190546, |
|
"eval_runtime": 6.7541, |
|
"eval_samples_per_second": 66.182, |
|
"eval_steps_per_second": 2.073, |
|
"step": 528 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 2.0625e-05, |
|
"loss": 0.0621, |
|
"step": 594 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9865771812080537, |
|
"eval_f1": 0.9750903668573623, |
|
"eval_loss": 0.08565760403871536, |
|
"eval_precision": 0.9722969853754562, |
|
"eval_recall": 0.9780020135988667, |
|
"eval_runtime": 6.7572, |
|
"eval_samples_per_second": 66.152, |
|
"eval_steps_per_second": 2.072, |
|
"step": 594 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.0444, |
|
"step": 660 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9843400447427293, |
|
"eval_f1": 0.9714752151121933, |
|
"eval_loss": 0.10706986486911774, |
|
"eval_precision": 0.9768891875746715, |
|
"eval_recall": 0.9662611817027281, |
|
"eval_runtime": 6.7612, |
|
"eval_samples_per_second": 66.112, |
|
"eval_steps_per_second": 2.071, |
|
"step": 660 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 660, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"total_flos": 9724835143127040.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|