|
{ |
|
"best_metric": 0.58822980593355, |
|
"best_model_checkpoint": "./CARES/checkpoints/bert-ba/checkpoint-2961", |
|
"epoch": 21.0, |
|
"global_step": 2961, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 0.22213496267795563, |
|
"eval_macro_f1": 0.08913506250646834, |
|
"eval_macro_precision": 0.1601542788476893, |
|
"eval_macro_recall": 0.07453283930073998, |
|
"eval_micro_f1": 0.3941888619854721, |
|
"eval_micro_precision": 0.7650375939849624, |
|
"eval_micro_recall": 0.2654924983692107, |
|
"eval_runtime": 3.0004, |
|
"eval_samples_per_second": 321.956, |
|
"eval_steps_per_second": 20.331, |
|
"step": 141 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 0.18322525918483734, |
|
"eval_macro_f1": 0.20542764030139582, |
|
"eval_macro_precision": 0.31153358140506404, |
|
"eval_macro_recall": 0.1749941105591186, |
|
"eval_micro_f1": 0.6042759177087536, |
|
"eval_micro_precision": 0.7917547568710359, |
|
"eval_micro_recall": 0.4885844748858447, |
|
"eval_runtime": 3.0066, |
|
"eval_samples_per_second": 321.295, |
|
"eval_steps_per_second": 20.289, |
|
"step": 282 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 0.168878972530365, |
|
"eval_macro_f1": 0.29169004336353355, |
|
"eval_macro_precision": 0.39228947650947077, |
|
"eval_macro_recall": 0.2624222179377449, |
|
"eval_micro_f1": 0.6591789310611929, |
|
"eval_micro_precision": 0.8112488083889419, |
|
"eval_micro_recall": 0.5551206784083497, |
|
"eval_runtime": 3.0155, |
|
"eval_samples_per_second": 320.35, |
|
"eval_steps_per_second": 20.229, |
|
"step": 423 |
|
}, |
|
{ |
|
"epoch": 3.55, |
|
"learning_rate": 2.8936170212765956e-05, |
|
"loss": 0.1959, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 0.1501942127943039, |
|
"eval_macro_f1": 0.35589775613243146, |
|
"eval_macro_precision": 0.4667524057986162, |
|
"eval_macro_recall": 0.3166674518971492, |
|
"eval_micro_f1": 0.7155012948575658, |
|
"eval_micro_precision": 0.8264957264957264, |
|
"eval_micro_recall": 0.6307893020221788, |
|
"eval_runtime": 3.0213, |
|
"eval_samples_per_second": 319.733, |
|
"eval_steps_per_second": 20.19, |
|
"step": 564 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 0.14672552049160004, |
|
"eval_macro_f1": 0.47974247836953543, |
|
"eval_macro_precision": 0.6466753641860046, |
|
"eval_macro_recall": 0.42420722655395326, |
|
"eval_micro_f1": 0.7180585296216989, |
|
"eval_micro_precision": 0.7927501970055162, |
|
"eval_micro_recall": 0.6562296151337247, |
|
"eval_runtime": 3.0023, |
|
"eval_samples_per_second": 321.752, |
|
"eval_steps_per_second": 20.318, |
|
"step": 705 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_loss": 0.14830899238586426, |
|
"eval_macro_f1": 0.4652554310103303, |
|
"eval_macro_precision": 0.6251017145329125, |
|
"eval_macro_recall": 0.4150412963066584, |
|
"eval_micro_f1": 0.7256140350877194, |
|
"eval_micro_precision": 0.7851176917236142, |
|
"eval_micro_recall": 0.6744944553163731, |
|
"eval_runtime": 2.9724, |
|
"eval_samples_per_second": 324.991, |
|
"eval_steps_per_second": 20.522, |
|
"step": 846 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_loss": 0.1467733532190323, |
|
"eval_macro_f1": 0.5097890383483837, |
|
"eval_macro_precision": 0.6555313836604214, |
|
"eval_macro_recall": 0.4437744774893355, |
|
"eval_micro_f1": 0.7510431154381085, |
|
"eval_micro_precision": 0.8041697691734921, |
|
"eval_micro_recall": 0.7045009784735812, |
|
"eval_runtime": 2.9801, |
|
"eval_samples_per_second": 324.15, |
|
"eval_steps_per_second": 20.469, |
|
"step": 987 |
|
}, |
|
{ |
|
"epoch": 7.09, |
|
"learning_rate": 2.7872340425531914e-05, |
|
"loss": 0.0904, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": 0.14951790869235992, |
|
"eval_macro_f1": 0.5411089496886734, |
|
"eval_macro_precision": 0.6577005724429985, |
|
"eval_macro_recall": 0.47852188216570773, |
|
"eval_micro_f1": 0.7489539748953974, |
|
"eval_micro_precision": 0.8044943820224719, |
|
"eval_micro_recall": 0.700587084148728, |
|
"eval_runtime": 2.9774, |
|
"eval_samples_per_second": 324.441, |
|
"eval_steps_per_second": 20.487, |
|
"step": 1128 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_loss": 0.1488533467054367, |
|
"eval_macro_f1": 0.5590641407878995, |
|
"eval_macro_precision": 0.6102853068447548, |
|
"eval_macro_recall": 0.5269868274318028, |
|
"eval_micro_f1": 0.755420054200542, |
|
"eval_micro_precision": 0.7857646229739254, |
|
"eval_micro_recall": 0.7273320287018917, |
|
"eval_runtime": 2.9723, |
|
"eval_samples_per_second": 324.996, |
|
"eval_steps_per_second": 20.523, |
|
"step": 1269 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_loss": 0.15144900977611542, |
|
"eval_macro_f1": 0.5597430867412742, |
|
"eval_macro_precision": 0.6112400331236583, |
|
"eval_macro_recall": 0.5287805393050224, |
|
"eval_micro_f1": 0.7608550434201737, |
|
"eval_micro_precision": 0.7796030116358659, |
|
"eval_micro_recall": 0.7429876060013046, |
|
"eval_runtime": 2.9735, |
|
"eval_samples_per_second": 324.869, |
|
"eval_steps_per_second": 20.515, |
|
"step": 1410 |
|
}, |
|
{ |
|
"epoch": 10.64, |
|
"learning_rate": 2.6808510638297873e-05, |
|
"loss": 0.0424, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_loss": 0.15306253731250763, |
|
"eval_macro_f1": 0.5476291897617486, |
|
"eval_macro_precision": 0.6042943362522458, |
|
"eval_macro_recall": 0.5150958586698227, |
|
"eval_micro_f1": 0.7621293800539084, |
|
"eval_micro_precision": 0.7881533101045296, |
|
"eval_micro_recall": 0.7377690802348337, |
|
"eval_runtime": 2.9994, |
|
"eval_samples_per_second": 322.068, |
|
"eval_steps_per_second": 20.338, |
|
"step": 1551 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_loss": 0.15226905047893524, |
|
"eval_macro_f1": 0.5645136859707334, |
|
"eval_macro_precision": 0.6250404048441249, |
|
"eval_macro_recall": 0.5290350408209084, |
|
"eval_micro_f1": 0.7750586657727119, |
|
"eval_micro_precision": 0.7972413793103448, |
|
"eval_micro_recall": 0.7540769732550554, |
|
"eval_runtime": 2.9853, |
|
"eval_samples_per_second": 323.581, |
|
"eval_steps_per_second": 20.433, |
|
"step": 1692 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_loss": 0.15537378191947937, |
|
"eval_macro_f1": 0.5801357636140765, |
|
"eval_macro_precision": 0.6557226559864182, |
|
"eval_macro_recall": 0.5300773127347133, |
|
"eval_micro_f1": 0.7715736040609137, |
|
"eval_micro_precision": 0.8016877637130801, |
|
"eval_micro_recall": 0.7436399217221135, |
|
"eval_runtime": 4.9377, |
|
"eval_samples_per_second": 195.637, |
|
"eval_steps_per_second": 12.354, |
|
"step": 1833 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_loss": 0.15421901643276215, |
|
"eval_macro_f1": 0.5773329417808055, |
|
"eval_macro_precision": 0.6485175319800287, |
|
"eval_macro_recall": 0.5350306451399538, |
|
"eval_micro_f1": 0.77552400270453, |
|
"eval_micro_precision": 0.8049122807017544, |
|
"eval_micro_recall": 0.7482061317677756, |
|
"eval_runtime": 3.0097, |
|
"eval_samples_per_second": 320.96, |
|
"eval_steps_per_second": 20.268, |
|
"step": 1974 |
|
}, |
|
{ |
|
"epoch": 14.18, |
|
"learning_rate": 2.574468085106383e-05, |
|
"loss": 0.0219, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_loss": 0.15735264122486115, |
|
"eval_macro_f1": 0.5661412601117408, |
|
"eval_macro_precision": 0.5937031922346153, |
|
"eval_macro_recall": 0.5467428221378843, |
|
"eval_micro_f1": 0.7738255033557048, |
|
"eval_micro_precision": 0.796821008984105, |
|
"eval_micro_recall": 0.7521200260926288, |
|
"eval_runtime": 2.9854, |
|
"eval_samples_per_second": 323.576, |
|
"eval_steps_per_second": 20.433, |
|
"step": 2115 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_loss": 0.1617126762866974, |
|
"eval_macro_f1": 0.5686269653829785, |
|
"eval_macro_precision": 0.6170850785135864, |
|
"eval_macro_recall": 0.5368268361090598, |
|
"eval_micro_f1": 0.779524924723988, |
|
"eval_micro_precision": 0.8001373626373627, |
|
"eval_micro_recall": 0.7599478147423353, |
|
"eval_runtime": 2.9891, |
|
"eval_samples_per_second": 323.178, |
|
"eval_steps_per_second": 20.408, |
|
"step": 2256 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_loss": 0.16439199447631836, |
|
"eval_macro_f1": 0.5741609962540627, |
|
"eval_macro_precision": 0.6203354824423237, |
|
"eval_macro_recall": 0.5508776094197674, |
|
"eval_micro_f1": 0.7765251989389921, |
|
"eval_micro_precision": 0.7896156439649359, |
|
"eval_micro_recall": 0.7638617090671885, |
|
"eval_runtime": 2.979, |
|
"eval_samples_per_second": 324.271, |
|
"eval_steps_per_second": 20.477, |
|
"step": 2397 |
|
}, |
|
{ |
|
"epoch": 17.73, |
|
"learning_rate": 2.4680851063829786e-05, |
|
"loss": 0.013, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_loss": 0.16467925906181335, |
|
"eval_macro_f1": 0.5828461745953328, |
|
"eval_macro_precision": 0.6374781102044266, |
|
"eval_macro_recall": 0.5491770837420844, |
|
"eval_micro_f1": 0.7797519275896748, |
|
"eval_micro_precision": 0.8020689655172414, |
|
"eval_micro_recall": 0.7586431833007176, |
|
"eval_runtime": 2.9765, |
|
"eval_samples_per_second": 324.537, |
|
"eval_steps_per_second": 20.494, |
|
"step": 2538 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_loss": 0.17651152610778809, |
|
"eval_macro_f1": 0.578653206536447, |
|
"eval_macro_precision": 0.5940445993831301, |
|
"eval_macro_recall": 0.5738532439728641, |
|
"eval_micro_f1": 0.7715868361029651, |
|
"eval_micro_precision": 0.7708333333333334, |
|
"eval_micro_recall": 0.7723418134377038, |
|
"eval_runtime": 2.9833, |
|
"eval_samples_per_second": 323.805, |
|
"eval_steps_per_second": 20.447, |
|
"step": 2679 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_loss": 0.17114990949630737, |
|
"eval_macro_f1": 0.5779704862006727, |
|
"eval_macro_precision": 0.6285916131953179, |
|
"eval_macro_recall": 0.5455200342016094, |
|
"eval_micro_f1": 0.7783711615487315, |
|
"eval_micro_precision": 0.7969924812030075, |
|
"eval_micro_recall": 0.7606001304631441, |
|
"eval_runtime": 2.9774, |
|
"eval_samples_per_second": 324.449, |
|
"eval_steps_per_second": 20.488, |
|
"step": 2820 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_loss": 0.1727105975151062, |
|
"eval_macro_f1": 0.58822980593355, |
|
"eval_macro_precision": 0.6578174885933932, |
|
"eval_macro_recall": 0.5467783967982416, |
|
"eval_micro_f1": 0.782282793867121, |
|
"eval_micro_precision": 0.818830242510699, |
|
"eval_micro_recall": 0.7488584474885844, |
|
"eval_runtime": 2.9806, |
|
"eval_samples_per_second": 324.101, |
|
"eval_steps_per_second": 20.466, |
|
"step": 2961 |
|
} |
|
], |
|
"max_steps": 14100, |
|
"num_train_epochs": 100, |
|
"total_flos": 1.2360197339395008e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|