{ "best_metric": 0.8835274542429284, "best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/bert/bert-base-finetuned-masakhaner-ibo/checkpoint-3000", "epoch": 57.142857142857146, "global_step": 4000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 2.86, "eval_accuracy_score": 0.973508883248731, "eval_f1": 0.8375927452596867, "eval_loss": 0.0908978134393692, "eval_precision": 0.8287112561174551, "eval_recall": 0.8466666666666667, "eval_runtime": 4.4899, "eval_samples_per_second": 71.271, "eval_steps_per_second": 8.909, "step": 200 }, { "epoch": 5.71, "eval_accuracy_score": 0.9760469543147208, "eval_f1": 0.8602329450915143, "eval_loss": 0.10517112910747528, "eval_precision": 0.8588039867109635, "eval_recall": 0.8616666666666667, "eval_runtime": 4.4923, "eval_samples_per_second": 71.233, "eval_steps_per_second": 8.904, "step": 400 }, { "epoch": 7.14, "learning_rate": 4.865771812080537e-05, "loss": 0.1423, "step": 500 }, { "epoch": 8.57, "eval_accuracy_score": 0.9762055837563451, "eval_f1": 0.8692810457516339, "eval_loss": 0.10657743364572525, "eval_precision": 0.8525641025641025, "eval_recall": 0.8866666666666667, "eval_runtime": 4.4983, "eval_samples_per_second": 71.139, "eval_steps_per_second": 8.892, "step": 600 }, { "epoch": 11.43, "eval_accuracy_score": 0.9747779187817259, "eval_f1": 0.8621553884711779, "eval_loss": 0.14751985669136047, "eval_precision": 0.864321608040201, "eval_recall": 0.86, "eval_runtime": 4.4901, "eval_samples_per_second": 71.268, "eval_steps_per_second": 8.908, "step": 800 }, { "epoch": 14.29, "learning_rate": 4.697986577181208e-05, "loss": 0.006, "step": 1000 }, { "epoch": 14.29, "eval_accuracy_score": 0.9733502538071066, "eval_f1": 0.8581138487680544, "eval_loss": 0.1495266854763031, "eval_precision": 0.8752166377816292, "eval_recall": 0.8416666666666667, "eval_runtime": 4.4785, "eval_samples_per_second": 71.453, "eval_steps_per_second": 8.932, "step": 1000 }, { "epoch": 17.14, "eval_accuracy_score": 0.9743020304568528, "eval_f1": 0.8580912863070539, "eval_loss": 0.13109683990478516, "eval_precision": 0.8545454545454545, "eval_recall": 0.8616666666666667, "eval_runtime": 4.4894, "eval_samples_per_second": 71.279, "eval_steps_per_second": 8.91, "step": 1200 }, { "epoch": 20.0, "eval_accuracy_score": 0.975729695431472, "eval_f1": 0.8702791461412152, "eval_loss": 0.12132257223129272, "eval_precision": 0.8576051779935275, "eval_recall": 0.8833333333333333, "eval_runtime": 4.4948, "eval_samples_per_second": 71.193, "eval_steps_per_second": 8.899, "step": 1400 }, { "epoch": 21.43, "learning_rate": 4.530201342281879e-05, "loss": 0.0039, "step": 1500 }, { "epoch": 22.86, "eval_accuracy_score": 0.9727157360406091, "eval_f1": 0.8521594684385383, "eval_loss": 0.14406903088092804, "eval_precision": 0.8493377483443708, "eval_recall": 0.855, "eval_runtime": 4.488, "eval_samples_per_second": 71.301, "eval_steps_per_second": 8.913, "step": 1600 }, { "epoch": 25.71, "eval_accuracy_score": 0.9760469543147208, "eval_f1": 0.8736401673640167, "eval_loss": 0.13323232531547546, "eval_precision": 0.8773109243697479, "eval_recall": 0.87, "eval_runtime": 4.4884, "eval_samples_per_second": 71.295, "eval_steps_per_second": 8.912, "step": 1800 }, { "epoch": 28.57, "learning_rate": 4.36241610738255e-05, "loss": 0.003, "step": 2000 }, { "epoch": 28.57, "eval_accuracy_score": 0.9768401015228426, "eval_f1": 0.8747940691927514, "eval_loss": 0.1382114142179489, "eval_precision": 0.8648208469055375, "eval_recall": 0.885, "eval_runtime": 4.4872, "eval_samples_per_second": 71.313, "eval_steps_per_second": 8.914, "step": 2000 }, { "epoch": 31.43, "eval_accuracy_score": 0.9774746192893401, "eval_f1": 0.8793969849246231, "eval_loss": 0.1348169445991516, "eval_precision": 0.8838383838383839, "eval_recall": 0.875, "eval_runtime": 4.4981, "eval_samples_per_second": 71.141, "eval_steps_per_second": 8.893, "step": 2200 }, { "epoch": 34.29, "eval_accuracy_score": 0.9762055837563451, "eval_f1": 0.8757297748123437, "eval_loss": 0.16189880669116974, "eval_precision": 0.8764607679465777, "eval_recall": 0.875, "eval_runtime": 4.491, "eval_samples_per_second": 71.253, "eval_steps_per_second": 8.907, "step": 2400 }, { "epoch": 35.71, "learning_rate": 4.194630872483222e-05, "loss": 0.002, "step": 2500 }, { "epoch": 37.14, "eval_accuracy_score": 0.9741434010152284, "eval_f1": 0.8702928870292886, "eval_loss": 0.18092279136180878, "eval_precision": 0.8739495798319328, "eval_recall": 0.8666666666666667, "eval_runtime": 4.4888, "eval_samples_per_second": 71.289, "eval_steps_per_second": 8.911, "step": 2600 }, { "epoch": 40.0, "eval_accuracy_score": 0.9768401015228426, "eval_f1": 0.8835672997522708, "eval_loss": 0.14144042134284973, "eval_precision": 0.8756137479541735, "eval_recall": 0.8916666666666667, "eval_runtime": 4.4955, "eval_samples_per_second": 71.183, "eval_steps_per_second": 8.898, "step": 2800 }, { "epoch": 42.86, "learning_rate": 4.026845637583892e-05, "loss": 0.0022, "step": 3000 }, { "epoch": 42.86, "eval_accuracy_score": 0.9779505076142132, "eval_f1": 0.8835274542429284, "eval_loss": 0.1496778428554535, "eval_precision": 0.8820598006644518, "eval_recall": 0.885, "eval_runtime": 4.4823, "eval_samples_per_second": 71.392, "eval_steps_per_second": 8.924, "step": 3000 }, { "epoch": 45.71, "eval_accuracy_score": 0.9755710659898477, "eval_f1": 0.8616404308202154, "eval_loss": 0.1561731994152069, "eval_precision": 0.85667215815486, "eval_recall": 0.8666666666666667, "eval_runtime": 4.4881, "eval_samples_per_second": 71.3, "eval_steps_per_second": 8.913, "step": 3200 }, { "epoch": 48.57, "eval_accuracy_score": 0.9766814720812182, "eval_f1": 0.8719665271966527, "eval_loss": 0.1539183408021927, "eval_precision": 0.8756302521008403, "eval_recall": 0.8683333333333333, "eval_runtime": 4.4822, "eval_samples_per_second": 71.393, "eval_steps_per_second": 8.924, "step": 3400 }, { "epoch": 50.0, "learning_rate": 3.859060402684564e-05, "loss": 0.0014, "step": 3500 }, { "epoch": 51.43, "eval_accuracy_score": 0.9744606598984772, "eval_f1": 0.8673894912427023, "eval_loss": 0.1729230135679245, "eval_precision": 0.8681135225375626, "eval_recall": 0.8666666666666667, "eval_runtime": 4.4847, "eval_samples_per_second": 71.354, "eval_steps_per_second": 8.919, "step": 3600 }, { "epoch": 54.29, "eval_accuracy_score": 0.9743020304568528, "eval_f1": 0.8600167644593462, "eval_loss": 0.1779366433620453, "eval_precision": 0.8650927487352446, "eval_recall": 0.855, "eval_runtime": 4.4776, "eval_samples_per_second": 71.467, "eval_steps_per_second": 8.933, "step": 3800 }, { "epoch": 57.14, "learning_rate": 3.6912751677852356e-05, "loss": 0.0024, "step": 4000 }, { "epoch": 57.14, "eval_accuracy_score": 0.9758883248730964, "eval_f1": 0.8710217755443885, "eval_loss": 0.14653384685516357, "eval_precision": 0.8754208754208754, "eval_recall": 0.8666666666666667, "eval_runtime": 4.4684, "eval_samples_per_second": 71.614, "eval_steps_per_second": 8.952, "step": 4000 }, { "epoch": 57.14, "step": 4000, "total_flos": 1.668681362767104e+16, "train_loss": 0.020399520963430406, "train_runtime": 4498.3257, "train_samples_per_second": 106.706, "train_steps_per_second": 3.335 } ], "max_steps": 15000, "num_train_epochs": 215, "total_flos": 1.668681362767104e+16, "trial_name": null, "trial_params": null }