{ "best_metric": 0.7236024844720498, "best_model_checkpoint": "/scratch/mrahma45/pixel/finetuned_models/bert/bert-base-finetuned-masakhaner-lug/checkpoint-1000", "epoch": 44.44444444444444, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 4.44, "eval_accuracy_score": 0.9551843012463538, "eval_f1": 0.6815286624203821, "eval_loss": 0.16579905152320862, "eval_precision": 0.6294117647058823, "eval_recall": 0.7430555555555556, "eval_runtime": 2.7912, "eval_samples_per_second": 71.653, "eval_steps_per_second": 8.957, "step": 200 }, { "epoch": 8.89, "eval_accuracy_score": 0.9612834791832405, "eval_f1": 0.7149917627677099, "eval_loss": 0.17872951924800873, "eval_precision": 0.6802507836990596, "eval_recall": 0.7534722222222222, "eval_runtime": 2.7823, "eval_samples_per_second": 71.883, "eval_steps_per_second": 8.985, "step": 400 }, { "epoch": 11.11, "learning_rate": 4.865771812080537e-05, "loss": 0.1436, "step": 500 }, { "epoch": 13.33, "eval_accuracy_score": 0.9554494828957836, "eval_f1": 0.6777408637873754, "eval_loss": 0.2497468888759613, "eval_precision": 0.6496815286624203, "eval_recall": 0.7083333333333334, "eval_runtime": 2.7827, "eval_samples_per_second": 71.874, "eval_steps_per_second": 8.984, "step": 600 }, { "epoch": 17.78, "eval_accuracy_score": 0.9562450278440732, "eval_f1": 0.701095461658842, "eval_loss": 0.24442537128925323, "eval_precision": 0.6381766381766382, "eval_recall": 0.7777777777777778, "eval_runtime": 2.7834, "eval_samples_per_second": 71.856, "eval_steps_per_second": 8.982, "step": 800 }, { "epoch": 22.22, "learning_rate": 4.697986577181208e-05, "loss": 0.0037, "step": 1000 }, { "epoch": 22.22, "eval_accuracy_score": 0.9588968443383717, "eval_f1": 0.7236024844720498, "eval_loss": 0.267472505569458, "eval_precision": 0.6544943820224719, "eval_recall": 0.8090277777777778, "eval_runtime": 2.7845, "eval_samples_per_second": 71.826, "eval_steps_per_second": 8.978, "step": 1000 }, { "epoch": 26.67, "eval_accuracy_score": 0.9554494828957836, "eval_f1": 0.7093750000000001, "eval_loss": 0.2541872262954712, "eval_precision": 0.6448863636363636, "eval_recall": 0.7881944444444444, "eval_runtime": 2.7822, "eval_samples_per_second": 71.884, "eval_steps_per_second": 8.986, "step": 1200 }, { "epoch": 31.11, "eval_accuracy_score": 0.9549191195969239, "eval_f1": 0.7097791798107256, "eval_loss": 0.28504014015197754, "eval_precision": 0.6502890173410405, "eval_recall": 0.78125, "eval_runtime": 2.7835, "eval_samples_per_second": 71.853, "eval_steps_per_second": 8.982, "step": 1400 }, { "epoch": 33.33, "learning_rate": 4.530201342281879e-05, "loss": 0.0029, "step": 1500 }, { "epoch": 35.56, "eval_accuracy_score": 0.9549191195969239, "eval_f1": 0.717391304347826, "eval_loss": 0.281220942735672, "eval_precision": 0.648876404494382, "eval_recall": 0.8020833333333334, "eval_runtime": 2.7818, "eval_samples_per_second": 71.896, "eval_steps_per_second": 8.987, "step": 1600 }, { "epoch": 40.0, "eval_accuracy_score": 0.9551843012463538, "eval_f1": 0.7015873015873016, "eval_loss": 0.2895739674568176, "eval_precision": 0.6461988304093568, "eval_recall": 0.7673611111111112, "eval_runtime": 2.7843, "eval_samples_per_second": 71.83, "eval_steps_per_second": 8.979, "step": 1800 }, { "epoch": 44.44, "learning_rate": 4.36241610738255e-05, "loss": 0.0021, "step": 2000 }, { "epoch": 44.44, "eval_accuracy_score": 0.9557146645452135, "eval_f1": 0.699367088607595, "eval_loss": 0.3147318959236145, "eval_precision": 0.6424418604651163, "eval_recall": 0.7673611111111112, "eval_runtime": 2.7746, "eval_samples_per_second": 72.081, "eval_steps_per_second": 9.01, "step": 2000 }, { "epoch": 44.44, "step": 2000, "total_flos": 8293038676549632.0, "train_loss": 0.03808441823720932, "train_runtime": 2216.7922, "train_samples_per_second": 216.529, "train_steps_per_second": 6.767 } ], "max_steps": 15000, "num_train_epochs": 334, "total_flos": 8293038676549632.0, "trial_name": null, "trial_params": null }