|
{ |
|
"best_metric": 0.95625, |
|
"best_model_checkpoint": "resnet-18-feature-extraction/checkpoint-26", |
|
"epoch": 49.8, |
|
"global_step": 100, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.8, |
|
"eval_accuracy": 0.75, |
|
"eval_f1": 0.8412698412698413, |
|
"eval_loss": 0.6231745481491089, |
|
"eval_precision": 0.9636363636363636, |
|
"eval_recall": 0.7464788732394366, |
|
"eval_roc_auc": 0.7621283255086071, |
|
"eval_runtime": 5.3474, |
|
"eval_samples_per_second": 29.921, |
|
"eval_steps_per_second": 0.561, |
|
"step": 2 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"eval_accuracy": 0.4875, |
|
"eval_f1": 0.5940594059405941, |
|
"eval_loss": 0.6971184611320496, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.4225352112676056, |
|
"eval_roc_auc": 0.7112676056338028, |
|
"eval_runtime": 4.1245, |
|
"eval_samples_per_second": 38.792, |
|
"eval_steps_per_second": 0.727, |
|
"step": 4 |
|
}, |
|
{ |
|
"epoch": 2.8, |
|
"eval_accuracy": 0.2875, |
|
"eval_f1": 0.32941176470588235, |
|
"eval_loss": 0.7914562821388245, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.19718309859154928, |
|
"eval_roc_auc": 0.5985915492957746, |
|
"eval_runtime": 4.0788, |
|
"eval_samples_per_second": 39.227, |
|
"eval_steps_per_second": 0.736, |
|
"step": 6 |
|
}, |
|
{ |
|
"epoch": 3.8, |
|
"eval_accuracy": 0.2875, |
|
"eval_f1": 0.32941176470588235, |
|
"eval_loss": 0.8479948043823242, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.19718309859154928, |
|
"eval_roc_auc": 0.5985915492957746, |
|
"eval_runtime": 3.9544, |
|
"eval_samples_per_second": 40.462, |
|
"eval_steps_per_second": 0.759, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 4.8, |
|
"learning_rate": 2e-05, |
|
"loss": 0.8651, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 4.8, |
|
"eval_accuracy": 0.25625, |
|
"eval_f1": 0.2787878787878788, |
|
"eval_loss": 0.9093517065048218, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.1619718309859155, |
|
"eval_roc_auc": 0.5809859154929577, |
|
"eval_runtime": 4.143, |
|
"eval_samples_per_second": 38.62, |
|
"eval_steps_per_second": 0.724, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 5.8, |
|
"eval_accuracy": 0.5625, |
|
"eval_f1": 0.6728971962616822, |
|
"eval_loss": 0.7470346689224243, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.5070422535211268, |
|
"eval_roc_auc": 0.7535211267605634, |
|
"eval_runtime": 3.9679, |
|
"eval_samples_per_second": 40.323, |
|
"eval_steps_per_second": 0.756, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 6.8, |
|
"eval_accuracy": 0.85, |
|
"eval_f1": 0.9076923076923077, |
|
"eval_loss": 0.5915343165397644, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8309859154929577, |
|
"eval_roc_auc": 0.9154929577464789, |
|
"eval_runtime": 4.0338, |
|
"eval_samples_per_second": 39.665, |
|
"eval_steps_per_second": 0.744, |
|
"step": 14 |
|
}, |
|
{ |
|
"epoch": 7.8, |
|
"eval_accuracy": 0.8875, |
|
"eval_f1": 0.9333333333333333, |
|
"eval_loss": 0.4816938042640686, |
|
"eval_precision": 0.984375, |
|
"eval_recall": 0.8873239436619719, |
|
"eval_roc_auc": 0.8881064162754304, |
|
"eval_runtime": 4.0258, |
|
"eval_samples_per_second": 39.743, |
|
"eval_steps_per_second": 0.745, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"eval_accuracy": 0.91875, |
|
"eval_f1": 0.9530685920577617, |
|
"eval_loss": 0.34547853469848633, |
|
"eval_precision": 0.9777777777777777, |
|
"eval_recall": 0.9295774647887324, |
|
"eval_roc_auc": 0.881455399061033, |
|
"eval_runtime": 3.9749, |
|
"eval_samples_per_second": 40.253, |
|
"eval_steps_per_second": 0.755, |
|
"step": 18 |
|
}, |
|
{ |
|
"epoch": 9.8, |
|
"learning_rate": 1.7777777777777777e-05, |
|
"loss": 0.5349, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 9.8, |
|
"eval_accuracy": 0.91875, |
|
"eval_f1": 0.9534050179211471, |
|
"eval_loss": 0.29664501547813416, |
|
"eval_precision": 0.9708029197080292, |
|
"eval_recall": 0.9366197183098591, |
|
"eval_roc_auc": 0.8571987480438183, |
|
"eval_runtime": 4.2704, |
|
"eval_samples_per_second": 37.467, |
|
"eval_steps_per_second": 0.703, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 10.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.972027972027972, |
|
"eval_loss": 0.23471388220787048, |
|
"eval_precision": 0.9652777777777778, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.850547730829421, |
|
"eval_runtime": 3.9069, |
|
"eval_samples_per_second": 40.953, |
|
"eval_steps_per_second": 0.768, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 11.8, |
|
"eval_accuracy": 0.93125, |
|
"eval_f1": 0.9611307420494699, |
|
"eval_loss": 0.2467934787273407, |
|
"eval_precision": 0.9645390070921985, |
|
"eval_recall": 0.9577464788732394, |
|
"eval_roc_auc": 0.8399843505477309, |
|
"eval_runtime": 4.025, |
|
"eval_samples_per_second": 39.751, |
|
"eval_steps_per_second": 0.745, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 12.8, |
|
"eval_accuracy": 0.95625, |
|
"eval_f1": 0.9754385964912281, |
|
"eval_loss": 0.23101434111595154, |
|
"eval_precision": 0.972027972027972, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.8783255086071988, |
|
"eval_runtime": 4.0457, |
|
"eval_samples_per_second": 39.548, |
|
"eval_steps_per_second": 0.742, |
|
"step": 26 |
|
}, |
|
{ |
|
"epoch": 13.8, |
|
"eval_accuracy": 0.93125, |
|
"eval_f1": 0.9614035087719298, |
|
"eval_loss": 0.2082931101322174, |
|
"eval_precision": 0.958041958041958, |
|
"eval_recall": 0.9647887323943662, |
|
"eval_roc_auc": 0.8157276995305165, |
|
"eval_runtime": 4.0645, |
|
"eval_samples_per_second": 39.366, |
|
"eval_steps_per_second": 0.738, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 14.8, |
|
"learning_rate": 1.555555555555556e-05, |
|
"loss": 0.3593, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 14.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.9652777777777778, |
|
"eval_loss": 0.18395133316516876, |
|
"eval_precision": 0.952054794520548, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.7949921752738655, |
|
"eval_runtime": 3.8518, |
|
"eval_samples_per_second": 41.539, |
|
"eval_steps_per_second": 0.779, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 15.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.9647887323943662, |
|
"eval_loss": 0.19472570717334747, |
|
"eval_precision": 0.9647887323943662, |
|
"eval_recall": 0.9647887323943662, |
|
"eval_roc_auc": 0.8435054773082942, |
|
"eval_runtime": 4.1431, |
|
"eval_samples_per_second": 38.618, |
|
"eval_steps_per_second": 0.724, |
|
"step": 32 |
|
}, |
|
{ |
|
"epoch": 16.8, |
|
"eval_accuracy": 0.93125, |
|
"eval_f1": 0.9616724738675958, |
|
"eval_loss": 0.1836571842432022, |
|
"eval_precision": 0.9517241379310345, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.7914710485133021, |
|
"eval_runtime": 4.0848, |
|
"eval_samples_per_second": 39.17, |
|
"eval_steps_per_second": 0.734, |
|
"step": 34 |
|
}, |
|
{ |
|
"epoch": 17.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.9688581314878894, |
|
"eval_loss": 0.1819494664669037, |
|
"eval_precision": 0.9523809523809523, |
|
"eval_recall": 0.9859154929577465, |
|
"eval_roc_auc": 0.7985133020344288, |
|
"eval_runtime": 3.9897, |
|
"eval_samples_per_second": 40.104, |
|
"eval_steps_per_second": 0.752, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 18.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.968421052631579, |
|
"eval_loss": 0.19235201179981232, |
|
"eval_precision": 0.965034965034965, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8470266040688575, |
|
"eval_runtime": 4.041, |
|
"eval_samples_per_second": 39.594, |
|
"eval_steps_per_second": 0.742, |
|
"step": 38 |
|
}, |
|
{ |
|
"epoch": 19.8, |
|
"learning_rate": 1.3333333333333333e-05, |
|
"loss": 0.2737, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 19.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.972027972027972, |
|
"eval_loss": 0.1990378201007843, |
|
"eval_precision": 0.9652777777777778, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.850547730829421, |
|
"eval_runtime": 4.1236, |
|
"eval_samples_per_second": 38.801, |
|
"eval_steps_per_second": 0.728, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 20.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.971830985915493, |
|
"eval_loss": 0.1758503019809723, |
|
"eval_precision": 0.971830985915493, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8748043818466354, |
|
"eval_runtime": 4.1193, |
|
"eval_samples_per_second": 38.841, |
|
"eval_steps_per_second": 0.728, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 21.8, |
|
"eval_accuracy": 0.93125, |
|
"eval_f1": 0.9616724738675958, |
|
"eval_loss": 0.18040268123149872, |
|
"eval_precision": 0.9517241379310345, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.7914710485133021, |
|
"eval_runtime": 3.8662, |
|
"eval_samples_per_second": 41.384, |
|
"eval_steps_per_second": 0.776, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 22.8, |
|
"eval_accuracy": 0.93125, |
|
"eval_f1": 0.9616724738675958, |
|
"eval_loss": 0.16663400828838348, |
|
"eval_precision": 0.9517241379310345, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.7914710485133021, |
|
"eval_runtime": 4.3016, |
|
"eval_samples_per_second": 37.195, |
|
"eval_steps_per_second": 0.697, |
|
"step": 46 |
|
}, |
|
{ |
|
"epoch": 23.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.9688581314878894, |
|
"eval_loss": 0.15337304770946503, |
|
"eval_precision": 0.9523809523809523, |
|
"eval_recall": 0.9859154929577465, |
|
"eval_roc_auc": 0.7985133020344288, |
|
"eval_runtime": 4.0456, |
|
"eval_samples_per_second": 39.549, |
|
"eval_steps_per_second": 0.742, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 24.8, |
|
"learning_rate": 1.1111111111111113e-05, |
|
"loss": 0.2278, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 24.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.9652777777777778, |
|
"eval_loss": 0.16116251051425934, |
|
"eval_precision": 0.952054794520548, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.7949921752738655, |
|
"eval_runtime": 4.0452, |
|
"eval_samples_per_second": 39.553, |
|
"eval_steps_per_second": 0.742, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 25.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.9686411149825783, |
|
"eval_loss": 0.15349864959716797, |
|
"eval_precision": 0.9586206896551724, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.8227699530516432, |
|
"eval_runtime": 6.0991, |
|
"eval_samples_per_second": 26.233, |
|
"eval_steps_per_second": 0.492, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 26.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.9681978798586572, |
|
"eval_loss": 0.1568022519350052, |
|
"eval_precision": 0.9716312056737588, |
|
"eval_recall": 0.9647887323943662, |
|
"eval_roc_auc": 0.871283255086072, |
|
"eval_runtime": 4.0891, |
|
"eval_samples_per_second": 39.128, |
|
"eval_steps_per_second": 0.734, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 27.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.9645390070921985, |
|
"eval_loss": 0.21069078147411346, |
|
"eval_precision": 0.9714285714285714, |
|
"eval_recall": 0.9577464788732394, |
|
"eval_roc_auc": 0.8677621283255086, |
|
"eval_runtime": 4.1257, |
|
"eval_samples_per_second": 38.781, |
|
"eval_steps_per_second": 0.727, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 28.8, |
|
"eval_accuracy": 0.93125, |
|
"eval_f1": 0.9616724738675958, |
|
"eval_loss": 0.15922358632087708, |
|
"eval_precision": 0.9517241379310345, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.7914710485133021, |
|
"eval_runtime": 3.944, |
|
"eval_samples_per_second": 40.568, |
|
"eval_steps_per_second": 0.761, |
|
"step": 58 |
|
}, |
|
{ |
|
"epoch": 29.8, |
|
"learning_rate": 8.888888888888888e-06, |
|
"loss": 0.2057, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 29.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.9647887323943662, |
|
"eval_loss": 0.15567776560783386, |
|
"eval_precision": 0.9647887323943662, |
|
"eval_recall": 0.9647887323943662, |
|
"eval_roc_auc": 0.8435054773082942, |
|
"eval_runtime": 3.9386, |
|
"eval_samples_per_second": 40.624, |
|
"eval_steps_per_second": 0.762, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 30.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.968421052631579, |
|
"eval_loss": 0.1714434176683426, |
|
"eval_precision": 0.965034965034965, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8470266040688575, |
|
"eval_runtime": 4.1925, |
|
"eval_samples_per_second": 38.164, |
|
"eval_steps_per_second": 0.716, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 31.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.972027972027972, |
|
"eval_loss": 0.15714499354362488, |
|
"eval_precision": 0.9652777777777778, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.850547730829421, |
|
"eval_runtime": 4.3684, |
|
"eval_samples_per_second": 36.627, |
|
"eval_steps_per_second": 0.687, |
|
"step": 64 |
|
}, |
|
{ |
|
"epoch": 32.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.965034965034965, |
|
"eval_loss": 0.15739548206329346, |
|
"eval_precision": 0.9583333333333334, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8192488262910799, |
|
"eval_runtime": 3.9613, |
|
"eval_samples_per_second": 40.39, |
|
"eval_steps_per_second": 0.757, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 33.8, |
|
"eval_accuracy": 0.95625, |
|
"eval_f1": 0.9754385964912281, |
|
"eval_loss": 0.1422826498746872, |
|
"eval_precision": 0.972027972027972, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.8783255086071988, |
|
"eval_runtime": 3.9825, |
|
"eval_samples_per_second": 40.175, |
|
"eval_steps_per_second": 0.753, |
|
"step": 68 |
|
}, |
|
{ |
|
"epoch": 34.8, |
|
"learning_rate": 6.666666666666667e-06, |
|
"loss": 0.2, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 34.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.968421052631579, |
|
"eval_loss": 0.16770192980766296, |
|
"eval_precision": 0.965034965034965, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8470266040688575, |
|
"eval_runtime": 4.1697, |
|
"eval_samples_per_second": 38.372, |
|
"eval_steps_per_second": 0.719, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 35.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.965034965034965, |
|
"eval_loss": 0.1559743881225586, |
|
"eval_precision": 0.9583333333333334, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8192488262910799, |
|
"eval_runtime": 4.0897, |
|
"eval_samples_per_second": 39.123, |
|
"eval_steps_per_second": 0.734, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 36.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.9652777777777778, |
|
"eval_loss": 0.15941758453845978, |
|
"eval_precision": 0.952054794520548, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.7949921752738655, |
|
"eval_runtime": 4.0474, |
|
"eval_samples_per_second": 39.531, |
|
"eval_steps_per_second": 0.741, |
|
"step": 74 |
|
}, |
|
{ |
|
"epoch": 37.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.9686411149825783, |
|
"eval_loss": 0.15121030807495117, |
|
"eval_precision": 0.9586206896551724, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.8227699530516432, |
|
"eval_runtime": 4.2667, |
|
"eval_samples_per_second": 37.499, |
|
"eval_steps_per_second": 0.703, |
|
"step": 76 |
|
}, |
|
{ |
|
"epoch": 38.8, |
|
"eval_accuracy": 0.95625, |
|
"eval_f1": 0.975609756097561, |
|
"eval_loss": 0.13959212601184845, |
|
"eval_precision": 0.9655172413793104, |
|
"eval_recall": 0.9859154929577465, |
|
"eval_roc_auc": 0.8540688575899843, |
|
"eval_runtime": 4.0576, |
|
"eval_samples_per_second": 39.432, |
|
"eval_steps_per_second": 0.739, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 39.8, |
|
"learning_rate": 4.444444444444444e-06, |
|
"loss": 0.1838, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 39.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.965034965034965, |
|
"eval_loss": 0.15085594356060028, |
|
"eval_precision": 0.9583333333333334, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8192488262910799, |
|
"eval_runtime": 3.9857, |
|
"eval_samples_per_second": 40.144, |
|
"eval_steps_per_second": 0.753, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 40.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.971830985915493, |
|
"eval_loss": 0.15287616848945618, |
|
"eval_precision": 0.971830985915493, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8748043818466354, |
|
"eval_runtime": 5.1236, |
|
"eval_samples_per_second": 31.228, |
|
"eval_steps_per_second": 0.586, |
|
"step": 82 |
|
}, |
|
{ |
|
"epoch": 41.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.972027972027972, |
|
"eval_loss": 0.1505597084760666, |
|
"eval_precision": 0.9652777777777778, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.850547730829421, |
|
"eval_runtime": 4.2192, |
|
"eval_samples_per_second": 37.921, |
|
"eval_steps_per_second": 0.711, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 42.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.972027972027972, |
|
"eval_loss": 0.1549244374036789, |
|
"eval_precision": 0.9652777777777778, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.850547730829421, |
|
"eval_runtime": 3.8602, |
|
"eval_samples_per_second": 41.448, |
|
"eval_steps_per_second": 0.777, |
|
"step": 86 |
|
}, |
|
{ |
|
"epoch": 43.8, |
|
"eval_accuracy": 0.95625, |
|
"eval_f1": 0.975609756097561, |
|
"eval_loss": 0.13305585086345673, |
|
"eval_precision": 0.9655172413793104, |
|
"eval_recall": 0.9859154929577465, |
|
"eval_roc_auc": 0.8540688575899843, |
|
"eval_runtime": 4.2919, |
|
"eval_samples_per_second": 37.28, |
|
"eval_steps_per_second": 0.699, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 44.8, |
|
"learning_rate": 2.222222222222222e-06, |
|
"loss": 0.1872, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 44.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.9688581314878894, |
|
"eval_loss": 0.14087018370628357, |
|
"eval_precision": 0.9523809523809523, |
|
"eval_recall": 0.9859154929577465, |
|
"eval_roc_auc": 0.7985133020344288, |
|
"eval_runtime": 4.0748, |
|
"eval_samples_per_second": 39.266, |
|
"eval_steps_per_second": 0.736, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 45.8, |
|
"eval_accuracy": 0.9375, |
|
"eval_f1": 0.965034965034965, |
|
"eval_loss": 0.1639305055141449, |
|
"eval_precision": 0.9583333333333334, |
|
"eval_recall": 0.971830985915493, |
|
"eval_roc_auc": 0.8192488262910799, |
|
"eval_runtime": 3.9376, |
|
"eval_samples_per_second": 40.634, |
|
"eval_steps_per_second": 0.762, |
|
"step": 92 |
|
}, |
|
{ |
|
"epoch": 46.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.9722222222222222, |
|
"eval_loss": 0.1390833854675293, |
|
"eval_precision": 0.958904109589041, |
|
"eval_recall": 0.9859154929577465, |
|
"eval_roc_auc": 0.8262910798122067, |
|
"eval_runtime": 3.9934, |
|
"eval_samples_per_second": 40.066, |
|
"eval_steps_per_second": 0.751, |
|
"step": 94 |
|
}, |
|
{ |
|
"epoch": 47.8, |
|
"eval_accuracy": 0.95625, |
|
"eval_f1": 0.975609756097561, |
|
"eval_loss": 0.14361494779586792, |
|
"eval_precision": 0.9655172413793104, |
|
"eval_recall": 0.9859154929577465, |
|
"eval_roc_auc": 0.8540688575899843, |
|
"eval_runtime": 4.2477, |
|
"eval_samples_per_second": 37.667, |
|
"eval_steps_per_second": 0.706, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 48.8, |
|
"eval_accuracy": 0.94375, |
|
"eval_f1": 0.9686411149825783, |
|
"eval_loss": 0.1442493200302124, |
|
"eval_precision": 0.9586206896551724, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.8227699530516432, |
|
"eval_runtime": 4.0963, |
|
"eval_samples_per_second": 39.059, |
|
"eval_steps_per_second": 0.732, |
|
"step": 98 |
|
}, |
|
{ |
|
"epoch": 49.8, |
|
"learning_rate": 0.0, |
|
"loss": 0.185, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 49.8, |
|
"eval_accuracy": 0.95, |
|
"eval_f1": 0.972027972027972, |
|
"eval_loss": 0.1484707146883011, |
|
"eval_precision": 0.9652777777777778, |
|
"eval_recall": 0.9788732394366197, |
|
"eval_roc_auc": 0.850547730829421, |
|
"eval_runtime": 3.8936, |
|
"eval_samples_per_second": 41.093, |
|
"eval_steps_per_second": 0.77, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 49.8, |
|
"step": 100, |
|
"total_flos": 3.197753854288036e+17, |
|
"train_loss": 0.3222511351108551, |
|
"train_runtime": 425.6784, |
|
"train_samples_per_second": 74.704, |
|
"train_steps_per_second": 0.235 |
|
} |
|
], |
|
"max_steps": 100, |
|
"num_train_epochs": 50, |
|
"total_flos": 3.197753854288036e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|