|
{ |
|
"best_metric": 0.43965517241379304, |
|
"best_model_checkpoint": "car_identified_model_7/checkpoint-165", |
|
"epoch": 228.36363636363637, |
|
"eval_steps": 500, |
|
"global_step": 314, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.73, |
|
"learning_rate": 1.9950000000000004e-05, |
|
"loss": 0.6943, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.09523809523809525, |
|
"eval_loss": 0.6940220594406128, |
|
"eval_roc_auc": 0.4290890269151138, |
|
"eval_runtime": 2.3165, |
|
"eval_samples_per_second": 18.131, |
|
"eval_steps_per_second": 1.295, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.09126984126984126, |
|
"eval_loss": 0.6954004764556885, |
|
"eval_roc_auc": 0.4314182194616977, |
|
"eval_runtime": 2.1188, |
|
"eval_samples_per_second": 19.823, |
|
"eval_steps_per_second": 1.416, |
|
"step": 2 |
|
}, |
|
{ |
|
"epoch": 2.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.10158730158730159, |
|
"eval_loss": 0.7020308971405029, |
|
"eval_roc_auc": 0.4244306418219462, |
|
"eval_runtime": 2.0566, |
|
"eval_samples_per_second": 20.422, |
|
"eval_steps_per_second": 1.459, |
|
"step": 4 |
|
}, |
|
{ |
|
"epoch": 3.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.1020408163265306, |
|
"eval_loss": 0.7104746103286743, |
|
"eval_roc_auc": 0.43322981366459634, |
|
"eval_runtime": 2.0845, |
|
"eval_samples_per_second": 20.149, |
|
"eval_steps_per_second": 1.439, |
|
"step": 5 |
|
}, |
|
{ |
|
"epoch": 4.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.15476190476190477, |
|
"eval_loss": 0.7156671285629272, |
|
"eval_roc_auc": 0.5320910973084887, |
|
"eval_runtime": 2.0793, |
|
"eval_samples_per_second": 20.199, |
|
"eval_steps_per_second": 1.443, |
|
"step": 6 |
|
}, |
|
{ |
|
"epoch": 5.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.1546218487394958, |
|
"eval_loss": 0.6987839937210083, |
|
"eval_roc_auc": 0.5331262939958592, |
|
"eval_runtime": 2.1617, |
|
"eval_samples_per_second": 19.429, |
|
"eval_steps_per_second": 1.388, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 6.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.15355805243445694, |
|
"eval_loss": 0.6832717061042786, |
|
"eval_roc_auc": 0.5323498964803313, |
|
"eval_runtime": 2.117, |
|
"eval_samples_per_second": 19.84, |
|
"eval_steps_per_second": 1.417, |
|
"step": 9 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.18217054263565893, |
|
"eval_loss": 0.6745525598526001, |
|
"eval_roc_auc": 0.5804865424430642, |
|
"eval_runtime": 2.0693, |
|
"eval_samples_per_second": 20.297, |
|
"eval_steps_per_second": 1.45, |
|
"step": 11 |
|
}, |
|
{ |
|
"epoch": 8.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2058252427184466, |
|
"eval_loss": 0.6750043034553528, |
|
"eval_roc_auc": 0.619824016563147, |
|
"eval_runtime": 2.0585, |
|
"eval_samples_per_second": 20.403, |
|
"eval_steps_per_second": 1.457, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 9.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2152641878669276, |
|
"eval_loss": 0.673625648021698, |
|
"eval_roc_auc": 0.6348343685300206, |
|
"eval_runtime": 2.1768, |
|
"eval_samples_per_second": 19.294, |
|
"eval_steps_per_second": 1.378, |
|
"step": 13 |
|
}, |
|
{ |
|
"epoch": 10.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2222222222222222, |
|
"eval_loss": 0.6704300045967102, |
|
"eval_roc_auc": 0.644927536231884, |
|
"eval_runtime": 2.2148, |
|
"eval_samples_per_second": 18.963, |
|
"eval_steps_per_second": 1.355, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 11.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2258064516129032, |
|
"eval_loss": 0.6693084836006165, |
|
"eval_roc_auc": 0.6490683229813665, |
|
"eval_runtime": 2.0734, |
|
"eval_samples_per_second": 20.257, |
|
"eval_steps_per_second": 1.447, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 12.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.23293172690763056, |
|
"eval_loss": 0.6673960089683533, |
|
"eval_roc_auc": 0.6609730848861284, |
|
"eval_runtime": 2.1348, |
|
"eval_samples_per_second": 19.674, |
|
"eval_steps_per_second": 1.405, |
|
"step": 17 |
|
}, |
|
{ |
|
"epoch": 13.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2240325865580448, |
|
"eval_loss": 0.6640763282775879, |
|
"eval_roc_auc": 0.6451863354037266, |
|
"eval_runtime": 2.1666, |
|
"eval_samples_per_second": 19.385, |
|
"eval_steps_per_second": 1.385, |
|
"step": 19 |
|
}, |
|
{ |
|
"epoch": 14.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.22085889570552147, |
|
"eval_loss": 0.6631330847740173, |
|
"eval_roc_auc": 0.639751552795031, |
|
"eval_runtime": 2.0574, |
|
"eval_samples_per_second": 20.414, |
|
"eval_steps_per_second": 1.458, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.22406639004149378, |
|
"eval_loss": 0.6598684191703796, |
|
"eval_roc_auc": 0.6433747412008283, |
|
"eval_runtime": 2.1618, |
|
"eval_samples_per_second": 19.428, |
|
"eval_steps_per_second": 1.388, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 16.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.23454157782515989, |
|
"eval_loss": 0.6574246287345886, |
|
"eval_roc_auc": 0.6565734989648033, |
|
"eval_runtime": 2.0709, |
|
"eval_samples_per_second": 20.281, |
|
"eval_steps_per_second": 1.449, |
|
"step": 23 |
|
}, |
|
{ |
|
"epoch": 17.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24017467248908297, |
|
"eval_loss": 0.6559909582138062, |
|
"eval_roc_auc": 0.6622670807453417, |
|
"eval_runtime": 2.2938, |
|
"eval_samples_per_second": 18.311, |
|
"eval_steps_per_second": 1.308, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 18.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.23399558498896247, |
|
"eval_loss": 0.6524508595466614, |
|
"eval_roc_auc": 0.6519151138716356, |
|
"eval_runtime": 2.1408, |
|
"eval_samples_per_second": 19.619, |
|
"eval_steps_per_second": 1.401, |
|
"step": 26 |
|
}, |
|
{ |
|
"epoch": 19.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24608501118568235, |
|
"eval_loss": 0.650789737701416, |
|
"eval_roc_auc": 0.6679606625258798, |
|
"eval_runtime": 2.1461, |
|
"eval_samples_per_second": 19.571, |
|
"eval_steps_per_second": 1.398, |
|
"step": 27 |
|
}, |
|
{ |
|
"epoch": 20.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24074074074074073, |
|
"eval_loss": 0.6483226418495178, |
|
"eval_roc_auc": 0.6563146997929606, |
|
"eval_runtime": 2.2028, |
|
"eval_samples_per_second": 19.067, |
|
"eval_steps_per_second": 1.362, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 21.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24545454545454545, |
|
"eval_loss": 0.6458417177200317, |
|
"eval_roc_auc": 0.6651138716356108, |
|
"eval_runtime": 2.2709, |
|
"eval_samples_per_second": 18.495, |
|
"eval_steps_per_second": 1.321, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 22.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.24601366742596809, |
|
"eval_loss": 0.644438624382019, |
|
"eval_roc_auc": 0.665631469979296, |
|
"eval_runtime": 2.1455, |
|
"eval_samples_per_second": 19.576, |
|
"eval_steps_per_second": 1.398, |
|
"step": 31 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.25116279069767444, |
|
"eval_loss": 0.6407680511474609, |
|
"eval_roc_auc": 0.6702898550724637, |
|
"eval_runtime": 2.3067, |
|
"eval_samples_per_second": 18.208, |
|
"eval_steps_per_second": 1.301, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 24.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2523809523809524, |
|
"eval_loss": 0.6386719346046448, |
|
"eval_roc_auc": 0.6689958592132504, |
|
"eval_runtime": 2.1261, |
|
"eval_samples_per_second": 19.754, |
|
"eval_steps_per_second": 1.411, |
|
"step": 34 |
|
}, |
|
{ |
|
"epoch": 25.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2579075425790754, |
|
"eval_loss": 0.6363871693611145, |
|
"eval_roc_auc": 0.6736542443064182, |
|
"eval_runtime": 2.0731, |
|
"eval_samples_per_second": 20.259, |
|
"eval_steps_per_second": 1.447, |
|
"step": 35 |
|
}, |
|
{ |
|
"epoch": 26.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2706766917293233, |
|
"eval_loss": 0.633211076259613, |
|
"eval_roc_auc": 0.686335403726708, |
|
"eval_runtime": 2.1802, |
|
"eval_samples_per_second": 19.264, |
|
"eval_steps_per_second": 1.376, |
|
"step": 37 |
|
}, |
|
{ |
|
"epoch": 27.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.26153846153846155, |
|
"eval_loss": 0.6316937208175659, |
|
"eval_roc_auc": 0.671583850931677, |
|
"eval_runtime": 2.2588, |
|
"eval_samples_per_second": 18.594, |
|
"eval_steps_per_second": 1.328, |
|
"step": 38 |
|
}, |
|
{ |
|
"epoch": 28.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.26666666666666666, |
|
"eval_loss": 0.6295819878578186, |
|
"eval_roc_auc": 0.6780538302277432, |
|
"eval_runtime": 2.0803, |
|
"eval_samples_per_second": 20.189, |
|
"eval_steps_per_second": 1.442, |
|
"step": 39 |
|
}, |
|
{ |
|
"epoch": 29.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2819843342036553, |
|
"eval_loss": 0.6249864101409912, |
|
"eval_roc_auc": 0.6946169772256728, |
|
"eval_runtime": 2.1933, |
|
"eval_samples_per_second": 19.149, |
|
"eval_steps_per_second": 1.368, |
|
"step": 41 |
|
}, |
|
{ |
|
"epoch": 30.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2872340425531915, |
|
"eval_loss": 0.624562680721283, |
|
"eval_roc_auc": 0.6982401656314701, |
|
"eval_runtime": 2.1386, |
|
"eval_samples_per_second": 19.639, |
|
"eval_steps_per_second": 1.403, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2936288088642659, |
|
"eval_loss": 0.6203415393829346, |
|
"eval_roc_auc": 0.6995341614906833, |
|
"eval_runtime": 2.0334, |
|
"eval_samples_per_second": 20.655, |
|
"eval_steps_per_second": 1.475, |
|
"step": 44 |
|
}, |
|
{ |
|
"epoch": 32.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.27932960893854747, |
|
"eval_loss": 0.619665265083313, |
|
"eval_roc_auc": 0.6816770186335404, |
|
"eval_runtime": 2.2329, |
|
"eval_samples_per_second": 18.809, |
|
"eval_steps_per_second": 1.344, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 33.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2832861189801699, |
|
"eval_loss": 0.6191604733467102, |
|
"eval_roc_auc": 0.6842650103519669, |
|
"eval_runtime": 2.1287, |
|
"eval_samples_per_second": 19.73, |
|
"eval_steps_per_second": 1.409, |
|
"step": 46 |
|
}, |
|
{ |
|
"epoch": 34.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.29059829059829057, |
|
"eval_loss": 0.6188385486602783, |
|
"eval_roc_auc": 0.6917701863354038, |
|
"eval_runtime": 1.9704, |
|
"eval_samples_per_second": 21.316, |
|
"eval_steps_per_second": 1.523, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 35.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.2994350282485876, |
|
"eval_loss": 0.6187217831611633, |
|
"eval_roc_auc": 0.7031573498964803, |
|
"eval_runtime": 2.1103, |
|
"eval_samples_per_second": 19.902, |
|
"eval_steps_per_second": 1.422, |
|
"step": 49 |
|
}, |
|
{ |
|
"epoch": 36.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.29394812680115273, |
|
"eval_loss": 0.6172403693199158, |
|
"eval_roc_auc": 0.6938405797101449, |
|
"eval_runtime": 2.0512, |
|
"eval_samples_per_second": 20.476, |
|
"eval_steps_per_second": 1.463, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 37.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3072289156626506, |
|
"eval_loss": 0.6139649748802185, |
|
"eval_roc_auc": 0.7016045548654244, |
|
"eval_runtime": 2.0138, |
|
"eval_samples_per_second": 20.857, |
|
"eval_steps_per_second": 1.49, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 38.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.30538922155688625, |
|
"eval_loss": 0.6133411526679993, |
|
"eval_roc_auc": 0.7005693581780539, |
|
"eval_runtime": 2.1136, |
|
"eval_samples_per_second": 19.871, |
|
"eval_steps_per_second": 1.419, |
|
"step": 53 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3081570996978852, |
|
"eval_loss": 0.6092615723609924, |
|
"eval_roc_auc": 0.7021221532091098, |
|
"eval_runtime": 2.0132, |
|
"eval_samples_per_second": 20.863, |
|
"eval_steps_per_second": 1.49, |
|
"step": 55 |
|
}, |
|
{ |
|
"epoch": 40.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3151515151515151, |
|
"eval_loss": 0.6076943278312683, |
|
"eval_roc_auc": 0.7091097308488613, |
|
"eval_runtime": 2.0499, |
|
"eval_samples_per_second": 20.489, |
|
"eval_steps_per_second": 1.463, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 41.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.31097560975609756, |
|
"eval_loss": 0.6047279238700867, |
|
"eval_roc_auc": 0.7036749482401656, |
|
"eval_runtime": 2.2835, |
|
"eval_samples_per_second": 18.392, |
|
"eval_steps_per_second": 1.314, |
|
"step": 57 |
|
}, |
|
{ |
|
"epoch": 42.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3164556962025316, |
|
"eval_loss": 0.6036221385002136, |
|
"eval_roc_auc": 0.7034161490683231, |
|
"eval_runtime": 1.9891, |
|
"eval_samples_per_second": 21.115, |
|
"eval_steps_per_second": 1.508, |
|
"step": 59 |
|
}, |
|
{ |
|
"epoch": 43.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.33116883116883117, |
|
"eval_loss": 0.6039034128189087, |
|
"eval_roc_auc": 0.7140269151138717, |
|
"eval_runtime": 2.2035, |
|
"eval_samples_per_second": 19.061, |
|
"eval_steps_per_second": 1.361, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 44.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.32258064516129037, |
|
"eval_loss": 0.6021687984466553, |
|
"eval_roc_auc": 0.7065217391304347, |
|
"eval_runtime": 1.9925, |
|
"eval_samples_per_second": 21.079, |
|
"eval_steps_per_second": 1.506, |
|
"step": 61 |
|
}, |
|
{ |
|
"epoch": 45.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.326797385620915, |
|
"eval_loss": 0.6014130711555481, |
|
"eval_roc_auc": 0.708592132505176, |
|
"eval_runtime": 2.0419, |
|
"eval_samples_per_second": 20.569, |
|
"eval_steps_per_second": 1.469, |
|
"step": 63 |
|
}, |
|
{ |
|
"epoch": 46.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3130990415335463, |
|
"eval_loss": 0.6009289622306824, |
|
"eval_roc_auc": 0.6984989648033127, |
|
"eval_runtime": 1.9923, |
|
"eval_samples_per_second": 21.081, |
|
"eval_steps_per_second": 1.506, |
|
"step": 64 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3411371237458194, |
|
"eval_loss": 0.5962069034576416, |
|
"eval_roc_auc": 0.7186853002070394, |
|
"eval_runtime": 2.2383, |
|
"eval_samples_per_second": 18.764, |
|
"eval_steps_per_second": 1.34, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 48.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.34576271186440677, |
|
"eval_loss": 0.5965468287467957, |
|
"eval_roc_auc": 0.7207556935817806, |
|
"eval_runtime": 2.0677, |
|
"eval_samples_per_second": 20.312, |
|
"eval_steps_per_second": 1.451, |
|
"step": 67 |
|
}, |
|
{ |
|
"epoch": 49.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.341296928327645, |
|
"eval_loss": 0.5968855023384094, |
|
"eval_roc_auc": 0.7153209109730849, |
|
"eval_runtime": 2.0241, |
|
"eval_samples_per_second": 20.75, |
|
"eval_steps_per_second": 1.482, |
|
"step": 68 |
|
}, |
|
{ |
|
"epoch": 50.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.34, |
|
"eval_loss": 0.593564510345459, |
|
"eval_roc_auc": 0.7181677018633541, |
|
"eval_runtime": 2.0433, |
|
"eval_samples_per_second": 20.555, |
|
"eval_steps_per_second": 1.468, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 51.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3411371237458194, |
|
"eval_loss": 0.591184139251709, |
|
"eval_roc_auc": 0.7186853002070394, |
|
"eval_runtime": 2.0663, |
|
"eval_samples_per_second": 20.326, |
|
"eval_steps_per_second": 1.452, |
|
"step": 71 |
|
}, |
|
{ |
|
"epoch": 52.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3310344827586207, |
|
"eval_loss": 0.592108428478241, |
|
"eval_roc_auc": 0.7039337474120083, |
|
"eval_runtime": 2.2694, |
|
"eval_samples_per_second": 18.507, |
|
"eval_steps_per_second": 1.322, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 53.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.34657039711191334, |
|
"eval_loss": 0.5902323722839355, |
|
"eval_roc_auc": 0.7106625258799172, |
|
"eval_runtime": 2.0722, |
|
"eval_samples_per_second": 20.269, |
|
"eval_steps_per_second": 1.448, |
|
"step": 74 |
|
}, |
|
{ |
|
"epoch": 54.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.34306569343065696, |
|
"eval_loss": 0.5893351435661316, |
|
"eval_roc_auc": 0.7057453416149069, |
|
"eval_runtime": 2.055, |
|
"eval_samples_per_second": 20.438, |
|
"eval_steps_per_second": 1.46, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3404255319148936, |
|
"eval_loss": 0.5895388722419739, |
|
"eval_roc_auc": 0.7080745341614907, |
|
"eval_runtime": 2.0467, |
|
"eval_samples_per_second": 20.52, |
|
"eval_steps_per_second": 1.466, |
|
"step": 77 |
|
}, |
|
{ |
|
"epoch": 56.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3252595155709343, |
|
"eval_loss": 0.5894604921340942, |
|
"eval_roc_auc": 0.6979813664596274, |
|
"eval_runtime": 2.1145, |
|
"eval_samples_per_second": 19.863, |
|
"eval_steps_per_second": 1.419, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 57.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.35294117647058826, |
|
"eval_loss": 0.5903995037078857, |
|
"eval_roc_auc": 0.7238612836438924, |
|
"eval_runtime": 2.1187, |
|
"eval_samples_per_second": 19.824, |
|
"eval_steps_per_second": 1.416, |
|
"step": 79 |
|
}, |
|
{ |
|
"epoch": 58.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.33793103448275863, |
|
"eval_loss": 0.5916685461997986, |
|
"eval_roc_auc": 0.7104037267080746, |
|
"eval_runtime": 2.1241, |
|
"eval_samples_per_second": 19.773, |
|
"eval_steps_per_second": 1.412, |
|
"step": 81 |
|
}, |
|
{ |
|
"epoch": 59.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3298245614035088, |
|
"eval_loss": 0.5893025994300842, |
|
"eval_roc_auc": 0.7000517598343685, |
|
"eval_runtime": 2.1145, |
|
"eval_samples_per_second": 19.863, |
|
"eval_steps_per_second": 1.419, |
|
"step": 82 |
|
}, |
|
{ |
|
"epoch": 60.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.36823104693140796, |
|
"eval_loss": 0.5839800238609314, |
|
"eval_roc_auc": 0.7300724637681159, |
|
"eval_runtime": 2.0295, |
|
"eval_samples_per_second": 20.695, |
|
"eval_steps_per_second": 1.478, |
|
"step": 83 |
|
}, |
|
{ |
|
"epoch": 61.82, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3636363636363636, |
|
"eval_loss": 0.5821632146835327, |
|
"eval_roc_auc": 0.7246376811594203, |
|
"eval_runtime": 2.1312, |
|
"eval_samples_per_second": 19.707, |
|
"eval_steps_per_second": 1.408, |
|
"step": 85 |
|
}, |
|
{ |
|
"epoch": 62.55, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.35507246376811596, |
|
"eval_loss": 0.5816187858581543, |
|
"eval_roc_auc": 0.7176501035196688, |
|
"eval_runtime": 2.1966, |
|
"eval_samples_per_second": 19.121, |
|
"eval_steps_per_second": 1.366, |
|
"step": 86 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.34532374100719426, |
|
"eval_loss": 0.5823355317115784, |
|
"eval_roc_auc": 0.7101449275362319, |
|
"eval_runtime": 2.4993, |
|
"eval_samples_per_second": 16.804, |
|
"eval_steps_per_second": 1.2, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 64.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3537906137184116, |
|
"eval_loss": 0.5836206674575806, |
|
"eval_roc_auc": 0.7171325051759834, |
|
"eval_runtime": 1.9876, |
|
"eval_samples_per_second": 21.131, |
|
"eval_steps_per_second": 1.509, |
|
"step": 89 |
|
}, |
|
{ |
|
"epoch": 65.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.36823104693140796, |
|
"eval_loss": 0.5811671018600464, |
|
"eval_roc_auc": 0.7300724637681159, |
|
"eval_runtime": 2.2487, |
|
"eval_samples_per_second": 18.677, |
|
"eval_steps_per_second": 1.334, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 66.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.35294117647058826, |
|
"eval_loss": 0.5822634100914001, |
|
"eval_roc_auc": 0.7132505175983437, |
|
"eval_runtime": 2.1189, |
|
"eval_samples_per_second": 19.821, |
|
"eval_steps_per_second": 1.416, |
|
"step": 92 |
|
}, |
|
{ |
|
"epoch": 67.64, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3468634686346863, |
|
"eval_loss": 0.5832495093345642, |
|
"eval_roc_auc": 0.7072981366459627, |
|
"eval_runtime": 2.1564, |
|
"eval_samples_per_second": 19.477, |
|
"eval_steps_per_second": 1.391, |
|
"step": 93 |
|
}, |
|
{ |
|
"epoch": 68.36, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.34558823529411764, |
|
"eval_loss": 0.5849612355232239, |
|
"eval_roc_auc": 0.7067805383022774, |
|
"eval_runtime": 2.2328, |
|
"eval_samples_per_second": 18.811, |
|
"eval_steps_per_second": 1.344, |
|
"step": 94 |
|
}, |
|
{ |
|
"epoch": 69.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.35125448028673834, |
|
"eval_loss": 0.5786746144294739, |
|
"eval_roc_auc": 0.7160973084886129, |
|
"eval_runtime": 2.0885, |
|
"eval_samples_per_second": 20.11, |
|
"eval_steps_per_second": 1.436, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 70.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3695652173913044, |
|
"eval_loss": 0.5768818855285645, |
|
"eval_roc_auc": 0.7305900621118012, |
|
"eval_runtime": 2.1063, |
|
"eval_samples_per_second": 19.94, |
|
"eval_steps_per_second": 1.424, |
|
"step": 97 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3684210526315789, |
|
"eval_loss": 0.5726543068885803, |
|
"eval_roc_auc": 0.7228260869565218, |
|
"eval_runtime": 2.2057, |
|
"eval_samples_per_second": 19.042, |
|
"eval_steps_per_second": 1.36, |
|
"step": 99 |
|
}, |
|
{ |
|
"epoch": 72.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3863636363636363, |
|
"eval_loss": 0.5710762739181519, |
|
"eval_roc_auc": 0.736801242236025, |
|
"eval_runtime": 2.1542, |
|
"eval_samples_per_second": 19.496, |
|
"eval_steps_per_second": 1.393, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 73.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.37037037037037035, |
|
"eval_loss": 0.5743962526321411, |
|
"eval_roc_auc": 0.7272256728778468, |
|
"eval_runtime": 2.0601, |
|
"eval_samples_per_second": 20.387, |
|
"eval_steps_per_second": 1.456, |
|
"step": 101 |
|
}, |
|
{ |
|
"epoch": 74.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.36363636363636365, |
|
"eval_loss": 0.5718241333961487, |
|
"eval_roc_auc": 0.7173913043478259, |
|
"eval_runtime": 2.3822, |
|
"eval_samples_per_second": 17.631, |
|
"eval_steps_per_second": 1.259, |
|
"step": 103 |
|
}, |
|
{ |
|
"epoch": 75.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.36296296296296293, |
|
"eval_loss": 0.5745264887809753, |
|
"eval_roc_auc": 0.7207556935817806, |
|
"eval_runtime": 2.1941, |
|
"eval_samples_per_second": 19.143, |
|
"eval_steps_per_second": 1.367, |
|
"step": 104 |
|
}, |
|
{ |
|
"epoch": 76.36, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3676470588235294, |
|
"eval_loss": 0.5776281952857971, |
|
"eval_roc_auc": 0.7261904761904763, |
|
"eval_runtime": 2.4317, |
|
"eval_samples_per_second": 17.272, |
|
"eval_steps_per_second": 1.234, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 77.82, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.36296296296296293, |
|
"eval_loss": 0.5703898668289185, |
|
"eval_roc_auc": 0.7207556935817806, |
|
"eval_runtime": 2.0787, |
|
"eval_samples_per_second": 20.205, |
|
"eval_steps_per_second": 1.443, |
|
"step": 107 |
|
}, |
|
{ |
|
"epoch": 78.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.37547892720306514, |
|
"eval_loss": 0.5683363676071167, |
|
"eval_roc_auc": 0.7254140786749483, |
|
"eval_runtime": 2.2741, |
|
"eval_samples_per_second": 18.469, |
|
"eval_steps_per_second": 1.319, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.41600000000000004, |
|
"eval_loss": 0.5640491247177124, |
|
"eval_roc_auc": 0.7505175983436853, |
|
"eval_runtime": 2.3409, |
|
"eval_samples_per_second": 17.941, |
|
"eval_steps_per_second": 1.282, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 80.73, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.38095238095238093, |
|
"eval_loss": 0.5674084424972534, |
|
"eval_roc_auc": 0.7236024844720497, |
|
"eval_runtime": 2.19, |
|
"eval_samples_per_second": 19.178, |
|
"eval_steps_per_second": 1.37, |
|
"step": 111 |
|
}, |
|
{ |
|
"epoch": 81.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3730158730158731, |
|
"eval_loss": 0.564328670501709, |
|
"eval_roc_auc": 0.7171325051759834, |
|
"eval_runtime": 2.4742, |
|
"eval_samples_per_second": 16.975, |
|
"eval_steps_per_second": 1.213, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 82.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3813229571984436, |
|
"eval_loss": 0.5711435675621033, |
|
"eval_roc_auc": 0.7274844720496896, |
|
"eval_runtime": 2.1624, |
|
"eval_samples_per_second": 19.423, |
|
"eval_steps_per_second": 1.387, |
|
"step": 114 |
|
}, |
|
{ |
|
"epoch": 83.64, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.366412213740458, |
|
"eval_loss": 0.5771781206130981, |
|
"eval_roc_auc": 0.7184265010351967, |
|
"eval_runtime": 2.2132, |
|
"eval_samples_per_second": 18.977, |
|
"eval_steps_per_second": 1.356, |
|
"step": 115 |
|
}, |
|
{ |
|
"epoch": 84.36, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3582089552238805, |
|
"eval_loss": 0.5758051872253418, |
|
"eval_roc_auc": 0.7153209109730849, |
|
"eval_runtime": 2.2313, |
|
"eval_samples_per_second": 18.823, |
|
"eval_steps_per_second": 1.345, |
|
"step": 116 |
|
}, |
|
{ |
|
"epoch": 85.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.37209302325581395, |
|
"eval_loss": 0.5687234401702881, |
|
"eval_roc_auc": 0.7204968944099378, |
|
"eval_runtime": 2.117, |
|
"eval_samples_per_second": 19.839, |
|
"eval_steps_per_second": 1.417, |
|
"step": 118 |
|
}, |
|
{ |
|
"epoch": 86.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3904382470119522, |
|
"eval_loss": 0.565062403678894, |
|
"eval_roc_auc": 0.7305900621118013, |
|
"eval_runtime": 2.145, |
|
"eval_samples_per_second": 19.58, |
|
"eval_steps_per_second": 1.399, |
|
"step": 119 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.4, |
|
"eval_loss": 0.5594702959060669, |
|
"eval_roc_auc": 0.7375776397515528, |
|
"eval_runtime": 2.141, |
|
"eval_samples_per_second": 19.617, |
|
"eval_steps_per_second": 1.401, |
|
"step": 121 |
|
}, |
|
{ |
|
"epoch": 88.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.421875, |
|
"eval_loss": 0.5597259998321533, |
|
"eval_roc_auc": 0.760351966873706, |
|
"eval_runtime": 2.2421, |
|
"eval_samples_per_second": 18.733, |
|
"eval_steps_per_second": 1.338, |
|
"step": 122 |
|
}, |
|
{ |
|
"epoch": 89.45, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.4156862745098039, |
|
"eval_loss": 0.5603341460227966, |
|
"eval_roc_auc": 0.754399585921325, |
|
"eval_runtime": 2.1509, |
|
"eval_samples_per_second": 19.527, |
|
"eval_steps_per_second": 1.395, |
|
"step": 123 |
|
}, |
|
{ |
|
"epoch": 90.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.4108527131782946, |
|
"eval_loss": 0.554810643196106, |
|
"eval_roc_auc": 0.7528467908902691, |
|
"eval_runtime": 2.0949, |
|
"eval_samples_per_second": 20.049, |
|
"eval_steps_per_second": 1.432, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 91.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.41406249999999994, |
|
"eval_loss": 0.55705326795578, |
|
"eval_roc_auc": 0.7538819875776397, |
|
"eval_runtime": 2.1818, |
|
"eval_samples_per_second": 19.25, |
|
"eval_steps_per_second": 1.375, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 92.36, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.40476190476190477, |
|
"eval_loss": 0.5568869709968567, |
|
"eval_roc_auc": 0.7430124223602484, |
|
"eval_runtime": 2.1783, |
|
"eval_samples_per_second": 19.281, |
|
"eval_steps_per_second": 1.377, |
|
"step": 127 |
|
}, |
|
{ |
|
"epoch": 93.82, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.41732283464566927, |
|
"eval_loss": 0.5582275986671448, |
|
"eval_roc_auc": 0.7549171842650103, |
|
"eval_runtime": 2.1395, |
|
"eval_samples_per_second": 19.63, |
|
"eval_steps_per_second": 1.402, |
|
"step": 129 |
|
}, |
|
{ |
|
"epoch": 94.55, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.40310077519379844, |
|
"eval_loss": 0.561271071434021, |
|
"eval_roc_auc": 0.7463768115942029, |
|
"eval_runtime": 2.1505, |
|
"eval_samples_per_second": 19.53, |
|
"eval_steps_per_second": 1.395, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.40800000000000003, |
|
"eval_loss": 0.5574062466621399, |
|
"eval_roc_auc": 0.7440476190476191, |
|
"eval_runtime": 2.2873, |
|
"eval_samples_per_second": 18.362, |
|
"eval_steps_per_second": 1.312, |
|
"step": 132 |
|
}, |
|
{ |
|
"epoch": 96.73, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.421875, |
|
"eval_loss": 0.5570902228355408, |
|
"eval_roc_auc": 0.760351966873706, |
|
"eval_runtime": 2.2328, |
|
"eval_samples_per_second": 18.81, |
|
"eval_steps_per_second": 1.344, |
|
"step": 133 |
|
}, |
|
{ |
|
"epoch": 97.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.41732283464566927, |
|
"eval_loss": 0.5585192441940308, |
|
"eval_roc_auc": 0.7549171842650103, |
|
"eval_runtime": 2.1462, |
|
"eval_samples_per_second": 19.569, |
|
"eval_steps_per_second": 1.398, |
|
"step": 134 |
|
}, |
|
{ |
|
"epoch": 98.91, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.40625, |
|
"eval_loss": 0.5598769783973694, |
|
"eval_roc_auc": 0.7474120082815735, |
|
"eval_runtime": 2.1253, |
|
"eval_samples_per_second": 19.762, |
|
"eval_steps_per_second": 1.412, |
|
"step": 136 |
|
}, |
|
{ |
|
"epoch": 99.64, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.40476190476190477, |
|
"eval_loss": 0.5586134195327759, |
|
"eval_roc_auc": 0.7430124223602484, |
|
"eval_runtime": 2.1887, |
|
"eval_samples_per_second": 19.189, |
|
"eval_steps_per_second": 1.371, |
|
"step": 137 |
|
}, |
|
{ |
|
"epoch": 100.36, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.4112903225806452, |
|
"eval_loss": 0.5581173300743103, |
|
"eval_roc_auc": 0.7450828157349897, |
|
"eval_runtime": 2.1216, |
|
"eval_samples_per_second": 19.796, |
|
"eval_steps_per_second": 1.414, |
|
"step": 138 |
|
}, |
|
{ |
|
"epoch": 101.82, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.4117647058823529, |
|
"eval_loss": 0.554703414440155, |
|
"eval_roc_auc": 0.7373188405797102, |
|
"eval_runtime": 2.199, |
|
"eval_samples_per_second": 19.1, |
|
"eval_steps_per_second": 1.364, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 102.55, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.430379746835443, |
|
"eval_loss": 0.5479743480682373, |
|
"eval_roc_auc": 0.7507763975155279, |
|
"eval_runtime": 2.2214, |
|
"eval_samples_per_second": 18.907, |
|
"eval_steps_per_second": 1.35, |
|
"step": 141 |
|
}, |
|
{ |
|
"epoch": 104.0, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.43333333333333335, |
|
"eval_loss": 0.5521491169929504, |
|
"eval_roc_auc": 0.7556935817805382, |
|
"eval_runtime": 2.0733, |
|
"eval_samples_per_second": 20.258, |
|
"eval_steps_per_second": 1.447, |
|
"step": 143 |
|
}, |
|
{ |
|
"epoch": 104.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.4193548387096774, |
|
"eval_loss": 0.5539843440055847, |
|
"eval_roc_auc": 0.7515527950310559, |
|
"eval_runtime": 2.1533, |
|
"eval_samples_per_second": 19.505, |
|
"eval_steps_per_second": 1.393, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 105.45, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.4032921810699588, |
|
"eval_loss": 0.5572003126144409, |
|
"eval_roc_auc": 0.7347308488612837, |
|
"eval_runtime": 2.1589, |
|
"eval_samples_per_second": 19.454, |
|
"eval_steps_per_second": 1.39, |
|
"step": 145 |
|
}, |
|
{ |
|
"epoch": 106.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.40322580645161293, |
|
"eval_loss": 0.5563521981239319, |
|
"eval_roc_auc": 0.7386128364389234, |
|
"eval_runtime": 2.1472, |
|
"eval_samples_per_second": 19.561, |
|
"eval_steps_per_second": 1.397, |
|
"step": 147 |
|
}, |
|
{ |
|
"epoch": 107.64, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.39669421487603307, |
|
"eval_loss": 0.5568532943725586, |
|
"eval_roc_auc": 0.7287784679089027, |
|
"eval_runtime": 2.2259, |
|
"eval_samples_per_second": 18.869, |
|
"eval_steps_per_second": 1.348, |
|
"step": 148 |
|
}, |
|
{ |
|
"epoch": 108.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.41201716738197425, |
|
"eval_loss": 0.557677149772644, |
|
"eval_roc_auc": 0.7334368530020704, |
|
"eval_runtime": 2.0947, |
|
"eval_samples_per_second": 20.051, |
|
"eval_steps_per_second": 1.432, |
|
"step": 149 |
|
}, |
|
{ |
|
"epoch": 109.82, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.39004149377593367, |
|
"eval_loss": 0.552203357219696, |
|
"eval_roc_auc": 0.7228260869565217, |
|
"eval_runtime": 2.2966, |
|
"eval_samples_per_second": 18.288, |
|
"eval_steps_per_second": 1.306, |
|
"step": 151 |
|
}, |
|
{ |
|
"epoch": 110.55, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.3949579831932773, |
|
"eval_loss": 0.5478394031524658, |
|
"eval_roc_auc": 0.7243788819875777, |
|
"eval_runtime": 2.2413, |
|
"eval_samples_per_second": 18.739, |
|
"eval_steps_per_second": 1.339, |
|
"step": 152 |
|
}, |
|
{ |
|
"epoch": 112.0, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.41841004184100417, |
|
"eval_loss": 0.5458911061286926, |
|
"eval_roc_auc": 0.7432712215320911, |
|
"eval_runtime": 2.2404, |
|
"eval_samples_per_second": 18.747, |
|
"eval_steps_per_second": 1.339, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 112.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.40506329113924044, |
|
"eval_loss": 0.5490586161613464, |
|
"eval_roc_auc": 0.731366459627329, |
|
"eval_runtime": 2.2886, |
|
"eval_samples_per_second": 18.352, |
|
"eval_steps_per_second": 1.311, |
|
"step": 155 |
|
}, |
|
{ |
|
"epoch": 113.45, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.41841004184100417, |
|
"eval_loss": 0.5519034266471863, |
|
"eval_roc_auc": 0.7432712215320911, |
|
"eval_runtime": 2.1727, |
|
"eval_samples_per_second": 19.331, |
|
"eval_steps_per_second": 1.381, |
|
"step": 156 |
|
}, |
|
{ |
|
"epoch": 114.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.3950617283950617, |
|
"eval_loss": 0.550848662853241, |
|
"eval_roc_auc": 0.7282608695652175, |
|
"eval_runtime": 2.5249, |
|
"eval_samples_per_second": 16.635, |
|
"eval_steps_per_second": 1.188, |
|
"step": 158 |
|
}, |
|
{ |
|
"epoch": 115.64, |
|
"eval_accuracy": 0.0, |
|
"eval_f1": 0.4032921810699588, |
|
"eval_loss": 0.5499736070632935, |
|
"eval_roc_auc": 0.7347308488612837, |
|
"eval_runtime": 2.203, |
|
"eval_samples_per_second": 19.065, |
|
"eval_steps_per_second": 1.362, |
|
"step": 159 |
|
}, |
|
{ |
|
"epoch": 116.36, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.38866396761133604, |
|
"eval_loss": 0.5513898134231567, |
|
"eval_roc_auc": 0.7261904761904762, |
|
"eval_runtime": 2.1649, |
|
"eval_samples_per_second": 19.4, |
|
"eval_steps_per_second": 1.386, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 117.82, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.4255319148936171, |
|
"eval_loss": 0.544844388961792, |
|
"eval_roc_auc": 0.7453416149068324, |
|
"eval_runtime": 2.2226, |
|
"eval_samples_per_second": 18.897, |
|
"eval_steps_per_second": 1.35, |
|
"step": 162 |
|
}, |
|
{ |
|
"epoch": 118.55, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.430379746835443, |
|
"eval_loss": 0.5451788306236267, |
|
"eval_roc_auc": 0.7507763975155279, |
|
"eval_runtime": 2.2158, |
|
"eval_samples_per_second": 18.955, |
|
"eval_steps_per_second": 1.354, |
|
"step": 163 |
|
}, |
|
{ |
|
"epoch": 120.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.43965517241379304, |
|
"eval_loss": 0.5420504212379456, |
|
"eval_roc_auc": 0.7533643892339544, |
|
"eval_runtime": 2.2713, |
|
"eval_samples_per_second": 18.492, |
|
"eval_steps_per_second": 1.321, |
|
"step": 165 |
|
}, |
|
{ |
|
"epoch": 120.73, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.43478260869565216, |
|
"eval_loss": 0.5413345098495483, |
|
"eval_roc_auc": 0.7479296066252589, |
|
"eval_runtime": 2.1593, |
|
"eval_samples_per_second": 19.451, |
|
"eval_steps_per_second": 1.389, |
|
"step": 166 |
|
}, |
|
{ |
|
"epoch": 121.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.42735042735042733, |
|
"eval_loss": 0.5442317724227905, |
|
"eval_roc_auc": 0.7458592132505176, |
|
"eval_runtime": 2.22, |
|
"eval_samples_per_second": 18.919, |
|
"eval_steps_per_second": 1.351, |
|
"step": 167 |
|
}, |
|
{ |
|
"epoch": 122.91, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.430379746835443, |
|
"eval_loss": 0.5420621037483215, |
|
"eval_roc_auc": 0.7507763975155279, |
|
"eval_runtime": 2.2358, |
|
"eval_samples_per_second": 18.785, |
|
"eval_steps_per_second": 1.342, |
|
"step": 169 |
|
}, |
|
{ |
|
"epoch": 123.64, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.42372881355932207, |
|
"eval_loss": 0.5403344035148621, |
|
"eval_roc_auc": 0.7448240165631471, |
|
"eval_runtime": 2.1592, |
|
"eval_samples_per_second": 19.451, |
|
"eval_steps_per_second": 1.389, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 124.36, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.43478260869565216, |
|
"eval_loss": 0.5386914014816284, |
|
"eval_roc_auc": 0.7479296066252589, |
|
"eval_runtime": 2.1762, |
|
"eval_samples_per_second": 19.3, |
|
"eval_steps_per_second": 1.379, |
|
"step": 171 |
|
}, |
|
{ |
|
"epoch": 125.82, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.42241379310344834, |
|
"eval_loss": 0.5383176207542419, |
|
"eval_roc_auc": 0.740424430641822, |
|
"eval_runtime": 2.3145, |
|
"eval_samples_per_second": 18.147, |
|
"eval_steps_per_second": 1.296, |
|
"step": 173 |
|
}, |
|
{ |
|
"epoch": 126.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.42290748898678415, |
|
"eval_loss": 0.5346717238426208, |
|
"eval_roc_auc": 0.7365424430641822, |
|
"eval_runtime": 2.2566, |
|
"eval_samples_per_second": 18.612, |
|
"eval_steps_per_second": 1.329, |
|
"step": 174 |
|
}, |
|
{ |
|
"epoch": 128.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.43478260869565216, |
|
"eval_loss": 0.5410609245300293, |
|
"eval_roc_auc": 0.7479296066252589, |
|
"eval_runtime": 2.2479, |
|
"eval_samples_per_second": 18.684, |
|
"eval_steps_per_second": 1.335, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 128.73, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.40869565217391307, |
|
"eval_loss": 0.5448868870735168, |
|
"eval_roc_auc": 0.72851966873706, |
|
"eval_runtime": 2.2593, |
|
"eval_samples_per_second": 18.59, |
|
"eval_steps_per_second": 1.328, |
|
"step": 177 |
|
}, |
|
{ |
|
"epoch": 129.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.4188034188034188, |
|
"eval_loss": 0.5426321029663086, |
|
"eval_roc_auc": 0.7393892339544514, |
|
"eval_runtime": 2.1827, |
|
"eval_samples_per_second": 19.242, |
|
"eval_steps_per_second": 1.374, |
|
"step": 178 |
|
}, |
|
{ |
|
"epoch": 130.91, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.4034334763948498, |
|
"eval_loss": 0.5429388880729675, |
|
"eval_roc_auc": 0.7269668737060041, |
|
"eval_runtime": 2.1992, |
|
"eval_samples_per_second": 19.098, |
|
"eval_steps_per_second": 1.364, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 131.64, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.4255319148936171, |
|
"eval_loss": 0.5380597710609436, |
|
"eval_roc_auc": 0.7453416149068324, |
|
"eval_runtime": 2.2546, |
|
"eval_samples_per_second": 18.628, |
|
"eval_steps_per_second": 1.331, |
|
"step": 181 |
|
}, |
|
{ |
|
"epoch": 132.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.4279475982532751, |
|
"eval_loss": 0.5344164967536926, |
|
"eval_roc_auc": 0.7419772256728779, |
|
"eval_runtime": 2.2146, |
|
"eval_samples_per_second": 18.965, |
|
"eval_steps_per_second": 1.355, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 133.82, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.39316239316239315, |
|
"eval_loss": 0.5364577174186707, |
|
"eval_roc_auc": 0.7199792960662525, |
|
"eval_runtime": 2.1956, |
|
"eval_samples_per_second": 19.129, |
|
"eval_steps_per_second": 1.366, |
|
"step": 184 |
|
}, |
|
{ |
|
"epoch": 134.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.40869565217391307, |
|
"eval_loss": 0.5361512303352356, |
|
"eval_roc_auc": 0.72851966873706, |
|
"eval_runtime": 2.2016, |
|
"eval_samples_per_second": 19.077, |
|
"eval_steps_per_second": 1.363, |
|
"step": 185 |
|
}, |
|
{ |
|
"epoch": 136.0, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.39999999999999997, |
|
"eval_loss": 0.5336142182350159, |
|
"eval_roc_auc": 0.7142857142857142, |
|
"eval_runtime": 2.176, |
|
"eval_samples_per_second": 19.302, |
|
"eval_steps_per_second": 1.379, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 136.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.42533936651583715, |
|
"eval_loss": 0.5356618762016296, |
|
"eval_roc_auc": 0.7331780538302277, |
|
"eval_runtime": 2.3066, |
|
"eval_samples_per_second": 18.209, |
|
"eval_steps_per_second": 1.301, |
|
"step": 188 |
|
}, |
|
{ |
|
"epoch": 137.45, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.4266666666666666, |
|
"eval_loss": 0.5409244894981384, |
|
"eval_roc_auc": 0.7375776397515528, |
|
"eval_runtime": 2.269, |
|
"eval_samples_per_second": 18.51, |
|
"eval_steps_per_second": 1.322, |
|
"step": 189 |
|
}, |
|
{ |
|
"epoch": 138.91, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.41558441558441556, |
|
"eval_loss": 0.5381691455841064, |
|
"eval_roc_auc": 0.7344720496894409, |
|
"eval_runtime": 2.2181, |
|
"eval_samples_per_second": 18.935, |
|
"eval_steps_per_second": 1.353, |
|
"step": 191 |
|
}, |
|
{ |
|
"epoch": 139.64, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.41558441558441556, |
|
"eval_loss": 0.5408413410186768, |
|
"eval_roc_auc": 0.7344720496894409, |
|
"eval_runtime": 2.1767, |
|
"eval_samples_per_second": 19.296, |
|
"eval_steps_per_second": 1.378, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 140.36, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.39473684210526316, |
|
"eval_loss": 0.54255610704422, |
|
"eval_roc_auc": 0.716614906832298, |
|
"eval_runtime": 2.3421, |
|
"eval_samples_per_second": 17.933, |
|
"eval_steps_per_second": 1.281, |
|
"step": 193 |
|
}, |
|
{ |
|
"epoch": 141.82, |
|
"eval_accuracy": 0.023809523809523808, |
|
"eval_f1": 0.38260869565217387, |
|
"eval_loss": 0.5436768531799316, |
|
"eval_roc_auc": 0.7091097308488613, |
|
"eval_runtime": 2.2168, |
|
"eval_samples_per_second": 18.946, |
|
"eval_steps_per_second": 1.353, |
|
"step": 195 |
|
}, |
|
{ |
|
"epoch": 142.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3876651982378855, |
|
"eval_loss": 0.540955662727356, |
|
"eval_roc_auc": 0.7106625258799172, |
|
"eval_runtime": 2.1746, |
|
"eval_samples_per_second": 19.314, |
|
"eval_steps_per_second": 1.38, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 144.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.3982683982683983, |
|
"eval_loss": 0.5399672389030457, |
|
"eval_roc_auc": 0.7215320910973085, |
|
"eval_runtime": 2.2745, |
|
"eval_samples_per_second": 18.466, |
|
"eval_steps_per_second": 1.319, |
|
"step": 198 |
|
}, |
|
{ |
|
"epoch": 144.73, |
|
"eval_accuracy": 0.047619047619047616, |
|
"eval_f1": 0.3859649122807018, |
|
"eval_loss": 0.5390969514846802, |
|
"eval_roc_auc": 0.7101449275362318, |
|
"eval_runtime": 2.3353, |
|
"eval_samples_per_second": 17.984, |
|
"eval_steps_per_second": 1.285, |
|
"step": 199 |
|
}, |
|
{ |
|
"epoch": 145.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.42290748898678415, |
|
"eval_loss": 0.5356051325798035, |
|
"eval_roc_auc": 0.7365424430641822, |
|
"eval_runtime": 2.238, |
|
"eval_samples_per_second": 18.767, |
|
"eval_steps_per_second": 1.34, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 146.91, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.41441441441441446, |
|
"eval_loss": 0.5343185663223267, |
|
"eval_roc_auc": 0.7261904761904762, |
|
"eval_runtime": 2.2389, |
|
"eval_samples_per_second": 18.759, |
|
"eval_steps_per_second": 1.34, |
|
"step": 202 |
|
}, |
|
{ |
|
"epoch": 147.64, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.42857142857142855, |
|
"eval_loss": 0.5286682844161987, |
|
"eval_roc_auc": 0.7380952380952381, |
|
"eval_runtime": 2.2757, |
|
"eval_samples_per_second": 18.456, |
|
"eval_steps_per_second": 1.318, |
|
"step": 203 |
|
}, |
|
{ |
|
"epoch": 148.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.41071428571428575, |
|
"eval_loss": 0.5306946635246277, |
|
"eval_roc_auc": 0.7251552795031057, |
|
"eval_runtime": 2.1874, |
|
"eval_samples_per_second": 19.201, |
|
"eval_steps_per_second": 1.372, |
|
"step": 204 |
|
}, |
|
{ |
|
"epoch": 149.82, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.4177777777777778, |
|
"eval_loss": 0.5335448384284973, |
|
"eval_roc_auc": 0.7311076604554866, |
|
"eval_runtime": 2.3633, |
|
"eval_samples_per_second": 17.772, |
|
"eval_steps_per_second": 1.269, |
|
"step": 206 |
|
}, |
|
{ |
|
"epoch": 150.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.4000000000000001, |
|
"eval_loss": 0.535821795463562, |
|
"eval_roc_auc": 0.7220496894409938, |
|
"eval_runtime": 2.1476, |
|
"eval_samples_per_second": 19.557, |
|
"eval_steps_per_second": 1.397, |
|
"step": 207 |
|
}, |
|
{ |
|
"epoch": 152.0, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.4052863436123348, |
|
"eval_loss": 0.5356825590133667, |
|
"eval_roc_auc": 0.7236024844720497, |
|
"eval_runtime": 2.2782, |
|
"eval_samples_per_second": 18.436, |
|
"eval_steps_per_second": 1.317, |
|
"step": 209 |
|
}, |
|
{ |
|
"epoch": 152.73, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.4069264069264069, |
|
"eval_loss": 0.5324029922485352, |
|
"eval_roc_auc": 0.7280020703933747, |
|
"eval_runtime": 2.2465, |
|
"eval_samples_per_second": 18.696, |
|
"eval_steps_per_second": 1.335, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 153.45, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.39316239316239315, |
|
"eval_loss": 0.5348923802375793, |
|
"eval_roc_auc": 0.7199792960662525, |
|
"eval_runtime": 2.1592, |
|
"eval_samples_per_second": 19.452, |
|
"eval_steps_per_second": 1.389, |
|
"step": 211 |
|
}, |
|
{ |
|
"epoch": 154.91, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.41379310344827586, |
|
"eval_loss": 0.5328140258789062, |
|
"eval_roc_auc": 0.7339544513457557, |
|
"eval_runtime": 2.1367, |
|
"eval_samples_per_second": 19.657, |
|
"eval_steps_per_second": 1.404, |
|
"step": 213 |
|
}, |
|
{ |
|
"epoch": 155.64, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.412280701754386, |
|
"eval_loss": 0.533903956413269, |
|
"eval_roc_auc": 0.7295548654244306, |
|
"eval_runtime": 2.1392, |
|
"eval_samples_per_second": 19.634, |
|
"eval_steps_per_second": 1.402, |
|
"step": 214 |
|
}, |
|
{ |
|
"epoch": 156.36, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.43049327354260086, |
|
"eval_loss": 0.5287569761276245, |
|
"eval_roc_auc": 0.7386128364389234, |
|
"eval_runtime": 2.3564, |
|
"eval_samples_per_second": 17.824, |
|
"eval_steps_per_second": 1.273, |
|
"step": 215 |
|
}, |
|
{ |
|
"epoch": 157.82, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.4272727272727273, |
|
"eval_loss": 0.5261039137840271, |
|
"eval_roc_auc": 0.733695652173913, |
|
"eval_runtime": 2.1573, |
|
"eval_samples_per_second": 19.469, |
|
"eval_steps_per_second": 1.391, |
|
"step": 217 |
|
}, |
|
{ |
|
"epoch": 158.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.42290748898678415, |
|
"eval_loss": 0.5312274694442749, |
|
"eval_roc_auc": 0.7365424430641822, |
|
"eval_runtime": 2.2337, |
|
"eval_samples_per_second": 18.803, |
|
"eval_steps_per_second": 1.343, |
|
"step": 218 |
|
}, |
|
{ |
|
"epoch": 160.0, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.40358744394618834, |
|
"eval_loss": 0.5341694951057434, |
|
"eval_roc_auc": 0.7192028985507245, |
|
"eval_runtime": 2.2456, |
|
"eval_samples_per_second": 18.703, |
|
"eval_steps_per_second": 1.336, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 160.73, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3981900452488688, |
|
"eval_loss": 0.5362971425056458, |
|
"eval_roc_auc": 0.7137681159420289, |
|
"eval_runtime": 2.212, |
|
"eval_samples_per_second": 18.988, |
|
"eval_steps_per_second": 1.356, |
|
"step": 221 |
|
}, |
|
{ |
|
"epoch": 161.45, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.41409691629955947, |
|
"eval_loss": 0.532296895980835, |
|
"eval_roc_auc": 0.730072463768116, |
|
"eval_runtime": 2.3611, |
|
"eval_samples_per_second": 17.788, |
|
"eval_steps_per_second": 1.271, |
|
"step": 222 |
|
}, |
|
{ |
|
"epoch": 162.91, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.41071428571428575, |
|
"eval_loss": 0.5253220796585083, |
|
"eval_roc_auc": 0.7251552795031057, |
|
"eval_runtime": 2.1376, |
|
"eval_samples_per_second": 19.648, |
|
"eval_steps_per_second": 1.403, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 163.64, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.4234234234234235, |
|
"eval_loss": 0.5222101807594299, |
|
"eval_roc_auc": 0.7326604554865425, |
|
"eval_runtime": 2.2698, |
|
"eval_samples_per_second": 18.504, |
|
"eval_steps_per_second": 1.322, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 164.36, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.412280701754386, |
|
"eval_loss": 0.5278355479240417, |
|
"eval_roc_auc": 0.7295548654244306, |
|
"eval_runtime": 2.2788, |
|
"eval_samples_per_second": 18.431, |
|
"eval_steps_per_second": 1.316, |
|
"step": 226 |
|
}, |
|
{ |
|
"epoch": 165.82, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.415929203539823, |
|
"eval_loss": 0.5236978530883789, |
|
"eval_roc_auc": 0.7305900621118012, |
|
"eval_runtime": 2.3596, |
|
"eval_samples_per_second": 17.8, |
|
"eval_steps_per_second": 1.271, |
|
"step": 228 |
|
}, |
|
{ |
|
"epoch": 166.55, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.42290748898678415, |
|
"eval_loss": 0.5267902612686157, |
|
"eval_roc_auc": 0.7365424430641822, |
|
"eval_runtime": 2.2183, |
|
"eval_samples_per_second": 18.933, |
|
"eval_steps_per_second": 1.352, |
|
"step": 229 |
|
}, |
|
{ |
|
"epoch": 168.0, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.39639639639639634, |
|
"eval_loss": 0.5275822877883911, |
|
"eval_roc_auc": 0.7132505175983436, |
|
"eval_runtime": 2.1555, |
|
"eval_samples_per_second": 19.485, |
|
"eval_steps_per_second": 1.392, |
|
"step": 231 |
|
}, |
|
{ |
|
"epoch": 168.73, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.41409691629955947, |
|
"eval_loss": 0.522292971611023, |
|
"eval_roc_auc": 0.730072463768116, |
|
"eval_runtime": 2.5244, |
|
"eval_samples_per_second": 16.638, |
|
"eval_steps_per_second": 1.188, |
|
"step": 232 |
|
}, |
|
{ |
|
"epoch": 169.45, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4177777777777778, |
|
"eval_loss": 0.5228198170661926, |
|
"eval_roc_auc": 0.7311076604554866, |
|
"eval_runtime": 2.2486, |
|
"eval_samples_per_second": 18.678, |
|
"eval_steps_per_second": 1.334, |
|
"step": 233 |
|
}, |
|
{ |
|
"epoch": 170.91, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4234234234234235, |
|
"eval_loss": 0.5201071500778198, |
|
"eval_roc_auc": 0.7326604554865425, |
|
"eval_runtime": 2.2664, |
|
"eval_samples_per_second": 18.531, |
|
"eval_steps_per_second": 1.324, |
|
"step": 235 |
|
}, |
|
{ |
|
"epoch": 171.64, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.42152466367713004, |
|
"eval_loss": 0.5248059034347534, |
|
"eval_roc_auc": 0.7321428571428572, |
|
"eval_runtime": 2.1597, |
|
"eval_samples_per_second": 19.447, |
|
"eval_steps_per_second": 1.389, |
|
"step": 236 |
|
}, |
|
{ |
|
"epoch": 172.36, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4125560538116592, |
|
"eval_loss": 0.5245119333267212, |
|
"eval_roc_auc": 0.7256728778467909, |
|
"eval_runtime": 2.2008, |
|
"eval_samples_per_second": 19.084, |
|
"eval_steps_per_second": 1.363, |
|
"step": 237 |
|
}, |
|
{ |
|
"epoch": 173.82, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4177777777777778, |
|
"eval_loss": 0.5223248600959778, |
|
"eval_roc_auc": 0.7311076604554866, |
|
"eval_runtime": 2.2306, |
|
"eval_samples_per_second": 18.829, |
|
"eval_steps_per_second": 1.345, |
|
"step": 239 |
|
}, |
|
{ |
|
"epoch": 174.55, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.409090909090909, |
|
"eval_loss": 0.5221878886222839, |
|
"eval_roc_auc": 0.7207556935817805, |
|
"eval_runtime": 2.2812, |
|
"eval_samples_per_second": 18.411, |
|
"eval_steps_per_second": 1.315, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 176.0, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.41628959276018096, |
|
"eval_loss": 0.5217894315719604, |
|
"eval_roc_auc": 0.7267080745341615, |
|
"eval_runtime": 2.3942, |
|
"eval_samples_per_second": 17.542, |
|
"eval_steps_per_second": 1.253, |
|
"step": 242 |
|
}, |
|
{ |
|
"epoch": 176.73, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.40540540540540543, |
|
"eval_loss": 0.5226414203643799, |
|
"eval_roc_auc": 0.7197204968944099, |
|
"eval_runtime": 2.1776, |
|
"eval_samples_per_second": 19.287, |
|
"eval_steps_per_second": 1.378, |
|
"step": 243 |
|
}, |
|
{ |
|
"epoch": 177.45, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.39823008849557523, |
|
"eval_loss": 0.5248770713806152, |
|
"eval_roc_auc": 0.7176501035196686, |
|
"eval_runtime": 2.26, |
|
"eval_samples_per_second": 18.584, |
|
"eval_steps_per_second": 1.327, |
|
"step": 244 |
|
}, |
|
{ |
|
"epoch": 178.91, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.4017857142857143, |
|
"eval_loss": 0.5241516828536987, |
|
"eval_roc_auc": 0.7186853002070392, |
|
"eval_runtime": 2.1743, |
|
"eval_samples_per_second": 19.317, |
|
"eval_steps_per_second": 1.38, |
|
"step": 246 |
|
}, |
|
{ |
|
"epoch": 179.64, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.38914027149321273, |
|
"eval_loss": 0.5245065093040466, |
|
"eval_roc_auc": 0.7072981366459626, |
|
"eval_runtime": 2.2384, |
|
"eval_samples_per_second": 18.763, |
|
"eval_steps_per_second": 1.34, |
|
"step": 247 |
|
}, |
|
{ |
|
"epoch": 180.36, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.39449541284403666, |
|
"eval_loss": 0.5249381065368652, |
|
"eval_roc_auc": 0.7088509316770186, |
|
"eval_runtime": 2.2201, |
|
"eval_samples_per_second": 18.918, |
|
"eval_steps_per_second": 1.351, |
|
"step": 248 |
|
}, |
|
{ |
|
"epoch": 181.82, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.4234234234234235, |
|
"eval_loss": 0.52437824010849, |
|
"eval_roc_auc": 0.7326604554865425, |
|
"eval_runtime": 2.2705, |
|
"eval_samples_per_second": 18.498, |
|
"eval_steps_per_second": 1.321, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 182.55, |
|
"eval_accuracy": 0.07142857142857142, |
|
"eval_f1": 0.409090909090909, |
|
"eval_loss": 0.5216240286827087, |
|
"eval_roc_auc": 0.7207556935817805, |
|
"eval_runtime": 2.238, |
|
"eval_samples_per_second": 18.767, |
|
"eval_steps_per_second": 1.34, |
|
"step": 251 |
|
}, |
|
{ |
|
"epoch": 184.0, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.40358744394618834, |
|
"eval_loss": 0.5211586952209473, |
|
"eval_roc_auc": 0.7192028985507245, |
|
"eval_runtime": 2.244, |
|
"eval_samples_per_second": 18.716, |
|
"eval_steps_per_second": 1.337, |
|
"step": 253 |
|
}, |
|
{ |
|
"epoch": 184.73, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.41628959276018096, |
|
"eval_loss": 0.5235975384712219, |
|
"eval_roc_auc": 0.7267080745341615, |
|
"eval_runtime": 2.1767, |
|
"eval_samples_per_second": 19.295, |
|
"eval_steps_per_second": 1.378, |
|
"step": 254 |
|
}, |
|
{ |
|
"epoch": 185.45, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.41441441441441446, |
|
"eval_loss": 0.5226503610610962, |
|
"eval_roc_auc": 0.7261904761904762, |
|
"eval_runtime": 2.3845, |
|
"eval_samples_per_second": 17.614, |
|
"eval_steps_per_second": 1.258, |
|
"step": 255 |
|
}, |
|
{ |
|
"epoch": 186.91, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.40540540540540543, |
|
"eval_loss": 0.5200766324996948, |
|
"eval_roc_auc": 0.7197204968944099, |
|
"eval_runtime": 2.2501, |
|
"eval_samples_per_second": 18.666, |
|
"eval_steps_per_second": 1.333, |
|
"step": 257 |
|
}, |
|
{ |
|
"epoch": 187.64, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_f1": 0.4181818181818182, |
|
"eval_loss": 0.5195832848548889, |
|
"eval_roc_auc": 0.7272256728778468, |
|
"eval_runtime": 2.2154, |
|
"eval_samples_per_second": 18.958, |
|
"eval_steps_per_second": 1.354, |
|
"step": 258 |
|
}, |
|
{ |
|
"epoch": 188.36, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_f1": 0.4177777777777778, |
|
"eval_loss": 0.5187467336654663, |
|
"eval_roc_auc": 0.7311076604554866, |
|
"eval_runtime": 2.2882, |
|
"eval_samples_per_second": 18.355, |
|
"eval_steps_per_second": 1.311, |
|
"step": 259 |
|
}, |
|
{ |
|
"epoch": 189.82, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4125560538116592, |
|
"eval_loss": 0.5165961384773254, |
|
"eval_roc_auc": 0.7256728778467909, |
|
"eval_runtime": 2.2388, |
|
"eval_samples_per_second": 18.76, |
|
"eval_steps_per_second": 1.34, |
|
"step": 261 |
|
}, |
|
{ |
|
"epoch": 190.55, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.3873873873873873, |
|
"eval_loss": 0.5241953730583191, |
|
"eval_roc_auc": 0.7067805383022774, |
|
"eval_runtime": 2.4908, |
|
"eval_samples_per_second": 16.862, |
|
"eval_steps_per_second": 1.204, |
|
"step": 262 |
|
}, |
|
{ |
|
"epoch": 192.0, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.42533936651583715, |
|
"eval_loss": 0.5164801478385925, |
|
"eval_roc_auc": 0.7331780538302277, |
|
"eval_runtime": 2.2626, |
|
"eval_samples_per_second": 18.563, |
|
"eval_steps_per_second": 1.326, |
|
"step": 264 |
|
}, |
|
{ |
|
"epoch": 192.73, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.43518518518518523, |
|
"eval_loss": 0.5178862810134888, |
|
"eval_roc_auc": 0.7357660455486543, |
|
"eval_runtime": 2.5128, |
|
"eval_samples_per_second": 16.714, |
|
"eval_steps_per_second": 1.194, |
|
"step": 265 |
|
}, |
|
{ |
|
"epoch": 193.45, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.42452830188679247, |
|
"eval_loss": 0.5133179426193237, |
|
"eval_roc_auc": 0.7248964803312629, |
|
"eval_runtime": 2.5865, |
|
"eval_samples_per_second": 16.238, |
|
"eval_steps_per_second": 1.16, |
|
"step": 266 |
|
}, |
|
{ |
|
"epoch": 194.91, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.42790697674418604, |
|
"eval_loss": 0.5165557861328125, |
|
"eval_roc_auc": 0.7298136645962733, |
|
"eval_runtime": 2.2181, |
|
"eval_samples_per_second": 18.935, |
|
"eval_steps_per_second": 1.353, |
|
"step": 268 |
|
}, |
|
{ |
|
"epoch": 195.64, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.4125560538116592, |
|
"eval_loss": 0.5179272294044495, |
|
"eval_roc_auc": 0.7256728778467909, |
|
"eval_runtime": 2.1768, |
|
"eval_samples_per_second": 19.294, |
|
"eval_steps_per_second": 1.378, |
|
"step": 269 |
|
}, |
|
{ |
|
"epoch": 196.36, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4311926605504587, |
|
"eval_loss": 0.5189908146858215, |
|
"eval_roc_auc": 0.7347308488612837, |
|
"eval_runtime": 2.1519, |
|
"eval_samples_per_second": 19.517, |
|
"eval_steps_per_second": 1.394, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 197.82, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.40552995391705066, |
|
"eval_loss": 0.5177509784698486, |
|
"eval_roc_auc": 0.7158385093167701, |
|
"eval_runtime": 2.24, |
|
"eval_samples_per_second": 18.75, |
|
"eval_steps_per_second": 1.339, |
|
"step": 272 |
|
}, |
|
{ |
|
"epoch": 198.55, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.40740740740740733, |
|
"eval_loss": 0.5172959566116333, |
|
"eval_roc_auc": 0.7163561076604554, |
|
"eval_runtime": 2.2769, |
|
"eval_samples_per_second": 18.447, |
|
"eval_steps_per_second": 1.318, |
|
"step": 273 |
|
}, |
|
{ |
|
"epoch": 200.0, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.39639639639639634, |
|
"eval_loss": 0.5173150897026062, |
|
"eval_roc_auc": 0.7132505175983436, |
|
"eval_runtime": 2.4473, |
|
"eval_samples_per_second": 17.162, |
|
"eval_steps_per_second": 1.226, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 200.73, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.41666666666666663, |
|
"eval_loss": 0.5198870897293091, |
|
"eval_roc_auc": 0.7228260869565216, |
|
"eval_runtime": 2.2209, |
|
"eval_samples_per_second": 18.911, |
|
"eval_steps_per_second": 1.351, |
|
"step": 276 |
|
}, |
|
{ |
|
"epoch": 201.45, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.3981900452488688, |
|
"eval_loss": 0.5189902186393738, |
|
"eval_roc_auc": 0.7137681159420289, |
|
"eval_runtime": 2.2872, |
|
"eval_samples_per_second": 18.363, |
|
"eval_steps_per_second": 1.312, |
|
"step": 277 |
|
}, |
|
{ |
|
"epoch": 202.91, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_f1": 0.42452830188679247, |
|
"eval_loss": 0.5163199305534363, |
|
"eval_roc_auc": 0.7248964803312629, |
|
"eval_runtime": 2.2888, |
|
"eval_samples_per_second": 18.35, |
|
"eval_steps_per_second": 1.311, |
|
"step": 279 |
|
}, |
|
{ |
|
"epoch": 203.64, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4170616113744076, |
|
"eval_loss": 0.5172598958015442, |
|
"eval_roc_auc": 0.7189440993788819, |
|
"eval_runtime": 2.2409, |
|
"eval_samples_per_second": 18.743, |
|
"eval_steps_per_second": 1.339, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 204.36, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_f1": 0.41314553990610325, |
|
"eval_loss": 0.5206424593925476, |
|
"eval_roc_auc": 0.7179089026915114, |
|
"eval_runtime": 2.2107, |
|
"eval_samples_per_second": 18.999, |
|
"eval_steps_per_second": 1.357, |
|
"step": 281 |
|
}, |
|
{ |
|
"epoch": 205.82, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.411214953271028, |
|
"eval_loss": 0.5185695886611938, |
|
"eval_roc_auc": 0.717391304347826, |
|
"eval_runtime": 2.2741, |
|
"eval_samples_per_second": 18.468, |
|
"eval_steps_per_second": 1.319, |
|
"step": 283 |
|
}, |
|
{ |
|
"epoch": 206.55, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.43317972350230416, |
|
"eval_loss": 0.5186063647270203, |
|
"eval_roc_auc": 0.735248447204969, |
|
"eval_runtime": 2.2252, |
|
"eval_samples_per_second": 18.875, |
|
"eval_steps_per_second": 1.348, |
|
"step": 284 |
|
}, |
|
{ |
|
"epoch": 208.0, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.39639639639639634, |
|
"eval_loss": 0.5183053016662598, |
|
"eval_roc_auc": 0.7132505175983436, |
|
"eval_runtime": 2.2662, |
|
"eval_samples_per_second": 18.533, |
|
"eval_steps_per_second": 1.324, |
|
"step": 286 |
|
}, |
|
{ |
|
"epoch": 208.73, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3946188340807175, |
|
"eval_loss": 0.5180411338806152, |
|
"eval_roc_auc": 0.7127329192546583, |
|
"eval_runtime": 2.1744, |
|
"eval_samples_per_second": 19.316, |
|
"eval_steps_per_second": 1.38, |
|
"step": 287 |
|
}, |
|
{ |
|
"epoch": 209.45, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.40930232558139534, |
|
"eval_loss": 0.5190138220787048, |
|
"eval_roc_auc": 0.7168737060041408, |
|
"eval_runtime": 2.2594, |
|
"eval_samples_per_second": 18.589, |
|
"eval_steps_per_second": 1.328, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 210.91, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3761467889908257, |
|
"eval_loss": 0.5196405053138733, |
|
"eval_roc_auc": 0.6959109730848861, |
|
"eval_runtime": 2.2692, |
|
"eval_samples_per_second": 18.509, |
|
"eval_steps_per_second": 1.322, |
|
"step": 290 |
|
}, |
|
{ |
|
"epoch": 211.64, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3981900452488688, |
|
"eval_loss": 0.5149042010307312, |
|
"eval_roc_auc": 0.7137681159420289, |
|
"eval_runtime": 2.2833, |
|
"eval_samples_per_second": 18.395, |
|
"eval_steps_per_second": 1.314, |
|
"step": 291 |
|
}, |
|
{ |
|
"epoch": 212.36, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.39285714285714285, |
|
"eval_loss": 0.5198233723640442, |
|
"eval_roc_auc": 0.7122153209109731, |
|
"eval_runtime": 2.5159, |
|
"eval_samples_per_second": 16.694, |
|
"eval_steps_per_second": 1.192, |
|
"step": 292 |
|
}, |
|
{ |
|
"epoch": 213.82, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3888888888888889, |
|
"eval_loss": 0.5179316401481628, |
|
"eval_roc_auc": 0.703416149068323, |
|
"eval_runtime": 2.3615, |
|
"eval_samples_per_second": 17.786, |
|
"eval_steps_per_second": 1.27, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 214.55, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3981900452488688, |
|
"eval_loss": 0.5147101879119873, |
|
"eval_roc_auc": 0.7137681159420289, |
|
"eval_runtime": 2.2382, |
|
"eval_samples_per_second": 18.765, |
|
"eval_steps_per_second": 1.34, |
|
"step": 295 |
|
}, |
|
{ |
|
"epoch": 216.0, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3870967741935484, |
|
"eval_loss": 0.5126305818557739, |
|
"eval_roc_auc": 0.7028985507246377, |
|
"eval_runtime": 2.2182, |
|
"eval_samples_per_second": 18.934, |
|
"eval_steps_per_second": 1.352, |
|
"step": 297 |
|
}, |
|
{ |
|
"epoch": 216.73, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.40740740740740733, |
|
"eval_loss": 0.5115792751312256, |
|
"eval_roc_auc": 0.7163561076604554, |
|
"eval_runtime": 2.1407, |
|
"eval_samples_per_second": 19.619, |
|
"eval_steps_per_second": 1.401, |
|
"step": 298 |
|
}, |
|
{ |
|
"epoch": 217.45, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4170616113744076, |
|
"eval_loss": 0.5107331275939941, |
|
"eval_roc_auc": 0.7189440993788819, |
|
"eval_runtime": 2.5127, |
|
"eval_samples_per_second": 16.715, |
|
"eval_steps_per_second": 1.194, |
|
"step": 299 |
|
}, |
|
{ |
|
"epoch": 218.91, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_f1": 0.41095890410958896, |
|
"eval_loss": 0.511676549911499, |
|
"eval_roc_auc": 0.7212732919254659, |
|
"eval_runtime": 2.3542, |
|
"eval_samples_per_second": 17.84, |
|
"eval_steps_per_second": 1.274, |
|
"step": 301 |
|
}, |
|
{ |
|
"epoch": 219.64, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_f1": 0.41666666666666663, |
|
"eval_loss": 0.5091940760612488, |
|
"eval_roc_auc": 0.7228260869565216, |
|
"eval_runtime": 2.1376, |
|
"eval_samples_per_second": 19.648, |
|
"eval_steps_per_second": 1.403, |
|
"step": 302 |
|
}, |
|
{ |
|
"epoch": 220.36, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.3873873873873873, |
|
"eval_loss": 0.5167934894561768, |
|
"eval_roc_auc": 0.7067805383022774, |
|
"eval_runtime": 2.2065, |
|
"eval_samples_per_second": 19.035, |
|
"eval_steps_per_second": 1.36, |
|
"step": 303 |
|
}, |
|
{ |
|
"epoch": 221.82, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.39069767441860465, |
|
"eval_loss": 0.5202212333679199, |
|
"eval_roc_auc": 0.7039337474120083, |
|
"eval_runtime": 2.483, |
|
"eval_samples_per_second": 16.915, |
|
"eval_steps_per_second": 1.208, |
|
"step": 305 |
|
}, |
|
{ |
|
"epoch": 222.55, |
|
"eval_accuracy": 0.09523809523809523, |
|
"eval_f1": 0.40740740740740733, |
|
"eval_loss": 0.5138672590255737, |
|
"eval_roc_auc": 0.7163561076604554, |
|
"eval_runtime": 2.2543, |
|
"eval_samples_per_second": 18.631, |
|
"eval_steps_per_second": 1.331, |
|
"step": 306 |
|
}, |
|
{ |
|
"epoch": 224.0, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.40552995391705066, |
|
"eval_loss": 0.5207112431526184, |
|
"eval_roc_auc": 0.7158385093167701, |
|
"eval_runtime": 2.3791, |
|
"eval_samples_per_second": 17.654, |
|
"eval_steps_per_second": 1.261, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 224.73, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4292237442922375, |
|
"eval_loss": 0.5156222581863403, |
|
"eval_roc_auc": 0.7342132505175983, |
|
"eval_runtime": 2.6317, |
|
"eval_samples_per_second": 15.96, |
|
"eval_steps_per_second": 1.14, |
|
"step": 309 |
|
}, |
|
{ |
|
"epoch": 225.45, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.4181818181818182, |
|
"eval_loss": 0.5122308731079102, |
|
"eval_roc_auc": 0.7272256728778468, |
|
"eval_runtime": 2.6565, |
|
"eval_samples_per_second": 15.81, |
|
"eval_steps_per_second": 1.129, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 226.91, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.40540540540540543, |
|
"eval_loss": 0.511935830116272, |
|
"eval_roc_auc": 0.7197204968944099, |
|
"eval_runtime": 2.4688, |
|
"eval_samples_per_second": 17.012, |
|
"eval_steps_per_second": 1.215, |
|
"step": 312 |
|
}, |
|
{ |
|
"epoch": 227.64, |
|
"eval_accuracy": 0.11904761904761904, |
|
"eval_f1": 0.41441441441441446, |
|
"eval_loss": 0.510082483291626, |
|
"eval_roc_auc": 0.7261904761904762, |
|
"eval_runtime": 2.2331, |
|
"eval_samples_per_second": 18.808, |
|
"eval_steps_per_second": 1.343, |
|
"step": 313 |
|
}, |
|
{ |
|
"epoch": 228.36, |
|
"eval_accuracy": 0.14285714285714285, |
|
"eval_f1": 0.4186046511627907, |
|
"eval_loss": 0.5066081285476685, |
|
"eval_roc_auc": 0.7233436853002071, |
|
"eval_runtime": 2.3108, |
|
"eval_samples_per_second": 18.176, |
|
"eval_steps_per_second": 1.298, |
|
"step": 314 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 400, |
|
"num_train_epochs": 400, |
|
"save_steps": 500, |
|
"total_flos": 2.136295306761339e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|