|
{ |
|
"best_metric": 0.8440366972477065, |
|
"best_model_checkpoint": "microsoft-resnet-50-cartoon-emotion-detection/checkpoint-528", |
|
"epoch": 79.96969696969697, |
|
"global_step": 640, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.97, |
|
"eval_accuracy": 0.22935779816513763, |
|
"eval_f1": 0.21647331951741566, |
|
"eval_loss": 1.3854628801345825, |
|
"eval_precision": 0.2697355008315897, |
|
"eval_recall": 0.22935779816513763, |
|
"eval_runtime": 6.0845, |
|
"eval_samples_per_second": 17.914, |
|
"eval_steps_per_second": 0.329, |
|
"step": 8 |
|
}, |
|
{ |
|
"epoch": 1.24, |
|
"learning_rate": 1.8750000000000002e-05, |
|
"loss": 1.4222, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 1.97, |
|
"eval_accuracy": 0.25688073394495414, |
|
"eval_f1": 0.25434987070599063, |
|
"eval_loss": 1.3791918754577637, |
|
"eval_precision": 0.2807708571335123, |
|
"eval_recall": 0.25688073394495414, |
|
"eval_runtime": 4.2925, |
|
"eval_samples_per_second": 25.393, |
|
"eval_steps_per_second": 0.466, |
|
"step": 16 |
|
}, |
|
{ |
|
"epoch": 2.48, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 1.4183, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 2.97, |
|
"eval_accuracy": 0.3853211009174312, |
|
"eval_f1": 0.3511144563688655, |
|
"eval_loss": 1.3646042346954346, |
|
"eval_precision": 0.4102155235182758, |
|
"eval_recall": 0.3853211009174312, |
|
"eval_runtime": 4.3579, |
|
"eval_samples_per_second": 25.012, |
|
"eval_steps_per_second": 0.459, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 3.73, |
|
"learning_rate": 5.625e-05, |
|
"loss": 1.4097, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 3.97, |
|
"eval_accuracy": 0.41284403669724773, |
|
"eval_f1": 0.32452248836490605, |
|
"eval_loss": 1.3562716245651245, |
|
"eval_precision": 0.5062447369587377, |
|
"eval_recall": 0.41284403669724773, |
|
"eval_runtime": 4.3612, |
|
"eval_samples_per_second": 24.993, |
|
"eval_steps_per_second": 0.459, |
|
"step": 32 |
|
}, |
|
{ |
|
"epoch": 4.97, |
|
"learning_rate": 7.500000000000001e-05, |
|
"loss": 1.3944, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 4.97, |
|
"eval_accuracy": 0.4036697247706422, |
|
"eval_f1": 0.293905028882093, |
|
"eval_loss": 1.3461558818817139, |
|
"eval_precision": 0.3927443217900042, |
|
"eval_recall": 0.4036697247706422, |
|
"eval_runtime": 4.4159, |
|
"eval_samples_per_second": 24.684, |
|
"eval_steps_per_second": 0.453, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 5.97, |
|
"eval_accuracy": 0.4036697247706422, |
|
"eval_f1": 0.2840541721275666, |
|
"eval_loss": 1.322252631187439, |
|
"eval_precision": 0.5152005756431013, |
|
"eval_recall": 0.4036697247706422, |
|
"eval_runtime": 4.2725, |
|
"eval_samples_per_second": 25.512, |
|
"eval_steps_per_second": 0.468, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 6.24, |
|
"learning_rate": 9.375e-05, |
|
"loss": 1.411, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 6.97, |
|
"eval_accuracy": 0.41284403669724773, |
|
"eval_f1": 0.29851761513413444, |
|
"eval_loss": 1.304025411605835, |
|
"eval_precision": 0.44039013993142434, |
|
"eval_recall": 0.41284403669724773, |
|
"eval_runtime": 4.4737, |
|
"eval_samples_per_second": 24.365, |
|
"eval_steps_per_second": 0.447, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 7.48, |
|
"learning_rate": 0.0001125, |
|
"loss": 1.346, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 7.97, |
|
"eval_accuracy": 0.4954128440366973, |
|
"eval_f1": 0.4092687533729088, |
|
"eval_loss": 1.2699785232543945, |
|
"eval_precision": 0.49603902723168775, |
|
"eval_recall": 0.4954128440366973, |
|
"eval_runtime": 4.5079, |
|
"eval_samples_per_second": 24.18, |
|
"eval_steps_per_second": 0.444, |
|
"step": 64 |
|
}, |
|
{ |
|
"epoch": 8.73, |
|
"learning_rate": 0.00011875000000000001, |
|
"loss": 1.3031, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 8.97, |
|
"eval_accuracy": 0.5596330275229358, |
|
"eval_f1": 0.46723852012270245, |
|
"eval_loss": 1.2149937152862549, |
|
"eval_precision": 0.5440134711415631, |
|
"eval_recall": 0.5596330275229358, |
|
"eval_runtime": 4.3712, |
|
"eval_samples_per_second": 24.936, |
|
"eval_steps_per_second": 0.458, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 9.97, |
|
"learning_rate": 0.00011666666666666667, |
|
"loss": 1.2371, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 9.97, |
|
"eval_accuracy": 0.5963302752293578, |
|
"eval_f1": 0.5100508405791544, |
|
"eval_loss": 1.1580270528793335, |
|
"eval_precision": 0.5659333353788879, |
|
"eval_recall": 0.5963302752293578, |
|
"eval_runtime": 4.2133, |
|
"eval_samples_per_second": 25.87, |
|
"eval_steps_per_second": 0.475, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 10.97, |
|
"eval_accuracy": 0.6055045871559633, |
|
"eval_f1": 0.5211004609031267, |
|
"eval_loss": 1.066982388496399, |
|
"eval_precision": 0.7279186904119446, |
|
"eval_recall": 0.6055045871559633, |
|
"eval_runtime": 14.5277, |
|
"eval_samples_per_second": 7.503, |
|
"eval_steps_per_second": 0.138, |
|
"step": 88 |
|
}, |
|
{ |
|
"epoch": 11.24, |
|
"learning_rate": 0.00011458333333333334, |
|
"loss": 1.1736, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 11.97, |
|
"eval_accuracy": 0.6605504587155964, |
|
"eval_f1": 0.5771675777046106, |
|
"eval_loss": 0.9855989813804626, |
|
"eval_precision": 0.5536726213674042, |
|
"eval_recall": 0.6605504587155964, |
|
"eval_runtime": 4.2828, |
|
"eval_samples_per_second": 25.451, |
|
"eval_steps_per_second": 0.467, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 12.48, |
|
"learning_rate": 0.0001125, |
|
"loss": 1.0457, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 12.97, |
|
"eval_accuracy": 0.6697247706422018, |
|
"eval_f1": 0.5964926350313968, |
|
"eval_loss": 0.896264374256134, |
|
"eval_precision": 0.763141515721791, |
|
"eval_recall": 0.6697247706422018, |
|
"eval_runtime": 4.2315, |
|
"eval_samples_per_second": 25.759, |
|
"eval_steps_per_second": 0.473, |
|
"step": 104 |
|
}, |
|
{ |
|
"epoch": 13.73, |
|
"learning_rate": 0.00011041666666666666, |
|
"loss": 0.953, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 13.97, |
|
"eval_accuracy": 0.6697247706422018, |
|
"eval_f1": 0.6081464096911078, |
|
"eval_loss": 0.8546512722969055, |
|
"eval_precision": 0.6884856947005512, |
|
"eval_recall": 0.6697247706422018, |
|
"eval_runtime": 4.4534, |
|
"eval_samples_per_second": 24.476, |
|
"eval_steps_per_second": 0.449, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 14.97, |
|
"learning_rate": 0.00010833333333333334, |
|
"loss": 0.8579, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 14.97, |
|
"eval_accuracy": 0.7155963302752294, |
|
"eval_f1": 0.6643295304342026, |
|
"eval_loss": 0.7848823070526123, |
|
"eval_precision": 0.7396182317656428, |
|
"eval_recall": 0.7155963302752294, |
|
"eval_runtime": 4.1662, |
|
"eval_samples_per_second": 26.163, |
|
"eval_steps_per_second": 0.48, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 15.97, |
|
"eval_accuracy": 0.7431192660550459, |
|
"eval_f1": 0.711852075310986, |
|
"eval_loss": 0.7563745379447937, |
|
"eval_precision": 0.7371817784661822, |
|
"eval_recall": 0.7431192660550459, |
|
"eval_runtime": 4.2674, |
|
"eval_samples_per_second": 25.542, |
|
"eval_steps_per_second": 0.469, |
|
"step": 128 |
|
}, |
|
{ |
|
"epoch": 16.24, |
|
"learning_rate": 0.00010625, |
|
"loss": 0.8167, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 16.97, |
|
"eval_accuracy": 0.7614678899082569, |
|
"eval_f1": 0.7210716889645992, |
|
"eval_loss": 0.7132583260536194, |
|
"eval_precision": 0.7506553079947577, |
|
"eval_recall": 0.7614678899082569, |
|
"eval_runtime": 4.1418, |
|
"eval_samples_per_second": 26.317, |
|
"eval_steps_per_second": 0.483, |
|
"step": 136 |
|
}, |
|
{ |
|
"epoch": 17.48, |
|
"learning_rate": 0.00010416666666666667, |
|
"loss": 0.7273, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 17.97, |
|
"eval_accuracy": 0.7522935779816514, |
|
"eval_f1": 0.7202155642522615, |
|
"eval_loss": 0.6887747645378113, |
|
"eval_precision": 0.7378685592291271, |
|
"eval_recall": 0.7522935779816514, |
|
"eval_runtime": 4.5118, |
|
"eval_samples_per_second": 24.159, |
|
"eval_steps_per_second": 0.443, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 18.73, |
|
"learning_rate": 0.00010208333333333334, |
|
"loss": 0.6547, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 18.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7576525411387797, |
|
"eval_loss": 0.659186065196991, |
|
"eval_precision": 0.7772903701802784, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.3816, |
|
"eval_samples_per_second": 24.877, |
|
"eval_steps_per_second": 0.456, |
|
"step": 152 |
|
}, |
|
{ |
|
"epoch": 19.97, |
|
"learning_rate": 0.0001, |
|
"loss": 0.5963, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 19.97, |
|
"eval_accuracy": 0.7706422018348624, |
|
"eval_f1": 0.7550663564666461, |
|
"eval_loss": 0.6136144399642944, |
|
"eval_precision": 0.764159781184113, |
|
"eval_recall": 0.7706422018348624, |
|
"eval_runtime": 4.2561, |
|
"eval_samples_per_second": 25.61, |
|
"eval_steps_per_second": 0.47, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 20.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7786916064255194, |
|
"eval_loss": 0.5723462700843811, |
|
"eval_precision": 0.7801645588430826, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 5.2546, |
|
"eval_samples_per_second": 20.744, |
|
"eval_steps_per_second": 0.381, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 21.24, |
|
"learning_rate": 9.791666666666667e-05, |
|
"loss": 0.551, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 21.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7780894219567608, |
|
"eval_loss": 0.5686229467391968, |
|
"eval_precision": 0.776092121476891, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.3144, |
|
"eval_samples_per_second": 25.264, |
|
"eval_steps_per_second": 0.464, |
|
"step": 176 |
|
}, |
|
{ |
|
"epoch": 22.48, |
|
"learning_rate": 9.583333333333334e-05, |
|
"loss": 0.4929, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 22.97, |
|
"eval_accuracy": 0.7706422018348624, |
|
"eval_f1": 0.7651464296127533, |
|
"eval_loss": 0.5596823692321777, |
|
"eval_precision": 0.7649127896435436, |
|
"eval_recall": 0.7706422018348624, |
|
"eval_runtime": 4.4326, |
|
"eval_samples_per_second": 24.59, |
|
"eval_steps_per_second": 0.451, |
|
"step": 184 |
|
}, |
|
{ |
|
"epoch": 23.73, |
|
"learning_rate": 9.375e-05, |
|
"loss": 0.4309, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 23.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.781022184850044, |
|
"eval_loss": 0.5233965516090393, |
|
"eval_precision": 0.7774110647118855, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.3167, |
|
"eval_samples_per_second": 25.251, |
|
"eval_steps_per_second": 0.463, |
|
"step": 192 |
|
}, |
|
{ |
|
"epoch": 24.97, |
|
"learning_rate": 9.166666666666667e-05, |
|
"loss": 0.3945, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 24.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7812909567496724, |
|
"eval_loss": 0.5007840991020203, |
|
"eval_precision": 0.7836723839914905, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.3513, |
|
"eval_samples_per_second": 25.05, |
|
"eval_steps_per_second": 0.46, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 25.97, |
|
"eval_accuracy": 0.7522935779816514, |
|
"eval_f1": 0.7528893125223401, |
|
"eval_loss": 0.5289302468299866, |
|
"eval_precision": 0.7537344154316632, |
|
"eval_recall": 0.7522935779816514, |
|
"eval_runtime": 4.3647, |
|
"eval_samples_per_second": 24.973, |
|
"eval_steps_per_second": 0.458, |
|
"step": 208 |
|
}, |
|
{ |
|
"epoch": 26.24, |
|
"learning_rate": 8.958333333333333e-05, |
|
"loss": 0.3704, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 26.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.7962706746091569, |
|
"eval_loss": 0.4399118423461914, |
|
"eval_precision": 0.7957732392169626, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.2147, |
|
"eval_samples_per_second": 25.862, |
|
"eval_steps_per_second": 0.475, |
|
"step": 216 |
|
}, |
|
{ |
|
"epoch": 27.48, |
|
"learning_rate": 8.75e-05, |
|
"loss": 0.3267, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 27.97, |
|
"eval_accuracy": 0.8073394495412844, |
|
"eval_f1": 0.8005365278178692, |
|
"eval_loss": 0.4539415240287781, |
|
"eval_precision": 0.7983420088683247, |
|
"eval_recall": 0.8073394495412844, |
|
"eval_runtime": 4.2272, |
|
"eval_samples_per_second": 25.785, |
|
"eval_steps_per_second": 0.473, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 28.73, |
|
"learning_rate": 8.541666666666668e-05, |
|
"loss": 0.2966, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 28.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7837137974455839, |
|
"eval_loss": 0.4734969735145569, |
|
"eval_precision": 0.789241175758926, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.2368, |
|
"eval_samples_per_second": 25.727, |
|
"eval_steps_per_second": 0.472, |
|
"step": 232 |
|
}, |
|
{ |
|
"epoch": 29.97, |
|
"learning_rate": 8.333333333333333e-05, |
|
"loss": 0.2645, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 29.97, |
|
"eval_accuracy": 0.7706422018348624, |
|
"eval_f1": 0.7706422018348624, |
|
"eval_loss": 0.4594463109970093, |
|
"eval_precision": 0.7706422018348624, |
|
"eval_recall": 0.7706422018348624, |
|
"eval_runtime": 4.3943, |
|
"eval_samples_per_second": 24.805, |
|
"eval_steps_per_second": 0.455, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 30.97, |
|
"eval_accuracy": 0.7522935779816514, |
|
"eval_f1": 0.7533140030125614, |
|
"eval_loss": 0.4698648750782013, |
|
"eval_precision": 0.7554437319096274, |
|
"eval_recall": 0.7522935779816514, |
|
"eval_runtime": 4.1296, |
|
"eval_samples_per_second": 26.394, |
|
"eval_steps_per_second": 0.484, |
|
"step": 248 |
|
}, |
|
{ |
|
"epoch": 31.24, |
|
"learning_rate": 8.125000000000001e-05, |
|
"loss": 0.2527, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 31.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7856523955147808, |
|
"eval_loss": 0.45513755083084106, |
|
"eval_precision": 0.785609816323817, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.1348, |
|
"eval_samples_per_second": 26.361, |
|
"eval_steps_per_second": 0.484, |
|
"step": 256 |
|
}, |
|
{ |
|
"epoch": 32.48, |
|
"learning_rate": 7.916666666666666e-05, |
|
"loss": 0.2202, |
|
"step": 260 |
|
}, |
|
{ |
|
"epoch": 32.97, |
|
"eval_accuracy": 0.8165137614678899, |
|
"eval_f1": 0.8170336224601304, |
|
"eval_loss": 0.4457748532295227, |
|
"eval_precision": 0.8197900424266599, |
|
"eval_recall": 0.8165137614678899, |
|
"eval_runtime": 5.1689, |
|
"eval_samples_per_second": 21.087, |
|
"eval_steps_per_second": 0.387, |
|
"step": 264 |
|
}, |
|
{ |
|
"epoch": 33.73, |
|
"learning_rate": 7.708333333333334e-05, |
|
"loss": 0.2006, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 33.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7850412357933325, |
|
"eval_loss": 0.46321260929107666, |
|
"eval_precision": 0.7940749153601442, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.2326, |
|
"eval_samples_per_second": 25.752, |
|
"eval_steps_per_second": 0.473, |
|
"step": 272 |
|
}, |
|
{ |
|
"epoch": 34.97, |
|
"learning_rate": 7.500000000000001e-05, |
|
"loss": 0.1589, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 34.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7925041274199247, |
|
"eval_loss": 0.46511203050613403, |
|
"eval_precision": 0.7993275970140749, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.1566, |
|
"eval_samples_per_second": 26.223, |
|
"eval_steps_per_second": 0.481, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 35.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7803733958918072, |
|
"eval_loss": 0.45948973298072815, |
|
"eval_precision": 0.7823930357635982, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.3202, |
|
"eval_samples_per_second": 25.23, |
|
"eval_steps_per_second": 0.463, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 36.24, |
|
"learning_rate": 7.291666666666666e-05, |
|
"loss": 0.153, |
|
"step": 290 |
|
}, |
|
{ |
|
"epoch": 36.97, |
|
"eval_accuracy": 0.7614678899082569, |
|
"eval_f1": 0.7632546001327497, |
|
"eval_loss": 0.458363801240921, |
|
"eval_precision": 0.7690950187958565, |
|
"eval_recall": 0.7614678899082569, |
|
"eval_runtime": 4.4275, |
|
"eval_samples_per_second": 24.619, |
|
"eval_steps_per_second": 0.452, |
|
"step": 296 |
|
}, |
|
{ |
|
"epoch": 37.48, |
|
"learning_rate": 7.083333333333334e-05, |
|
"loss": 0.1427, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 37.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7796360891921739, |
|
"eval_loss": 0.46078726649284363, |
|
"eval_precision": 0.782995656118911, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.4461, |
|
"eval_samples_per_second": 24.516, |
|
"eval_steps_per_second": 0.45, |
|
"step": 304 |
|
}, |
|
{ |
|
"epoch": 38.73, |
|
"learning_rate": 6.874999999999999e-05, |
|
"loss": 0.113, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 38.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7898954921921011, |
|
"eval_loss": 0.45713570713996887, |
|
"eval_precision": 0.7922270390160299, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.3087, |
|
"eval_samples_per_second": 25.297, |
|
"eval_steps_per_second": 0.464, |
|
"step": 312 |
|
}, |
|
{ |
|
"epoch": 39.97, |
|
"learning_rate": 6.666666666666667e-05, |
|
"loss": 0.1146, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 39.97, |
|
"eval_accuracy": 0.7614678899082569, |
|
"eval_f1": 0.7612891030218949, |
|
"eval_loss": 0.5269873142242432, |
|
"eval_precision": 0.765128347697155, |
|
"eval_recall": 0.7614678899082569, |
|
"eval_runtime": 4.2908, |
|
"eval_samples_per_second": 25.403, |
|
"eval_steps_per_second": 0.466, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 40.97, |
|
"eval_accuracy": 0.7706422018348624, |
|
"eval_f1": 0.7709516996486127, |
|
"eval_loss": 0.48878130316734314, |
|
"eval_precision": 0.7781771515945828, |
|
"eval_recall": 0.7706422018348624, |
|
"eval_runtime": 4.3303, |
|
"eval_samples_per_second": 25.171, |
|
"eval_steps_per_second": 0.462, |
|
"step": 328 |
|
}, |
|
{ |
|
"epoch": 41.24, |
|
"learning_rate": 6.458333333333334e-05, |
|
"loss": 0.1275, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 41.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7836706749228535, |
|
"eval_loss": 0.4523099958896637, |
|
"eval_precision": 0.780905883107718, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.2033, |
|
"eval_samples_per_second": 25.932, |
|
"eval_steps_per_second": 0.476, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 42.48, |
|
"learning_rate": 6.25e-05, |
|
"loss": 0.0959, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 42.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7767063396275014, |
|
"eval_loss": 0.46965503692626953, |
|
"eval_precision": 0.7753268138589239, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.3242, |
|
"eval_samples_per_second": 25.207, |
|
"eval_steps_per_second": 0.463, |
|
"step": 344 |
|
}, |
|
{ |
|
"epoch": 43.73, |
|
"learning_rate": 6.041666666666667e-05, |
|
"loss": 0.0882, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 43.97, |
|
"eval_accuracy": 0.7706422018348624, |
|
"eval_f1": 0.7685729724992435, |
|
"eval_loss": 0.4286104738712311, |
|
"eval_precision": 0.7685932721712537, |
|
"eval_recall": 0.7706422018348624, |
|
"eval_runtime": 4.4175, |
|
"eval_samples_per_second": 24.675, |
|
"eval_steps_per_second": 0.453, |
|
"step": 352 |
|
}, |
|
{ |
|
"epoch": 44.97, |
|
"learning_rate": 5.833333333333333e-05, |
|
"loss": 0.0847, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 44.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7925041274199247, |
|
"eval_loss": 0.5317460298538208, |
|
"eval_precision": 0.7993275970140749, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 6.0042, |
|
"eval_samples_per_second": 18.154, |
|
"eval_steps_per_second": 0.333, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 45.97, |
|
"eval_accuracy": 0.7614678899082569, |
|
"eval_f1": 0.7646893115457605, |
|
"eval_loss": 0.5431071519851685, |
|
"eval_precision": 0.7699552364490537, |
|
"eval_recall": 0.7614678899082569, |
|
"eval_runtime": 4.3547, |
|
"eval_samples_per_second": 25.03, |
|
"eval_steps_per_second": 0.459, |
|
"step": 368 |
|
}, |
|
{ |
|
"epoch": 46.24, |
|
"learning_rate": 5.625e-05, |
|
"loss": 0.0813, |
|
"step": 370 |
|
}, |
|
{ |
|
"epoch": 46.97, |
|
"eval_accuracy": 0.8256880733944955, |
|
"eval_f1": 0.8284158367266842, |
|
"eval_loss": 0.44316479563713074, |
|
"eval_precision": 0.843538901662607, |
|
"eval_recall": 0.8256880733944955, |
|
"eval_runtime": 4.2714, |
|
"eval_samples_per_second": 25.519, |
|
"eval_steps_per_second": 0.468, |
|
"step": 376 |
|
}, |
|
{ |
|
"epoch": 47.48, |
|
"learning_rate": 5.416666666666667e-05, |
|
"loss": 0.0768, |
|
"step": 380 |
|
}, |
|
{ |
|
"epoch": 47.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.7955546490941502, |
|
"eval_loss": 0.4885597229003906, |
|
"eval_precision": 0.8005162605636117, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.2576, |
|
"eval_samples_per_second": 25.602, |
|
"eval_steps_per_second": 0.47, |
|
"step": 384 |
|
}, |
|
{ |
|
"epoch": 48.73, |
|
"learning_rate": 5.208333333333334e-05, |
|
"loss": 0.0627, |
|
"step": 390 |
|
}, |
|
{ |
|
"epoch": 48.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.8009727230444837, |
|
"eval_loss": 0.5372528433799744, |
|
"eval_precision": 0.8071912929511652, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.3763, |
|
"eval_samples_per_second": 24.907, |
|
"eval_steps_per_second": 0.457, |
|
"step": 392 |
|
}, |
|
{ |
|
"epoch": 49.97, |
|
"learning_rate": 5e-05, |
|
"loss": 0.0688, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 49.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7822443312570955, |
|
"eval_loss": 0.5896694660186768, |
|
"eval_precision": 0.789232725399693, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.3692, |
|
"eval_samples_per_second": 24.947, |
|
"eval_steps_per_second": 0.458, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 50.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.7992371326578404, |
|
"eval_loss": 0.5114642977714539, |
|
"eval_precision": 0.8014849021031709, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.3028, |
|
"eval_samples_per_second": 25.332, |
|
"eval_steps_per_second": 0.465, |
|
"step": 408 |
|
}, |
|
{ |
|
"epoch": 51.24, |
|
"learning_rate": 4.791666666666667e-05, |
|
"loss": 0.0676, |
|
"step": 410 |
|
}, |
|
{ |
|
"epoch": 51.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.7977993643940755, |
|
"eval_loss": 0.4881470799446106, |
|
"eval_precision": 0.7998301588132414, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.3212, |
|
"eval_samples_per_second": 25.224, |
|
"eval_steps_per_second": 0.463, |
|
"step": 416 |
|
}, |
|
{ |
|
"epoch": 52.48, |
|
"learning_rate": 4.5833333333333334e-05, |
|
"loss": 0.0539, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 52.97, |
|
"eval_accuracy": 0.8073394495412844, |
|
"eval_f1": 0.807691055721277, |
|
"eval_loss": 0.4819609224796295, |
|
"eval_precision": 0.8138503399273244, |
|
"eval_recall": 0.8073394495412844, |
|
"eval_runtime": 4.3125, |
|
"eval_samples_per_second": 25.276, |
|
"eval_steps_per_second": 0.464, |
|
"step": 424 |
|
}, |
|
{ |
|
"epoch": 53.73, |
|
"learning_rate": 4.375e-05, |
|
"loss": 0.0596, |
|
"step": 430 |
|
}, |
|
{ |
|
"epoch": 53.97, |
|
"eval_accuracy": 0.8256880733944955, |
|
"eval_f1": 0.8244465797713664, |
|
"eval_loss": 0.4449571669101715, |
|
"eval_precision": 0.8245908379614004, |
|
"eval_recall": 0.8256880733944955, |
|
"eval_runtime": 5.8195, |
|
"eval_samples_per_second": 18.73, |
|
"eval_steps_per_second": 0.344, |
|
"step": 432 |
|
}, |
|
{ |
|
"epoch": 54.97, |
|
"learning_rate": 4.1666666666666665e-05, |
|
"loss": 0.0611, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 54.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7924465793472197, |
|
"eval_loss": 0.5057494044303894, |
|
"eval_precision": 0.8008019735410222, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.6616, |
|
"eval_samples_per_second": 23.383, |
|
"eval_steps_per_second": 0.429, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 55.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.8008031371900772, |
|
"eval_loss": 0.4918478727340698, |
|
"eval_precision": 0.8056331161636306, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.8639, |
|
"eval_samples_per_second": 22.41, |
|
"eval_steps_per_second": 0.411, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 56.24, |
|
"learning_rate": 3.958333333333333e-05, |
|
"loss": 0.0643, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 56.97, |
|
"eval_accuracy": 0.7522935779816514, |
|
"eval_f1": 0.7545272459450874, |
|
"eval_loss": 0.5946044325828552, |
|
"eval_precision": 0.7587394976605187, |
|
"eval_recall": 0.7522935779816514, |
|
"eval_runtime": 4.4153, |
|
"eval_samples_per_second": 24.687, |
|
"eval_steps_per_second": 0.453, |
|
"step": 456 |
|
}, |
|
{ |
|
"epoch": 57.48, |
|
"learning_rate": 3.7500000000000003e-05, |
|
"loss": 0.0605, |
|
"step": 460 |
|
}, |
|
{ |
|
"epoch": 57.97, |
|
"eval_accuracy": 0.8073394495412844, |
|
"eval_f1": 0.8120936083458042, |
|
"eval_loss": 0.4887966513633728, |
|
"eval_precision": 0.8238645162528876, |
|
"eval_recall": 0.8073394495412844, |
|
"eval_runtime": 6.6734, |
|
"eval_samples_per_second": 16.334, |
|
"eval_steps_per_second": 0.3, |
|
"step": 464 |
|
}, |
|
{ |
|
"epoch": 58.73, |
|
"learning_rate": 3.541666666666667e-05, |
|
"loss": 0.063, |
|
"step": 470 |
|
}, |
|
{ |
|
"epoch": 58.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7936673558168583, |
|
"eval_loss": 0.5916518568992615, |
|
"eval_precision": 0.8051419661311963, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.2726, |
|
"eval_samples_per_second": 25.511, |
|
"eval_steps_per_second": 0.468, |
|
"step": 472 |
|
}, |
|
{ |
|
"epoch": 59.97, |
|
"learning_rate": 3.3333333333333335e-05, |
|
"loss": 0.0595, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 59.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7894285298217145, |
|
"eval_loss": 0.5117025375366211, |
|
"eval_precision": 0.7904302906815871, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.4288, |
|
"eval_samples_per_second": 24.612, |
|
"eval_steps_per_second": 0.452, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 60.97, |
|
"eval_accuracy": 0.7614678899082569, |
|
"eval_f1": 0.7635438011331693, |
|
"eval_loss": 0.549720048904419, |
|
"eval_precision": 0.769159484755815, |
|
"eval_recall": 0.7614678899082569, |
|
"eval_runtime": 4.2635, |
|
"eval_samples_per_second": 25.566, |
|
"eval_steps_per_second": 0.469, |
|
"step": 488 |
|
}, |
|
{ |
|
"epoch": 61.24, |
|
"learning_rate": 3.125e-05, |
|
"loss": 0.0554, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 61.97, |
|
"eval_accuracy": 0.8165137614678899, |
|
"eval_f1": 0.812552773801982, |
|
"eval_loss": 0.4742366075515747, |
|
"eval_precision": 0.8100926678908328, |
|
"eval_recall": 0.8165137614678899, |
|
"eval_runtime": 4.3801, |
|
"eval_samples_per_second": 24.885, |
|
"eval_steps_per_second": 0.457, |
|
"step": 496 |
|
}, |
|
{ |
|
"epoch": 62.48, |
|
"learning_rate": 2.9166666666666666e-05, |
|
"loss": 0.0557, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 62.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7886246853481453, |
|
"eval_loss": 0.5369319915771484, |
|
"eval_precision": 0.7886251828214332, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.4776, |
|
"eval_samples_per_second": 24.343, |
|
"eval_steps_per_second": 0.447, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 63.73, |
|
"learning_rate": 2.7083333333333335e-05, |
|
"loss": 0.0539, |
|
"step": 510 |
|
}, |
|
{ |
|
"epoch": 63.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7898954921921011, |
|
"eval_loss": 0.5439756512641907, |
|
"eval_precision": 0.7922270390160299, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.4228, |
|
"eval_samples_per_second": 24.645, |
|
"eval_steps_per_second": 0.452, |
|
"step": 512 |
|
}, |
|
{ |
|
"epoch": 64.97, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.048, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 64.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7882784673502429, |
|
"eval_loss": 0.5923751592636108, |
|
"eval_precision": 0.7878178107535906, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 5.5392, |
|
"eval_samples_per_second": 19.678, |
|
"eval_steps_per_second": 0.361, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 65.97, |
|
"eval_accuracy": 0.8440366972477065, |
|
"eval_f1": 0.8440366972477065, |
|
"eval_loss": 0.486260324716568, |
|
"eval_precision": 0.8440366972477065, |
|
"eval_recall": 0.8440366972477065, |
|
"eval_runtime": 4.2084, |
|
"eval_samples_per_second": 25.9, |
|
"eval_steps_per_second": 0.475, |
|
"step": 528 |
|
}, |
|
{ |
|
"epoch": 66.24, |
|
"learning_rate": 2.2916666666666667e-05, |
|
"loss": 0.045, |
|
"step": 530 |
|
}, |
|
{ |
|
"epoch": 66.97, |
|
"eval_accuracy": 0.8073394495412844, |
|
"eval_f1": 0.8046694749207712, |
|
"eval_loss": 0.5849686861038208, |
|
"eval_precision": 0.8076432996157767, |
|
"eval_recall": 0.8073394495412844, |
|
"eval_runtime": 4.3405, |
|
"eval_samples_per_second": 25.112, |
|
"eval_steps_per_second": 0.461, |
|
"step": 536 |
|
}, |
|
{ |
|
"epoch": 67.48, |
|
"learning_rate": 2.0833333333333333e-05, |
|
"loss": 0.047, |
|
"step": 540 |
|
}, |
|
{ |
|
"epoch": 67.97, |
|
"eval_accuracy": 0.8256880733944955, |
|
"eval_f1": 0.8227139701424718, |
|
"eval_loss": 0.4938836991786957, |
|
"eval_precision": 0.8211639886949021, |
|
"eval_recall": 0.8256880733944955, |
|
"eval_runtime": 4.2943, |
|
"eval_samples_per_second": 25.382, |
|
"eval_steps_per_second": 0.466, |
|
"step": 544 |
|
}, |
|
{ |
|
"epoch": 68.73, |
|
"learning_rate": 1.8750000000000002e-05, |
|
"loss": 0.0412, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 68.97, |
|
"eval_accuracy": 0.7889908256880734, |
|
"eval_f1": 0.7899819010172877, |
|
"eval_loss": 0.4850451946258545, |
|
"eval_precision": 0.7911629060252914, |
|
"eval_recall": 0.7889908256880734, |
|
"eval_runtime": 4.3733, |
|
"eval_samples_per_second": 24.924, |
|
"eval_steps_per_second": 0.457, |
|
"step": 552 |
|
}, |
|
{ |
|
"epoch": 69.97, |
|
"learning_rate": 1.6666666666666667e-05, |
|
"loss": 0.0392, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 69.97, |
|
"eval_accuracy": 0.8256880733944955, |
|
"eval_f1": 0.8257529642156887, |
|
"eval_loss": 0.5065794587135315, |
|
"eval_precision": 0.8264957264957264, |
|
"eval_recall": 0.8256880733944955, |
|
"eval_runtime": 4.2901, |
|
"eval_samples_per_second": 25.407, |
|
"eval_steps_per_second": 0.466, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 70.97, |
|
"eval_accuracy": 0.8073394495412844, |
|
"eval_f1": 0.8058135764557783, |
|
"eval_loss": 0.49649733304977417, |
|
"eval_precision": 0.8053007135575942, |
|
"eval_recall": 0.8073394495412844, |
|
"eval_runtime": 4.1424, |
|
"eval_samples_per_second": 26.313, |
|
"eval_steps_per_second": 0.483, |
|
"step": 568 |
|
}, |
|
{ |
|
"epoch": 71.24, |
|
"learning_rate": 1.4583333333333333e-05, |
|
"loss": 0.0423, |
|
"step": 570 |
|
}, |
|
{ |
|
"epoch": 71.97, |
|
"eval_accuracy": 0.8348623853211009, |
|
"eval_f1": 0.8350885030999028, |
|
"eval_loss": 0.47168704867362976, |
|
"eval_precision": 0.8376424034680915, |
|
"eval_recall": 0.8348623853211009, |
|
"eval_runtime": 4.1897, |
|
"eval_samples_per_second": 26.016, |
|
"eval_steps_per_second": 0.477, |
|
"step": 576 |
|
}, |
|
{ |
|
"epoch": 72.48, |
|
"learning_rate": 1.25e-05, |
|
"loss": 0.0471, |
|
"step": 580 |
|
}, |
|
{ |
|
"epoch": 72.97, |
|
"eval_accuracy": 0.8256880733944955, |
|
"eval_f1": 0.8295520158325865, |
|
"eval_loss": 0.48450949788093567, |
|
"eval_precision": 0.837811160528748, |
|
"eval_recall": 0.8256880733944955, |
|
"eval_runtime": 4.2446, |
|
"eval_samples_per_second": 25.68, |
|
"eval_steps_per_second": 0.471, |
|
"step": 584 |
|
}, |
|
{ |
|
"epoch": 73.73, |
|
"learning_rate": 1.0416666666666666e-05, |
|
"loss": 0.0322, |
|
"step": 590 |
|
}, |
|
{ |
|
"epoch": 73.97, |
|
"eval_accuracy": 0.7706422018348624, |
|
"eval_f1": 0.7692886041532689, |
|
"eval_loss": 0.5188109278678894, |
|
"eval_precision": 0.7689271840647987, |
|
"eval_recall": 0.7706422018348624, |
|
"eval_runtime": 4.4833, |
|
"eval_samples_per_second": 24.313, |
|
"eval_steps_per_second": 0.446, |
|
"step": 592 |
|
}, |
|
{ |
|
"epoch": 74.97, |
|
"learning_rate": 8.333333333333334e-06, |
|
"loss": 0.042, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 74.97, |
|
"eval_accuracy": 0.7706422018348624, |
|
"eval_f1": 0.7700888306392893, |
|
"eval_loss": 0.5242283940315247, |
|
"eval_precision": 0.7698942959712803, |
|
"eval_recall": 0.7706422018348624, |
|
"eval_runtime": 4.4923, |
|
"eval_samples_per_second": 24.264, |
|
"eval_steps_per_second": 0.445, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 75.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7803733958918072, |
|
"eval_loss": 0.5945499539375305, |
|
"eval_precision": 0.7823930357635982, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 5.1633, |
|
"eval_samples_per_second": 21.111, |
|
"eval_steps_per_second": 0.387, |
|
"step": 608 |
|
}, |
|
{ |
|
"epoch": 76.24, |
|
"learning_rate": 6.25e-06, |
|
"loss": 0.0416, |
|
"step": 610 |
|
}, |
|
{ |
|
"epoch": 76.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.7993445642022374, |
|
"eval_loss": 0.5432426929473877, |
|
"eval_precision": 0.8038185145085823, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.2234, |
|
"eval_samples_per_second": 25.809, |
|
"eval_steps_per_second": 0.474, |
|
"step": 616 |
|
}, |
|
{ |
|
"epoch": 77.48, |
|
"learning_rate": 4.166666666666667e-06, |
|
"loss": 0.0399, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 77.97, |
|
"eval_accuracy": 0.7981651376146789, |
|
"eval_f1": 0.7994120087594209, |
|
"eval_loss": 0.5381362438201904, |
|
"eval_precision": 0.8072242548450546, |
|
"eval_recall": 0.7981651376146789, |
|
"eval_runtime": 4.2152, |
|
"eval_samples_per_second": 25.859, |
|
"eval_steps_per_second": 0.474, |
|
"step": 624 |
|
}, |
|
{ |
|
"epoch": 78.73, |
|
"learning_rate": 2.0833333333333334e-06, |
|
"loss": 0.0439, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 78.97, |
|
"eval_accuracy": 0.7798165137614679, |
|
"eval_f1": 0.7827462243679189, |
|
"eval_loss": 0.6181262135505676, |
|
"eval_precision": 0.7877941763063422, |
|
"eval_recall": 0.7798165137614679, |
|
"eval_runtime": 4.2424, |
|
"eval_samples_per_second": 25.693, |
|
"eval_steps_per_second": 0.471, |
|
"step": 632 |
|
}, |
|
{ |
|
"epoch": 79.97, |
|
"learning_rate": 0.0, |
|
"loss": 0.0462, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 79.97, |
|
"eval_accuracy": 0.8165137614678899, |
|
"eval_f1": 0.8172526992448356, |
|
"eval_loss": 0.48008766770362854, |
|
"eval_precision": 0.8181998512273742, |
|
"eval_recall": 0.8165137614678899, |
|
"eval_runtime": 4.18, |
|
"eval_samples_per_second": 26.076, |
|
"eval_steps_per_second": 0.478, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 79.97, |
|
"step": 640, |
|
"total_flos": 3.5167284631649157e+18, |
|
"train_loss": 0.37728101573884487, |
|
"train_runtime": 2345.4183, |
|
"train_samples_per_second": 70.606, |
|
"train_steps_per_second": 0.273 |
|
} |
|
], |
|
"max_steps": 640, |
|
"num_train_epochs": 80, |
|
"total_flos": 3.5167284631649157e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|