|
{ |
|
"best_metric": 0.6672587329780936, |
|
"best_model_checkpoint": "Distilled-Melanoma-Classification-MobileNetV2/checkpoint-60792", |
|
"epoch": 30.0, |
|
"eval_steps": 500, |
|
"global_step": 75990, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 4.8333333333333334e-05, |
|
"loss": 1.9302, |
|
"step": 2533 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.551805802249852, |
|
"eval_loss": 1.6089619398117065, |
|
"eval_runtime": 454.9672, |
|
"eval_samples_per_second": 11.137, |
|
"eval_steps_per_second": 1.394, |
|
"step": 2533 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 4.666666666666667e-05, |
|
"loss": 1.6357, |
|
"step": 5066 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.5964081310440102, |
|
"eval_loss": 1.3391807079315186, |
|
"eval_runtime": 461.1878, |
|
"eval_samples_per_second": 10.987, |
|
"eval_steps_per_second": 1.375, |
|
"step": 5066 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 4.5e-05, |
|
"loss": 1.5009, |
|
"step": 7599 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.6208802052496546, |
|
"eval_loss": 1.2432700395584106, |
|
"eval_runtime": 461.7485, |
|
"eval_samples_per_second": 10.974, |
|
"eval_steps_per_second": 1.373, |
|
"step": 7599 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"learning_rate": 4.3333333333333334e-05, |
|
"loss": 1.4095, |
|
"step": 10132 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.6246299585553582, |
|
"eval_loss": 1.3341896533966064, |
|
"eval_runtime": 455.3869, |
|
"eval_samples_per_second": 11.127, |
|
"eval_steps_per_second": 1.392, |
|
"step": 10132 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"learning_rate": 4.166666666666667e-05, |
|
"loss": 1.33, |
|
"step": 12665 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.6445628577067298, |
|
"eval_loss": 1.154502511024475, |
|
"eval_runtime": 456.8814, |
|
"eval_samples_per_second": 11.09, |
|
"eval_steps_per_second": 1.388, |
|
"step": 12665 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"learning_rate": 4e-05, |
|
"loss": 1.2499, |
|
"step": 15198 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.6329188869153345, |
|
"eval_loss": 1.3197146654129028, |
|
"eval_runtime": 470.1267, |
|
"eval_samples_per_second": 10.778, |
|
"eval_steps_per_second": 1.349, |
|
"step": 15198 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"learning_rate": 3.8333333333333334e-05, |
|
"loss": 1.1881, |
|
"step": 17731 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.6538385632524176, |
|
"eval_loss": 1.0565587282180786, |
|
"eval_runtime": 468.3787, |
|
"eval_samples_per_second": 10.818, |
|
"eval_steps_per_second": 1.354, |
|
"step": 17731 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"learning_rate": 3.6666666666666666e-05, |
|
"loss": 1.1184, |
|
"step": 20264 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.6660746003552398, |
|
"eval_loss": 1.036229133605957, |
|
"eval_runtime": 466.4784, |
|
"eval_samples_per_second": 10.862, |
|
"eval_steps_per_second": 1.359, |
|
"step": 20264 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"learning_rate": 3.5e-05, |
|
"loss": 1.0487, |
|
"step": 22797 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.648707321886718, |
|
"eval_loss": 1.2400047779083252, |
|
"eval_runtime": 466.581, |
|
"eval_samples_per_second": 10.86, |
|
"eval_steps_per_second": 1.359, |
|
"step": 22797 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"learning_rate": 3.3333333333333335e-05, |
|
"loss": 0.9876, |
|
"step": 25330 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.6571936056838366, |
|
"eval_loss": 1.0631685256958008, |
|
"eval_runtime": 466.0607, |
|
"eval_samples_per_second": 10.872, |
|
"eval_steps_per_second": 1.36, |
|
"step": 25330 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"learning_rate": 3.1666666666666666e-05, |
|
"loss": 0.9002, |
|
"step": 27863 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.6473258338267219, |
|
"eval_loss": 1.1159186363220215, |
|
"eval_runtime": 466.1714, |
|
"eval_samples_per_second": 10.869, |
|
"eval_steps_per_second": 1.36, |
|
"step": 27863 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"learning_rate": 3e-05, |
|
"loss": 0.8309, |
|
"step": 30396 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.6311426879810539, |
|
"eval_loss": 1.2457987070083618, |
|
"eval_runtime": 477.2863, |
|
"eval_samples_per_second": 10.616, |
|
"eval_steps_per_second": 1.328, |
|
"step": 30396 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"learning_rate": 2.8333333333333335e-05, |
|
"loss": 0.7729, |
|
"step": 32929 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.6425893033353068, |
|
"eval_loss": 1.2415727376937866, |
|
"eval_runtime": 468.9202, |
|
"eval_samples_per_second": 10.806, |
|
"eval_steps_per_second": 1.352, |
|
"step": 32929 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"learning_rate": 2.6666666666666667e-05, |
|
"loss": 0.7069, |
|
"step": 35462 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.6492993881981448, |
|
"eval_loss": 1.1467454433441162, |
|
"eval_runtime": 463.7522, |
|
"eval_samples_per_second": 10.926, |
|
"eval_steps_per_second": 1.367, |
|
"step": 35462 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"learning_rate": 2.5e-05, |
|
"loss": 0.6519, |
|
"step": 37995 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.6573909611209788, |
|
"eval_loss": 1.2422680854797363, |
|
"eval_runtime": 464.9266, |
|
"eval_samples_per_second": 10.898, |
|
"eval_steps_per_second": 1.364, |
|
"step": 37995 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"learning_rate": 2.3333333333333336e-05, |
|
"loss": 0.5956, |
|
"step": 40528 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.6498914545095718, |
|
"eval_loss": 1.2838796377182007, |
|
"eval_runtime": 477.5194, |
|
"eval_samples_per_second": 10.611, |
|
"eval_steps_per_second": 1.328, |
|
"step": 40528 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"learning_rate": 2.1666666666666667e-05, |
|
"loss": 0.5531, |
|
"step": 43061 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.6591671600552595, |
|
"eval_loss": 1.228452444076538, |
|
"eval_runtime": 479.3427, |
|
"eval_samples_per_second": 10.571, |
|
"eval_steps_per_second": 1.323, |
|
"step": 43061 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"learning_rate": 2e-05, |
|
"loss": 0.5104, |
|
"step": 45594 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.6421945924610223, |
|
"eval_loss": 1.287538766860962, |
|
"eval_runtime": 470.0202, |
|
"eval_samples_per_second": 10.78, |
|
"eval_steps_per_second": 1.349, |
|
"step": 45594 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"learning_rate": 1.8333333333333333e-05, |
|
"loss": 0.4777, |
|
"step": 48127 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.6573909611209788, |
|
"eval_loss": 1.1871315240859985, |
|
"eval_runtime": 471.7135, |
|
"eval_samples_per_second": 10.742, |
|
"eval_steps_per_second": 1.344, |
|
"step": 48127 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"learning_rate": 1.6666666666666667e-05, |
|
"loss": 0.447, |
|
"step": 50660 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.6566015393724097, |
|
"eval_loss": 1.2442570924758911, |
|
"eval_runtime": 467.1299, |
|
"eval_samples_per_second": 10.847, |
|
"eval_steps_per_second": 1.357, |
|
"step": 50660 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"learning_rate": 1.5e-05, |
|
"loss": 0.4179, |
|
"step": 53193 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 0.6603512926781133, |
|
"eval_loss": 1.2222002744674683, |
|
"eval_runtime": 467.1803, |
|
"eval_samples_per_second": 10.846, |
|
"eval_steps_per_second": 1.357, |
|
"step": 53193 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"learning_rate": 1.3333333333333333e-05, |
|
"loss": 0.3939, |
|
"step": 55726 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.6400236826524571, |
|
"eval_loss": 1.2755681276321411, |
|
"eval_runtime": 466.7893, |
|
"eval_samples_per_second": 10.855, |
|
"eval_steps_per_second": 1.358, |
|
"step": 55726 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"learning_rate": 1.1666666666666668e-05, |
|
"loss": 0.3695, |
|
"step": 58259 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 0.656798894809552, |
|
"eval_loss": 1.1457221508026123, |
|
"eval_runtime": 468.5285, |
|
"eval_samples_per_second": 10.815, |
|
"eval_steps_per_second": 1.353, |
|
"step": 58259 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"learning_rate": 1e-05, |
|
"loss": 0.348, |
|
"step": 60792 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.6672587329780936, |
|
"eval_loss": 1.144992709159851, |
|
"eval_runtime": 470.6423, |
|
"eval_samples_per_second": 10.766, |
|
"eval_steps_per_second": 1.347, |
|
"step": 60792 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"learning_rate": 8.333333333333334e-06, |
|
"loss": 0.3326, |
|
"step": 63325 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.6644957568581015, |
|
"eval_loss": 1.0921552181243896, |
|
"eval_runtime": 470.5011, |
|
"eval_samples_per_second": 10.769, |
|
"eval_steps_per_second": 1.347, |
|
"step": 63325 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"learning_rate": 6.666666666666667e-06, |
|
"loss": 0.315, |
|
"step": 65858 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.6621274916123939, |
|
"eval_loss": 1.1216638088226318, |
|
"eval_runtime": 454.9608, |
|
"eval_samples_per_second": 11.137, |
|
"eval_steps_per_second": 1.394, |
|
"step": 65858 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"learning_rate": 5e-06, |
|
"loss": 0.2995, |
|
"step": 68391 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_accuracy": 0.6611407144266824, |
|
"eval_loss": 1.0976777076721191, |
|
"eval_runtime": 446.8324, |
|
"eval_samples_per_second": 11.34, |
|
"eval_steps_per_second": 1.419, |
|
"step": 68391 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"learning_rate": 3.3333333333333333e-06, |
|
"loss": 0.2943, |
|
"step": 70924 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.6607460035523979, |
|
"eval_loss": 1.1353331804275513, |
|
"eval_runtime": 452.9025, |
|
"eval_samples_per_second": 11.188, |
|
"eval_steps_per_second": 1.4, |
|
"step": 70924 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"learning_rate": 1.6666666666666667e-06, |
|
"loss": 0.2828, |
|
"step": 73457 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_accuracy": 0.66350897967239, |
|
"eval_loss": 1.0929347276687622, |
|
"eval_runtime": 461.1223, |
|
"eval_samples_per_second": 10.988, |
|
"eval_steps_per_second": 1.375, |
|
"step": 73457 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"learning_rate": 0.0, |
|
"loss": 0.276, |
|
"step": 75990 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_accuracy": 0.6627195579238208, |
|
"eval_loss": 1.0914403200149536, |
|
"eval_runtime": 464.7038, |
|
"eval_samples_per_second": 10.904, |
|
"eval_steps_per_second": 1.364, |
|
"step": 75990 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 75990, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 30, |
|
"save_steps": 500, |
|
"total_flos": 1.2266522779779072e+18, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|