|
{ |
|
"best_metric": 1.164973497390747, |
|
"best_model_checkpoint": "facial_age_image_detection/checkpoint-4800", |
|
"epoch": 20.0, |
|
"eval_steps": 500, |
|
"global_step": 4800, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6013097448929723, |
|
"eval_loss": 1.182183861732483, |
|
"eval_runtime": 106.5296, |
|
"eval_samples_per_second": 96.039, |
|
"eval_steps_per_second": 3.004, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.6016029713615483, |
|
"eval_loss": 1.1812384128570557, |
|
"eval_runtime": 103.6605, |
|
"eval_samples_per_second": 98.697, |
|
"eval_steps_per_second": 3.087, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 2.08, |
|
"grad_norm": 11.414525032043457, |
|
"learning_rate": 4.526315789473684e-07, |
|
"loss": 0.7517, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.5973023164891017, |
|
"eval_loss": 1.1846318244934082, |
|
"eval_runtime": 104.3279, |
|
"eval_samples_per_second": 98.066, |
|
"eval_steps_per_second": 3.067, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.6031668458606196, |
|
"eval_loss": 1.178046464920044, |
|
"eval_runtime": 105.5564, |
|
"eval_samples_per_second": 96.924, |
|
"eval_steps_per_second": 3.032, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 4.17, |
|
"grad_norm": 10.3371000289917, |
|
"learning_rate": 4e-07, |
|
"loss": 0.7404, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.6057081419216108, |
|
"eval_loss": 1.1763097047805786, |
|
"eval_runtime": 104.8017, |
|
"eval_samples_per_second": 97.622, |
|
"eval_steps_per_second": 3.053, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.6061968527025706, |
|
"eval_loss": 1.173648715019226, |
|
"eval_runtime": 104.8949, |
|
"eval_samples_per_second": 97.536, |
|
"eval_steps_per_second": 3.051, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"grad_norm": 11.105679512023926, |
|
"learning_rate": 3.4736842105263157e-07, |
|
"loss": 0.7343, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.6017984556739322, |
|
"eval_loss": 1.175057053565979, |
|
"eval_runtime": 104.1925, |
|
"eval_samples_per_second": 98.193, |
|
"eval_steps_per_second": 3.071, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.6026781350796598, |
|
"eval_loss": 1.1735320091247559, |
|
"eval_runtime": 103.0462, |
|
"eval_samples_per_second": 99.286, |
|
"eval_steps_per_second": 3.105, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"grad_norm": 15.928546905517578, |
|
"learning_rate": 2.947368421052631e-07, |
|
"loss": 0.7275, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.6044374938911152, |
|
"eval_loss": 1.1707645654678345, |
|
"eval_runtime": 103.3329, |
|
"eval_samples_per_second": 99.01, |
|
"eval_steps_per_second": 3.097, |
|
"step": 2160 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.6085426644511778, |
|
"eval_loss": 1.169615387916565, |
|
"eval_runtime": 104.1315, |
|
"eval_samples_per_second": 98.251, |
|
"eval_steps_per_second": 3.073, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 10.42, |
|
"grad_norm": 15.35641098022461, |
|
"learning_rate": 2.4210526315789473e-07, |
|
"loss": 0.7201, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.6064900791711465, |
|
"eval_loss": 1.1700137853622437, |
|
"eval_runtime": 106.578, |
|
"eval_samples_per_second": 95.995, |
|
"eval_steps_per_second": 3.002, |
|
"step": 2640 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.6087381487635617, |
|
"eval_loss": 1.1673282384872437, |
|
"eval_runtime": 102.521, |
|
"eval_samples_per_second": 99.794, |
|
"eval_steps_per_second": 3.121, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"grad_norm": 10.890913963317871, |
|
"learning_rate": 1.8947368421052632e-07, |
|
"loss": 0.7144, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.6035578144853876, |
|
"eval_loss": 1.1682850122451782, |
|
"eval_runtime": 103.3961, |
|
"eval_samples_per_second": 98.95, |
|
"eval_steps_per_second": 3.095, |
|
"step": 3120 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.6070765321082983, |
|
"eval_loss": 1.1674185991287231, |
|
"eval_runtime": 103.2219, |
|
"eval_samples_per_second": 99.117, |
|
"eval_steps_per_second": 3.1, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 14.58, |
|
"grad_norm": 11.558945655822754, |
|
"learning_rate": 1.368421052631579e-07, |
|
"loss": 0.7137, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.6073697585768743, |
|
"eval_loss": 1.1667180061340332, |
|
"eval_runtime": 103.2403, |
|
"eval_samples_per_second": 99.099, |
|
"eval_steps_per_second": 3.1, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.6068810477959143, |
|
"eval_loss": 1.166371464729309, |
|
"eval_runtime": 103.7779, |
|
"eval_samples_per_second": 98.586, |
|
"eval_steps_per_second": 3.084, |
|
"step": 3840 |
|
}, |
|
{ |
|
"epoch": 16.67, |
|
"grad_norm": 15.126260757446289, |
|
"learning_rate": 8.421052631578947e-08, |
|
"loss": 0.7093, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.6044374938911152, |
|
"eval_loss": 1.1674280166625977, |
|
"eval_runtime": 102.8109, |
|
"eval_samples_per_second": 99.513, |
|
"eval_steps_per_second": 3.113, |
|
"step": 4080 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.6042420095787313, |
|
"eval_loss": 1.1664873361587524, |
|
"eval_runtime": 102.8553, |
|
"eval_samples_per_second": 99.47, |
|
"eval_steps_per_second": 3.111, |
|
"step": 4320 |
|
}, |
|
{ |
|
"epoch": 18.75, |
|
"grad_norm": 14.217340469360352, |
|
"learning_rate": 3.157894736842105e-08, |
|
"loss": 0.7035, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.6062945948587626, |
|
"eval_loss": 1.1650714874267578, |
|
"eval_runtime": 103.4609, |
|
"eval_samples_per_second": 98.888, |
|
"eval_steps_per_second": 3.093, |
|
"step": 4560 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.6068810477959143, |
|
"eval_loss": 1.164973497390747, |
|
"eval_runtime": 102.8512, |
|
"eval_samples_per_second": 99.474, |
|
"eval_steps_per_second": 3.111, |
|
"step": 4800 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 4800, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 20, |
|
"save_steps": 500, |
|
"total_flos": 2.3786767829022114e+19, |
|
"train_batch_size": 64, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|