alyzbane's picture
End of training
30ac9c0 verified
{
"best_metric": 0.003647729055956006,
"best_model_checkpoint": "vit-base-patch16-224-finetuned-barkley\\checkpoint-570",
"epoch": 17.0,
"eval_steps": 500,
"global_step": 646,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"train_accuracy": 0.26398026315789475
},
{
"epoch": 1.0,
"grad_norm": 6.455413341522217,
"learning_rate": 2.0914608267470257e-06,
"loss": 1.6093,
"step": 38
},
{
"epoch": 1.0,
"eval_accuracy": 0.4148818501759678,
"eval_error_rate": 0.5851181498240322,
"eval_f1": 0.406583244487493,
"eval_loss": 1.4340049028396606,
"eval_precision": 0.47685010008788203,
"eval_recall": 0.4342105263157895,
"eval_runtime": 80.0768,
"eval_samples_per_second": 1.898,
"eval_steps_per_second": 0.237,
"eval_top1_accuracy": 0.4342105263157895,
"step": 38
},
{
"epoch": 2.0,
"train_accuracy": 0.5095029239766082
},
{
"epoch": 2.0,
"grad_norm": 6.083907127380371,
"learning_rate": 2.365146216752351e-06,
"loss": 1.2908,
"step": 76
},
{
"epoch": 2.0,
"eval_accuracy": 0.6161337355455003,
"eval_error_rate": 0.3838662644544997,
"eval_f1": 0.615989993007031,
"eval_loss": 1.1747227907180786,
"eval_precision": 0.6587479462326463,
"eval_recall": 0.6118421052631579,
"eval_runtime": 62.2988,
"eval_samples_per_second": 2.44,
"eval_steps_per_second": 0.305,
"eval_top1_accuracy": 0.6118421052631579,
"step": 76
},
{
"epoch": 3.0,
"train_accuracy": 0.7017543859649122
},
{
"epoch": 3.0,
"grad_norm": 5.073782444000244,
"learning_rate": 2.8189702123460904e-06,
"loss": 1.0409,
"step": 114
},
{
"epoch": 3.0,
"eval_accuracy": 0.7424685771744596,
"eval_error_rate": 0.2575314228255404,
"eval_f1": 0.7293001164996891,
"eval_loss": 0.9174113869667053,
"eval_precision": 0.7381704260651629,
"eval_recall": 0.7302631578947368,
"eval_runtime": 63.0328,
"eval_samples_per_second": 2.411,
"eval_steps_per_second": 0.301,
"eval_top1_accuracy": 0.7302631578947368,
"step": 114
},
{
"epoch": 4.0,
"train_accuracy": 0.8172514619883041
},
{
"epoch": 4.0,
"grad_norm": 4.503601551055908,
"learning_rate": 3.449473887042014e-06,
"loss": 0.781,
"step": 152
},
{
"epoch": 4.0,
"eval_accuracy": 0.8650025138260432,
"eval_error_rate": 0.1349974861739568,
"eval_f1": 0.862176726467179,
"eval_loss": 0.6527765989303589,
"eval_precision": 0.8632378661708033,
"eval_recall": 0.8618421052631579,
"eval_runtime": 64.1793,
"eval_samples_per_second": 2.368,
"eval_steps_per_second": 0.296,
"eval_top1_accuracy": 0.8618421052631579,
"step": 152
},
{
"epoch": 5.0,
"train_accuracy": 0.9027777777777778
},
{
"epoch": 5.0,
"grad_norm": 3.8262150287628174,
"learning_rate": 4.251851708560589e-06,
"loss": 0.5429,
"step": 190
},
{
"epoch": 5.0,
"eval_accuracy": 0.9442885872297637,
"eval_error_rate": 0.05571141277023628,
"eval_f1": 0.9404774954713644,
"eval_loss": 0.41116613149642944,
"eval_precision": 0.9416901233513075,
"eval_recall": 0.9407894736842105,
"eval_runtime": 64.0989,
"eval_samples_per_second": 2.371,
"eval_steps_per_second": 0.296,
"eval_top1_accuracy": 0.9407894736842105,
"step": 190
},
{
"epoch": 6.0,
"train_accuracy": 0.9568713450292398
},
{
"epoch": 6.0,
"grad_norm": 2.5020029544830322,
"learning_rate": 5.219988165325166e-06,
"loss": 0.328,
"step": 228
},
{
"epoch": 6.0,
"eval_accuracy": 0.981111111111111,
"eval_error_rate": 0.018888888888888955,
"eval_f1": 0.980233547031901,
"eval_loss": 0.22286705672740936,
"eval_precision": 0.9808624413887572,
"eval_recall": 0.9802631578947368,
"eval_runtime": 65.9742,
"eval_samples_per_second": 2.304,
"eval_steps_per_second": 0.288,
"eval_top1_accuracy": 0.9802631578947368,
"step": 228
},
{
"epoch": 7.0,
"train_accuracy": 0.9707602339181286
},
{
"epoch": 7.0,
"grad_norm": 3.700869560241699,
"learning_rate": 6.346504377274108e-06,
"loss": 0.1837,
"step": 266
},
{
"epoch": 7.0,
"eval_accuracy": 0.9877777777777779,
"eval_error_rate": 0.012222222222222134,
"eval_f1": 0.9868484170131115,
"eval_loss": 0.11809363961219788,
"eval_precision": 0.9870857699805068,
"eval_recall": 0.9868421052631579,
"eval_runtime": 64.4539,
"eval_samples_per_second": 2.358,
"eval_steps_per_second": 0.295,
"eval_top1_accuracy": 0.9868421052631579,
"step": 266
},
{
"epoch": 8.0,
"train_accuracy": 0.9766081871345029
},
{
"epoch": 8.0,
"grad_norm": 1.4798824787139893,
"learning_rate": 7.622814335733349e-06,
"loss": 0.1131,
"step": 304
},
{
"epoch": 8.0,
"eval_accuracy": 0.9944444444444445,
"eval_error_rate": 0.005555555555555536,
"eval_f1": 0.99343678755752,
"eval_loss": 0.06803914159536362,
"eval_precision": 0.9936647173489279,
"eval_recall": 0.993421052631579,
"eval_runtime": 66.8397,
"eval_samples_per_second": 2.274,
"eval_steps_per_second": 0.284,
"eval_top1_accuracy": 0.993421052631579,
"step": 304
},
{
"epoch": 9.0,
"train_accuracy": 0.9912280701754386
},
{
"epoch": 9.0,
"grad_norm": 0.24450232088565826,
"learning_rate": 9.039190343704055e-06,
"loss": 0.0526,
"step": 342
},
{
"epoch": 9.0,
"eval_accuracy": 0.9944444444444445,
"eval_error_rate": 0.005555555555555536,
"eval_f1": 0.99343678755752,
"eval_loss": 0.0387217253446579,
"eval_precision": 0.9936647173489279,
"eval_recall": 0.993421052631579,
"eval_runtime": 62.2983,
"eval_samples_per_second": 2.44,
"eval_steps_per_second": 0.305,
"eval_top1_accuracy": 0.993421052631579,
"step": 342
},
{
"epoch": 10.0,
"train_accuracy": 0.9948830409356725
},
{
"epoch": 10.0,
"grad_norm": 0.18834975361824036,
"learning_rate": 1.0584837157796744e-05,
"loss": 0.0283,
"step": 380
},
{
"epoch": 10.0,
"eval_accuracy": 0.9877777777777779,
"eval_error_rate": 0.012222222222222134,
"eval_f1": 0.9868641519390525,
"eval_loss": 0.032834384590387344,
"eval_precision": 0.9873294346978557,
"eval_recall": 0.9868421052631579,
"eval_runtime": 65.4882,
"eval_samples_per_second": 2.321,
"eval_steps_per_second": 0.29,
"eval_top1_accuracy": 0.9868421052631579,
"step": 380
},
{
"epoch": 11.0,
"train_accuracy": 0.9956140350877193
},
{
"epoch": 11.0,
"grad_norm": 0.2787030041217804,
"learning_rate": 1.2247974266721769e-05,
"loss": 0.019,
"step": 418
},
{
"epoch": 11.0,
"eval_accuracy": 0.9888888888888889,
"eval_error_rate": 0.011111111111111072,
"eval_f1": 0.9867701266776593,
"eval_loss": 0.0223978441208601,
"eval_precision": 0.9872979940891655,
"eval_recall": 0.9868421052631579,
"eval_runtime": 66.7371,
"eval_samples_per_second": 2.278,
"eval_steps_per_second": 0.285,
"eval_top1_accuracy": 0.9868421052631579,
"step": 418
},
{
"epoch": 12.0,
"train_accuracy": 0.9963450292397661
},
{
"epoch": 12.0,
"grad_norm": 1.9764137268066406,
"learning_rate": 1.401592567923113e-05,
"loss": 0.0148,
"step": 456
},
{
"epoch": 12.0,
"eval_accuracy": 0.9888888888888889,
"eval_error_rate": 0.011111111111111072,
"eval_f1": 0.9867701266776593,
"eval_loss": 0.02013457380235195,
"eval_precision": 0.9872979940891655,
"eval_recall": 0.9868421052631579,
"eval_runtime": 62.9372,
"eval_samples_per_second": 2.415,
"eval_steps_per_second": 0.302,
"eval_top1_accuracy": 0.9868421052631579,
"step": 456
},
{
"epoch": 13.0,
"train_accuracy": 0.9963450292397661
},
{
"epoch": 13.0,
"grad_norm": 0.050672873854637146,
"learning_rate": 1.5875216537171772e-05,
"loss": 0.0095,
"step": 494
},
{
"epoch": 13.0,
"eval_accuracy": 0.9877777777777779,
"eval_error_rate": 0.012222222222222134,
"eval_f1": 0.9868484170131115,
"eval_loss": 0.03958281874656677,
"eval_precision": 0.9870857699805068,
"eval_recall": 0.9868421052631579,
"eval_runtime": 63.5973,
"eval_samples_per_second": 2.39,
"eval_steps_per_second": 0.299,
"eval_top1_accuracy": 0.9868421052631579,
"step": 494
},
{
"epoch": 14.0,
"train_accuracy": 0.9978070175438597
},
{
"epoch": 14.0,
"grad_norm": 0.06194866821169853,
"learning_rate": 1.7811675817291163e-05,
"loss": 0.007,
"step": 532
},
{
"epoch": 14.0,
"eval_accuracy": 1.0,
"eval_error_rate": 0.0,
"eval_f1": 1.0,
"eval_loss": 0.0047844694927334785,
"eval_precision": 1.0,
"eval_recall": 1.0,
"eval_runtime": 63.8972,
"eval_samples_per_second": 2.379,
"eval_steps_per_second": 0.297,
"eval_top1_accuracy": 1.0,
"step": 532
},
{
"epoch": 15.0,
"train_accuracy": 0.9956140350877193
},
{
"epoch": 15.0,
"grad_norm": 0.3071841597557068,
"learning_rate": 1.9810544339029155e-05,
"loss": 0.011,
"step": 570
},
{
"epoch": 15.0,
"eval_accuracy": 1.0,
"eval_error_rate": 0.0,
"eval_f1": 1.0,
"eval_loss": 0.003647729055956006,
"eval_precision": 1.0,
"eval_recall": 1.0,
"eval_runtime": 65.5965,
"eval_samples_per_second": 2.317,
"eval_steps_per_second": 0.29,
"eval_top1_accuracy": 1.0,
"step": 570
},
{
"epoch": 16.0,
"train_accuracy": 0.9978070175438597
},
{
"epoch": 16.0,
"grad_norm": 0.05617503821849823,
"learning_rate": 2.1856587255089357e-05,
"loss": 0.0071,
"step": 608
},
{
"epoch": 16.0,
"eval_accuracy": 0.9941176470588236,
"eval_error_rate": 0.00588235294117645,
"eval_f1": 0.9934170172927719,
"eval_loss": 0.009170782752335072,
"eval_precision": 0.9935988620199147,
"eval_recall": 0.993421052631579,
"eval_runtime": 66.4048,
"eval_samples_per_second": 2.289,
"eval_steps_per_second": 0.286,
"eval_top1_accuracy": 0.993421052631579,
"step": 608
},
{
"epoch": 17.0,
"train_accuracy": 0.9963450292397661
},
{
"epoch": 17.0,
"grad_norm": 0.02715430036187172,
"learning_rate": 2.393421016741653e-05,
"loss": 0.0103,
"step": 646
},
{
"epoch": 17.0,
"eval_accuracy": 0.9944444444444445,
"eval_error_rate": 0.005555555555555536,
"eval_f1": 0.9934286478144102,
"eval_loss": 0.014811488799750805,
"eval_precision": 0.9936332767402377,
"eval_recall": 0.993421052631579,
"eval_runtime": 64.9042,
"eval_samples_per_second": 2.342,
"eval_steps_per_second": 0.293,
"eval_top1_accuracy": 0.993421052631579,
"step": 646
},
{
"epoch": 17.0,
"step": 646,
"total_flos": 1.601957481669329e+18,
"train_loss": 0.3558414801263219,
"train_runtime": 14288.2591,
"train_samples_per_second": 2.553,
"train_steps_per_second": 0.08
}
],
"logging_steps": 10,
"max_steps": 1140,
"num_input_tokens_seen": 0,
"num_train_epochs": 30,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 2,
"early_stopping_threshold": 0.0
},
"attributes": {
"early_stopping_patience_counter": 0
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.601957481669329e+18,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}