|
{ |
|
"best_metric": 0.018954848870635033, |
|
"best_model_checkpoint": "swinv2-tiny-patch4-window8-256-Kontur-competition-1.3K/checkpoint-52", |
|
"epoch": 12.631578947368421, |
|
"eval_steps": 500, |
|
"global_step": 60, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.84, |
|
"eval_loss": 0.6833776235580444, |
|
"eval_runtime": 3.0114, |
|
"eval_samples_per_second": 44.165, |
|
"eval_steps_per_second": 0.996, |
|
"step": 4 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"eval_loss": 0.4898586869239807, |
|
"eval_runtime": 3.4038, |
|
"eval_samples_per_second": 39.074, |
|
"eval_steps_per_second": 0.881, |
|
"step": 9 |
|
}, |
|
{ |
|
"epoch": 2.11, |
|
"grad_norm": 2.64339280128479, |
|
"learning_rate": 4.62962962962963e-05, |
|
"loss": 0.6773, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 2.95, |
|
"eval_loss": 0.2752000093460083, |
|
"eval_runtime": 2.6262, |
|
"eval_samples_per_second": 50.644, |
|
"eval_steps_per_second": 1.142, |
|
"step": 14 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 0.13112162053585052, |
|
"eval_runtime": 2.6149, |
|
"eval_samples_per_second": 50.862, |
|
"eval_steps_per_second": 1.147, |
|
"step": 19 |
|
}, |
|
{ |
|
"epoch": 4.21, |
|
"grad_norm": 2.5273399353027344, |
|
"learning_rate": 3.7037037037037037e-05, |
|
"loss": 0.3528, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 4.84, |
|
"eval_loss": 0.08120357245206833, |
|
"eval_runtime": 3.1533, |
|
"eval_samples_per_second": 42.178, |
|
"eval_steps_per_second": 0.951, |
|
"step": 23 |
|
}, |
|
{ |
|
"epoch": 5.89, |
|
"eval_loss": 0.04769232124090195, |
|
"eval_runtime": 2.61, |
|
"eval_samples_per_second": 50.958, |
|
"eval_steps_per_second": 1.149, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 6.32, |
|
"grad_norm": 13.101208686828613, |
|
"learning_rate": 2.777777777777778e-05, |
|
"loss": 0.1595, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 6.95, |
|
"eval_loss": 0.028914544731378555, |
|
"eval_runtime": 3.2525, |
|
"eval_samples_per_second": 40.891, |
|
"eval_steps_per_second": 0.922, |
|
"step": 33 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": 0.022866781800985336, |
|
"eval_runtime": 2.636, |
|
"eval_samples_per_second": 50.456, |
|
"eval_steps_per_second": 1.138, |
|
"step": 38 |
|
}, |
|
{ |
|
"epoch": 8.42, |
|
"grad_norm": 7.744855880737305, |
|
"learning_rate": 1.8518518518518518e-05, |
|
"loss": 0.1054, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 8.84, |
|
"eval_loss": 0.02127755992114544, |
|
"eval_runtime": 2.7818, |
|
"eval_samples_per_second": 47.812, |
|
"eval_steps_per_second": 1.078, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 9.89, |
|
"eval_loss": 0.028130069375038147, |
|
"eval_runtime": 3.1605, |
|
"eval_samples_per_second": 42.083, |
|
"eval_steps_per_second": 0.949, |
|
"step": 47 |
|
}, |
|
{ |
|
"epoch": 10.53, |
|
"grad_norm": 4.180393695831299, |
|
"learning_rate": 9.259259259259259e-06, |
|
"loss": 0.0822, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 10.95, |
|
"eval_loss": 0.018954848870635033, |
|
"eval_runtime": 3.079, |
|
"eval_samples_per_second": 43.196, |
|
"eval_steps_per_second": 0.974, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_loss": 0.023994147777557373, |
|
"eval_runtime": 2.9444, |
|
"eval_samples_per_second": 45.17, |
|
"eval_steps_per_second": 1.019, |
|
"step": 57 |
|
}, |
|
{ |
|
"epoch": 12.63, |
|
"grad_norm": 2.7027509212493896, |
|
"learning_rate": 0.0, |
|
"loss": 0.076, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 12.63, |
|
"eval_loss": 0.023665426298975945, |
|
"eval_runtime": 3.0873, |
|
"eval_samples_per_second": 43.079, |
|
"eval_steps_per_second": 0.972, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 12.63, |
|
"step": 60, |
|
"total_flos": 4.9113822316304794e+17, |
|
"train_loss": 0.24218196471532186, |
|
"train_runtime": 426.607, |
|
"train_samples_per_second": 41.982, |
|
"train_steps_per_second": 0.141 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 60, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 15, |
|
"save_steps": 500, |
|
"total_flos": 4.9113822316304794e+17, |
|
"train_batch_size": 64, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|