{ "best_metric": 0.8007936507936508, "best_model_checkpoint": "CP2_HAR_mobilenet_v2_1.4_224/checkpoint-908", "epoch": 29.620253164556964, "eval_steps": 500, "global_step": 1170, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.9873417721518988, "grad_norm": 4.1262431144714355, "learning_rate": 1.6666666666666667e-05, "loss": 2.7851, "step": 39 }, { "epoch": 0.9873417721518988, "eval_accuracy": 0.16428571428571428, "eval_loss": 2.5702319145202637, "eval_runtime": 5.3145, "eval_samples_per_second": 237.087, "eval_steps_per_second": 3.763, "step": 39 }, { "epoch": 2.0, "grad_norm": 4.215778350830078, "learning_rate": 3.376068376068376e-05, "loss": 2.3201, "step": 79 }, { "epoch": 2.0, "eval_accuracy": 0.46190476190476193, "eval_loss": 1.8606162071228027, "eval_runtime": 5.1344, "eval_samples_per_second": 245.404, "eval_steps_per_second": 3.895, "step": 79 }, { "epoch": 2.9873417721518987, "grad_norm": 3.7117207050323486, "learning_rate": 4.995251661918329e-05, "loss": 1.8017, "step": 118 }, { "epoch": 2.9873417721518987, "eval_accuracy": 0.6, "eval_loss": 1.3362585306167603, "eval_runtime": 5.1732, "eval_samples_per_second": 243.562, "eval_steps_per_second": 3.866, "step": 118 }, { "epoch": 4.0, "grad_norm": 4.134876728057861, "learning_rate": 4.8053181386514724e-05, "loss": 1.3925, "step": 158 }, { "epoch": 4.0, "eval_accuracy": 0.6674603174603174, "eval_loss": 1.083453893661499, "eval_runtime": 5.1678, "eval_samples_per_second": 243.819, "eval_steps_per_second": 3.87, "step": 158 }, { "epoch": 4.987341772151899, "grad_norm": 4.160211563110352, "learning_rate": 4.620132953466287e-05, "loss": 1.2488, "step": 197 }, { "epoch": 4.987341772151899, "eval_accuracy": 0.7015873015873015, "eval_loss": 0.9785799384117126, "eval_runtime": 5.3488, "eval_samples_per_second": 235.567, "eval_steps_per_second": 3.739, "step": 197 }, { "epoch": 6.0, "grad_norm": 4.307733058929443, "learning_rate": 4.4301994301994304e-05, "loss": 1.1085, "step": 237 }, { "epoch": 6.0, "eval_accuracy": 0.7261904761904762, "eval_loss": 0.9022073149681091, "eval_runtime": 5.1424, "eval_samples_per_second": 245.02, "eval_steps_per_second": 3.889, "step": 237 }, { "epoch": 6.987341772151899, "grad_norm": 4.160565376281738, "learning_rate": 4.2450142450142457e-05, "loss": 1.0843, "step": 276 }, { "epoch": 6.987341772151899, "eval_accuracy": 0.7214285714285714, "eval_loss": 0.8979443907737732, "eval_runtime": 5.1188, "eval_samples_per_second": 246.15, "eval_steps_per_second": 3.907, "step": 276 }, { "epoch": 8.0, "grad_norm": 4.81905460357666, "learning_rate": 4.0550807217473884e-05, "loss": 0.9888, "step": 316 }, { "epoch": 8.0, "eval_accuracy": 0.7309523809523809, "eval_loss": 0.8573768138885498, "eval_runtime": 5.1282, "eval_samples_per_second": 245.698, "eval_steps_per_second": 3.9, "step": 316 }, { "epoch": 8.987341772151899, "grad_norm": 3.801147222518921, "learning_rate": 3.8698955365622036e-05, "loss": 0.9578, "step": 355 }, { "epoch": 8.987341772151899, "eval_accuracy": 0.7492063492063492, "eval_loss": 0.8365480303764343, "eval_runtime": 5.2155, "eval_samples_per_second": 241.59, "eval_steps_per_second": 3.835, "step": 355 }, { "epoch": 10.0, "grad_norm": 4.457461833953857, "learning_rate": 3.679962013295346e-05, "loss": 0.9056, "step": 395 }, { "epoch": 10.0, "eval_accuracy": 0.7285714285714285, "eval_loss": 0.8673570156097412, "eval_runtime": 5.1408, "eval_samples_per_second": 245.099, "eval_steps_per_second": 3.89, "step": 395 }, { "epoch": 10.987341772151899, "grad_norm": 4.0614914894104, "learning_rate": 3.4947768281101616e-05, "loss": 0.9162, "step": 434 }, { "epoch": 10.987341772151899, "eval_accuracy": 0.7603174603174603, "eval_loss": 0.795954167842865, "eval_runtime": 5.0977, "eval_samples_per_second": 247.17, "eval_steps_per_second": 3.923, "step": 434 }, { "epoch": 12.0, "grad_norm": 4.270706653594971, "learning_rate": 3.304843304843305e-05, "loss": 0.8398, "step": 474 }, { "epoch": 12.0, "eval_accuracy": 0.7404761904761905, "eval_loss": 0.8218683004379272, "eval_runtime": 5.2244, "eval_samples_per_second": 241.174, "eval_steps_per_second": 3.828, "step": 474 }, { "epoch": 12.987341772151899, "grad_norm": 4.428926944732666, "learning_rate": 3.1196581196581195e-05, "loss": 0.8452, "step": 513 }, { "epoch": 12.987341772151899, "eval_accuracy": 0.7714285714285715, "eval_loss": 0.7633056044578552, "eval_runtime": 5.1299, "eval_samples_per_second": 245.618, "eval_steps_per_second": 3.899, "step": 513 }, { "epoch": 14.0, "grad_norm": 4.47945499420166, "learning_rate": 2.9297245963912633e-05, "loss": 0.8082, "step": 553 }, { "epoch": 14.0, "eval_accuracy": 0.7476190476190476, "eval_loss": 0.8107038140296936, "eval_runtime": 5.1173, "eval_samples_per_second": 246.224, "eval_steps_per_second": 3.908, "step": 553 }, { "epoch": 14.987341772151899, "grad_norm": 4.362588405609131, "learning_rate": 2.744539411206078e-05, "loss": 0.8206, "step": 592 }, { "epoch": 14.987341772151899, "eval_accuracy": 0.7634920634920634, "eval_loss": 0.8023912310600281, "eval_runtime": 5.1183, "eval_samples_per_second": 246.177, "eval_steps_per_second": 3.908, "step": 592 }, { "epoch": 16.0, "grad_norm": 4.238908767700195, "learning_rate": 2.5546058879392216e-05, "loss": 0.7715, "step": 632 }, { "epoch": 16.0, "eval_accuracy": 0.7785714285714286, "eval_loss": 0.7276574373245239, "eval_runtime": 5.0688, "eval_samples_per_second": 248.579, "eval_steps_per_second": 3.946, "step": 632 }, { "epoch": 16.9873417721519, "grad_norm": 4.040332794189453, "learning_rate": 2.3694207027540365e-05, "loss": 0.7675, "step": 671 }, { "epoch": 16.9873417721519, "eval_accuracy": 0.7714285714285715, "eval_loss": 0.758399486541748, "eval_runtime": 5.0624, "eval_samples_per_second": 248.896, "eval_steps_per_second": 3.951, "step": 671 }, { "epoch": 18.0, "grad_norm": 5.9856367111206055, "learning_rate": 2.1794871794871795e-05, "loss": 0.7406, "step": 711 }, { "epoch": 18.0, "eval_accuracy": 0.734920634920635, "eval_loss": 0.8578805327415466, "eval_runtime": 5.1475, "eval_samples_per_second": 244.779, "eval_steps_per_second": 3.885, "step": 711 }, { "epoch": 18.9873417721519, "grad_norm": 4.246652126312256, "learning_rate": 1.9943019943019945e-05, "loss": 0.7632, "step": 750 }, { "epoch": 18.9873417721519, "eval_accuracy": 0.7619047619047619, "eval_loss": 0.7650825381278992, "eval_runtime": 5.2577, "eval_samples_per_second": 239.646, "eval_steps_per_second": 3.804, "step": 750 }, { "epoch": 20.0, "grad_norm": 4.661935806274414, "learning_rate": 1.804368471035138e-05, "loss": 0.7064, "step": 790 }, { "epoch": 20.0, "eval_accuracy": 0.7849206349206349, "eval_loss": 0.733094334602356, "eval_runtime": 5.0919, "eval_samples_per_second": 247.453, "eval_steps_per_second": 3.928, "step": 790 }, { "epoch": 20.9873417721519, "grad_norm": 4.025776386260986, "learning_rate": 1.6191832858499524e-05, "loss": 0.7102, "step": 829 }, { "epoch": 20.9873417721519, "eval_accuracy": 0.7801587301587302, "eval_loss": 0.7464848756790161, "eval_runtime": 5.1692, "eval_samples_per_second": 243.75, "eval_steps_per_second": 3.869, "step": 829 }, { "epoch": 22.0, "grad_norm": 5.104211330413818, "learning_rate": 1.4292497625830961e-05, "loss": 0.7034, "step": 869 }, { "epoch": 22.0, "eval_accuracy": 0.7817460317460317, "eval_loss": 0.7262414693832397, "eval_runtime": 5.1545, "eval_samples_per_second": 244.446, "eval_steps_per_second": 3.88, "step": 869 }, { "epoch": 22.9873417721519, "grad_norm": 4.623615264892578, "learning_rate": 1.2440645773979107e-05, "loss": 0.7141, "step": 908 }, { "epoch": 22.9873417721519, "eval_accuracy": 0.8007936507936508, "eval_loss": 0.6805568337440491, "eval_runtime": 5.1455, "eval_samples_per_second": 244.872, "eval_steps_per_second": 3.887, "step": 908 }, { "epoch": 24.0, "grad_norm": 4.392916679382324, "learning_rate": 1.0541310541310543e-05, "loss": 0.6688, "step": 948 }, { "epoch": 24.0, "eval_accuracy": 0.7817460317460317, "eval_loss": 0.7176946997642517, "eval_runtime": 5.1385, "eval_samples_per_second": 245.206, "eval_steps_per_second": 3.892, "step": 948 }, { "epoch": 24.9873417721519, "grad_norm": 4.022359848022461, "learning_rate": 8.68945868945869e-06, "loss": 0.7047, "step": 987 }, { "epoch": 24.9873417721519, "eval_accuracy": 0.7984126984126985, "eval_loss": 0.6904021501541138, "eval_runtime": 5.1085, "eval_samples_per_second": 246.65, "eval_steps_per_second": 3.915, "step": 987 }, { "epoch": 26.0, "grad_norm": 4.436544895172119, "learning_rate": 6.790123456790123e-06, "loss": 0.6788, "step": 1027 }, { "epoch": 26.0, "eval_accuracy": 0.7984126984126985, "eval_loss": 0.7002637386322021, "eval_runtime": 5.0847, "eval_samples_per_second": 247.801, "eval_steps_per_second": 3.933, "step": 1027 }, { "epoch": 26.9873417721519, "grad_norm": 4.585982322692871, "learning_rate": 4.938271604938272e-06, "loss": 0.676, "step": 1066 }, { "epoch": 26.9873417721519, "eval_accuracy": 0.7976190476190477, "eval_loss": 0.6969181895256042, "eval_runtime": 5.1071, "eval_samples_per_second": 246.715, "eval_steps_per_second": 3.916, "step": 1066 }, { "epoch": 28.0, "grad_norm": 3.7966365814208984, "learning_rate": 3.038936372269706e-06, "loss": 0.6589, "step": 1106 }, { "epoch": 28.0, "eval_accuracy": 0.7738095238095238, "eval_loss": 0.7518599033355713, "eval_runtime": 5.2632, "eval_samples_per_second": 239.396, "eval_steps_per_second": 3.8, "step": 1106 }, { "epoch": 28.9873417721519, "grad_norm": 4.134976387023926, "learning_rate": 1.1870845204178538e-06, "loss": 0.684, "step": 1145 }, { "epoch": 28.9873417721519, "eval_accuracy": 0.765079365079365, "eval_loss": 0.7477497458457947, "eval_runtime": 5.0759, "eval_samples_per_second": 248.23, "eval_steps_per_second": 3.94, "step": 1145 }, { "epoch": 29.620253164556964, "grad_norm": 3.8848156929016113, "learning_rate": 0.0, "loss": 0.6432, "step": 1170 }, { "epoch": 29.620253164556964, "eval_accuracy": 0.7888888888888889, "eval_loss": 0.7207361459732056, "eval_runtime": 5.1075, "eval_samples_per_second": 246.695, "eval_steps_per_second": 3.916, "step": 1170 }, { "epoch": 29.620253164556964, "step": 1170, "total_flos": 1.5296340129333903e+18, "train_loss": 0.9841398206531492, "train_runtime": 2406.841, "train_samples_per_second": 125.642, "train_steps_per_second": 0.486 } ], "logging_steps": 500, "max_steps": 1170, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.5296340129333903e+18, "train_batch_size": 64, "trial_name": null, "trial_params": null }