{"current_steps": 5, "total_steps": 3882, "loss": 3.0388, "lr": 2.564102564102564e-06, "epoch": 0.0025753283543651817, "percentage": 0.13, "elapsed_time": "0:02:49", "remaining_time": "1 day, 12:31:05", "throughput": 345.02, "total_tokens": 58496} {"current_steps": 10, "total_steps": 3882, "loss": 2.9831, "lr": 5.128205128205128e-06, "epoch": 0.0051506567087303634, "percentage": 0.26, "elapsed_time": "0:04:19", "remaining_time": "1 day, 3:52:53", "throughput": 451.18, "total_tokens": 116960} {"current_steps": 15, "total_steps": 3882, "loss": 2.8696, "lr": 7.692307692307694e-06, "epoch": 0.007725985063095545, "percentage": 0.39, "elapsed_time": "0:05:47", "remaining_time": "1 day, 0:54:38", "throughput": 504.36, "total_tokens": 175448} {"current_steps": 20, "total_steps": 3882, "loss": 2.6316, "lr": 1.0256410256410256e-05, "epoch": 0.010301313417460727, "percentage": 0.52, "elapsed_time": "0:07:17", "remaining_time": "23:26:52", "throughput": 535.17, "total_tokens": 233944} {"current_steps": 25, "total_steps": 3882, "loss": 1.9707, "lr": 1.282051282051282e-05, "epoch": 0.012876641771825908, "percentage": 0.64, "elapsed_time": "0:08:45", "remaining_time": "22:30:52", "throughput": 556.6, "total_tokens": 292416} {"current_steps": 30, "total_steps": 3882, "loss": 1.3782, "lr": 1.5384615384615387e-05, "epoch": 0.01545197012619109, "percentage": 0.77, "elapsed_time": "0:10:14", "remaining_time": "21:55:33", "throughput": 570.81, "total_tokens": 350904} {"current_steps": 35, "total_steps": 3882, "loss": 1.0628, "lr": 1.794871794871795e-05, "epoch": 0.018027298480556272, "percentage": 0.9, "elapsed_time": "0:11:42", "remaining_time": "21:27:25", "throughput": 582.52, "total_tokens": 409384} {"current_steps": 40, "total_steps": 3882, "loss": 0.9789, "lr": 2.0512820512820512e-05, "epoch": 0.020602626834921454, "percentage": 1.03, "elapsed_time": "0:13:11", "remaining_time": "21:07:29", "throughput": 590.91, "total_tokens": 467864} {"current_steps": 45, "total_steps": 3882, "loss": 0.9327, "lr": 2.307692307692308e-05, "epoch": 0.023177955189286635, "percentage": 1.16, "elapsed_time": "0:14:39", "remaining_time": "20:50:06", "throughput": 598.39, "total_tokens": 526384} {"current_steps": 50, "total_steps": 3882, "loss": 0.9233, "lr": 2.564102564102564e-05, "epoch": 0.025753283543651816, "percentage": 1.29, "elapsed_time": "0:16:09", "remaining_time": "20:38:40", "throughput": 603.11, "total_tokens": 584856} {"current_steps": 50, "total_steps": 3882, "eval_loss": 0.9281821846961975, "epoch": 0.025753283543651816, "percentage": 1.29, "elapsed_time": "0:16:57", "remaining_time": "21:40:17", "throughput": 574.53, "total_tokens": 584856} {"current_steps": 55, "total_steps": 3882, "loss": 0.897, "lr": 2.8205128205128207e-05, "epoch": 0.028328611898016998, "percentage": 1.42, "elapsed_time": "0:18:34", "remaining_time": "21:32:15", "throughput": 577.35, "total_tokens": 643344} {"current_steps": 60, "total_steps": 3882, "loss": 0.9169, "lr": 3.0769230769230774e-05, "epoch": 0.03090394025238218, "percentage": 1.55, "elapsed_time": "0:20:03", "remaining_time": "21:17:49", "throughput": 583.09, "total_tokens": 701808} {"current_steps": 65, "total_steps": 3882, "loss": 0.9019, "lr": 3.3333333333333335e-05, "epoch": 0.03347926860674736, "percentage": 1.67, "elapsed_time": "0:21:32", "remaining_time": "21:04:47", "throughput": 588.34, "total_tokens": 760304} {"current_steps": 70, "total_steps": 3882, "loss": 0.8996, "lr": 3.58974358974359e-05, "epoch": 0.036054596961112545, "percentage": 1.8, "elapsed_time": "0:23:02", "remaining_time": "20:55:11", "throughput": 592.04, "total_tokens": 818760} {"current_steps": 75, "total_steps": 3882, "loss": 0.9073, "lr": 3.846153846153846e-05, "epoch": 0.03862992531547772, "percentage": 1.93, "elapsed_time": "0:24:32", "remaining_time": "20:46:08", "throughput": 595.56, "total_tokens": 877256} {"current_steps": 80, "total_steps": 3882, "loss": 0.9081, "lr": 4.1025641025641023e-05, "epoch": 0.04120525366984291, "percentage": 2.06, "elapsed_time": "0:26:03", "remaining_time": "20:38:41", "throughput": 598.36, "total_tokens": 935752} {"current_steps": 85, "total_steps": 3882, "loss": 0.906, "lr": 4.358974358974359e-05, "epoch": 0.043780582024208085, "percentage": 2.19, "elapsed_time": "0:27:32", "remaining_time": "20:30:19", "throughput": 601.63, "total_tokens": 994216} {"current_steps": 90, "total_steps": 3882, "loss": 0.8952, "lr": 4.615384615384616e-05, "epoch": 0.04635591037857327, "percentage": 2.32, "elapsed_time": "0:29:02", "remaining_time": "20:23:48", "throughput": 604.04, "total_tokens": 1052704} {"current_steps": 95, "total_steps": 3882, "loss": 0.8996, "lr": 4.871794871794872e-05, "epoch": 0.04893123873293845, "percentage": 2.45, "elapsed_time": "0:30:31", "remaining_time": "20:17:00", "throughput": 606.61, "total_tokens": 1111176} {"current_steps": 100, "total_steps": 3882, "loss": 0.9024, "lr": 5.128205128205128e-05, "epoch": 0.05150656708730363, "percentage": 2.58, "elapsed_time": "0:32:01", "remaining_time": "20:10:52", "throughput": 608.88, "total_tokens": 1169664} {"current_steps": 100, "total_steps": 3882, "eval_loss": 0.911374032497406, "epoch": 0.05150656708730363, "percentage": 2.58, "elapsed_time": "0:32:20", "remaining_time": "20:23:12", "throughput": 602.74, "total_tokens": 1169664}