Qwen1.5-Capybara-0.5B-Chat / trainer_log.jsonl
markab's picture
Upload folder using huggingface_hub
7609f00 verified
{"current_steps": 10, "total_steps": 1000, "loss": 1.6821, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.998766400914329e-05, "epoch": 0.01, "percentage": 1.0, "elapsed_time": "0:00:21", "remaining_time": "0:34:50"}
{"current_steps": 20, "total_steps": 1000, "loss": 1.7047, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.995066821070679e-05, "epoch": 0.02, "percentage": 2.0, "elapsed_time": "0:00:42", "remaining_time": "0:34:34"}
{"current_steps": 30, "total_steps": 1000, "loss": 1.5966, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9889049115077005e-05, "epoch": 0.03, "percentage": 3.0, "elapsed_time": "0:01:03", "remaining_time": "0:34:15"}
{"current_steps": 40, "total_steps": 1000, "loss": 1.6008, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.980286753286195e-05, "epoch": 0.04, "percentage": 4.0, "elapsed_time": "0:01:25", "remaining_time": "0:34:09"}
{"current_steps": 50, "total_steps": 1000, "loss": 1.6592, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9692208514878444e-05, "epoch": 0.05, "percentage": 5.0, "elapsed_time": "0:01:46", "remaining_time": "0:33:49"}
{"current_steps": 60, "total_steps": 1000, "loss": 1.7166, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9557181268217227e-05, "epoch": 0.06, "percentage": 6.0, "elapsed_time": "0:02:08", "remaining_time": "0:33:33"}
{"current_steps": 70, "total_steps": 1000, "loss": 1.6112, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.939791904846869e-05, "epoch": 0.07, "percentage": 7.0, "elapsed_time": "0:02:29", "remaining_time": "0:33:10"}
{"current_steps": 80, "total_steps": 1000, "loss": 1.575, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9214579028215776e-05, "epoch": 0.08, "percentage": 8.0, "elapsed_time": "0:02:51", "remaining_time": "0:32:53"}
{"current_steps": 90, "total_steps": 1000, "loss": 1.6309, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.900734214192358e-05, "epoch": 0.09, "percentage": 9.0, "elapsed_time": "0:03:12", "remaining_time": "0:32:29"}
{"current_steps": 100, "total_steps": 1000, "loss": 1.6733, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.877641290737884e-05, "epoch": 0.1, "percentage": 10.0, "elapsed_time": "0:03:34", "remaining_time": "0:32:09"}
{"current_steps": 110, "total_steps": 1000, "loss": 1.5773, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.852201922385564e-05, "epoch": 0.11, "percentage": 11.0, "elapsed_time": "0:03:55", "remaining_time": "0:31:47"}
{"current_steps": 120, "total_steps": 1000, "loss": 1.5916, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.8244412147206284e-05, "epoch": 0.12, "percentage": 12.0, "elapsed_time": "0:04:17", "remaining_time": "0:31:24"}
{"current_steps": 130, "total_steps": 1000, "loss": 1.6133, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.794386564209953e-05, "epoch": 0.13, "percentage": 13.0, "elapsed_time": "0:04:38", "remaining_time": "0:31:02"}
{"current_steps": 140, "total_steps": 1000, "loss": 1.5403, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.762067631165049e-05, "epoch": 0.14, "percentage": 14.0, "elapsed_time": "0:05:00", "remaining_time": "0:30:43"}
{"current_steps": 150, "total_steps": 1000, "loss": 1.5969, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.72751631047092e-05, "epoch": 0.15, "percentage": 15.0, "elapsed_time": "0:05:22", "remaining_time": "0:30:25"}
{"current_steps": 160, "total_steps": 1000, "loss": 1.6164, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.690766700109659e-05, "epoch": 0.16, "percentage": 16.0, "elapsed_time": "0:05:44", "remaining_time": "0:30:06"}
{"current_steps": 170, "total_steps": 1000, "loss": 1.6303, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.65185506750986e-05, "epoch": 0.17, "percentage": 17.0, "elapsed_time": "0:06:05", "remaining_time": "0:29:46"}
{"current_steps": 180, "total_steps": 1000, "loss": 1.5334, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.610819813755038e-05, "epoch": 0.18, "percentage": 18.0, "elapsed_time": "0:06:27", "remaining_time": "0:29:27"}
{"current_steps": 190, "total_steps": 1000, "loss": 1.5435, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.567701435686404e-05, "epoch": 0.19, "percentage": 19.0, "elapsed_time": "0:06:49", "remaining_time": "0:29:05"}
{"current_steps": 200, "total_steps": 1000, "loss": 1.5958, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.522542485937369e-05, "epoch": 0.2, "percentage": 20.0, "elapsed_time": "0:07:11", "remaining_time": "0:28:44"}
{"current_steps": 210, "total_steps": 1000, "loss": 1.6114, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.4753875309392266e-05, "epoch": 0.21, "percentage": 21.0, "elapsed_time": "0:07:33", "remaining_time": "0:28:25"}
{"current_steps": 220, "total_steps": 1000, "loss": 1.5988, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.426283106939474e-05, "epoch": 0.22, "percentage": 22.0, "elapsed_time": "0:07:54", "remaining_time": "0:28:02"}
{"current_steps": 230, "total_steps": 1000, "loss": 1.5951, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.375277674076149e-05, "epoch": 0.23, "percentage": 23.0, "elapsed_time": "0:08:16", "remaining_time": "0:27:42"}
{"current_steps": 240, "total_steps": 1000, "loss": 1.5952, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.3224215685535294e-05, "epoch": 0.24, "percentage": 24.0, "elapsed_time": "0:08:37", "remaining_time": "0:27:18"}
{"current_steps": 250, "total_steps": 1000, "loss": 1.5654, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.267766952966369e-05, "epoch": 0.25, "percentage": 25.0, "elapsed_time": "0:08:59", "remaining_time": "0:26:57"}
{"current_steps": 260, "total_steps": 1000, "loss": 1.6435, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.211367764821722e-05, "epoch": 0.26, "percentage": 26.0, "elapsed_time": "0:09:20", "remaining_time": "0:26:35"}
{"current_steps": 270, "total_steps": 1000, "loss": 1.6034, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.1532796633091296e-05, "epoch": 0.27, "percentage": 27.0, "elapsed_time": "0:09:42", "remaining_time": "0:26:14"}
{"current_steps": 280, "total_steps": 1000, "loss": 1.5224, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.093559974371725e-05, "epoch": 0.28, "percentage": 28.0, "elapsed_time": "0:10:03", "remaining_time": "0:25:51"}
{"current_steps": 290, "total_steps": 1000, "loss": 1.5068, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.0322676341324415e-05, "epoch": 0.29, "percentage": 29.0, "elapsed_time": "0:10:25", "remaining_time": "0:25:30"}
{"current_steps": 300, "total_steps": 1000, "loss": 1.5696, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.969463130731183e-05, "epoch": 0.3, "percentage": 30.0, "elapsed_time": "0:10:46", "remaining_time": "0:25:09"}
{"current_steps": 310, "total_steps": 1000, "loss": 1.6044, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.905208444630327e-05, "epoch": 0.31, "percentage": 31.0, "elapsed_time": "0:11:08", "remaining_time": "0:24:48"}
{"current_steps": 320, "total_steps": 1000, "loss": 1.5515, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.8395669874474915e-05, "epoch": 0.32, "percentage": 32.0, "elapsed_time": "0:11:30", "remaining_time": "0:24:27"}
{"current_steps": 330, "total_steps": 1000, "loss": 1.5805, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.7726035393759285e-05, "epoch": 0.33, "percentage": 33.0, "elapsed_time": "0:11:52", "remaining_time": "0:24:06"}
{"current_steps": 340, "total_steps": 1000, "loss": 1.5119, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.704384185254288e-05, "epoch": 0.34, "percentage": 34.0, "elapsed_time": "0:12:14", "remaining_time": "0:23:45"}
{"current_steps": 350, "total_steps": 1000, "loss": 1.5301, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.634976249348867e-05, "epoch": 0.35, "percentage": 35.0, "elapsed_time": "0:12:36", "remaining_time": "0:23:24"}
{"current_steps": 360, "total_steps": 1000, "loss": 1.5822, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.564448228912682e-05, "epoch": 0.36, "percentage": 36.0, "elapsed_time": "0:12:57", "remaining_time": "0:23:02"}
{"current_steps": 370, "total_steps": 1000, "loss": 1.6206, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4928697265869515e-05, "epoch": 0.37, "percentage": 37.0, "elapsed_time": "0:13:18", "remaining_time": "0:22:40"}
{"current_steps": 380, "total_steps": 1000, "loss": 1.7065, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4203113817116957e-05, "epoch": 0.38, "percentage": 38.0, "elapsed_time": "0:13:40", "remaining_time": "0:22:19"}
{"current_steps": 390, "total_steps": 1000, "loss": 1.64, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.346844800613229e-05, "epoch": 0.39, "percentage": 39.0, "elapsed_time": "0:14:02", "remaining_time": "0:21:58"}
{"current_steps": 400, "total_steps": 1000, "loss": 1.5591, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.272542485937369e-05, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "0:14:24", "remaining_time": "0:21:36"}
{"current_steps": 410, "total_steps": 1000, "loss": 1.5759, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.1974777650980735e-05, "epoch": 0.41, "percentage": 41.0, "elapsed_time": "0:14:46", "remaining_time": "0:21:15"}
{"current_steps": 420, "total_steps": 1000, "loss": 1.4817, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.121724717912138e-05, "epoch": 0.42, "percentage": 42.0, "elapsed_time": "0:15:08", "remaining_time": "0:20:54"}
{"current_steps": 430, "total_steps": 1000, "loss": 1.65, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.045358103491357e-05, "epoch": 0.43, "percentage": 43.0, "elapsed_time": "0:15:29", "remaining_time": "0:20:32"}
{"current_steps": 440, "total_steps": 1000, "loss": 1.4503, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.9684532864643122e-05, "epoch": 0.44, "percentage": 44.0, "elapsed_time": "0:15:51", "remaining_time": "0:20:10"}
{"current_steps": 450, "total_steps": 1000, "loss": 1.609, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8910861626005776e-05, "epoch": 0.45, "percentage": 45.0, "elapsed_time": "0:16:12", "remaining_time": "0:19:48"}
{"current_steps": 460, "total_steps": 1000, "loss": 1.6128, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8133330839107608e-05, "epoch": 0.46, "percentage": 46.0, "elapsed_time": "0:16:33", "remaining_time": "0:19:26"}
{"current_steps": 470, "total_steps": 1000, "loss": 1.5582, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7352707832962865e-05, "epoch": 0.47, "percentage": 47.0, "elapsed_time": "0:16:55", "remaining_time": "0:19:05"}
{"current_steps": 480, "total_steps": 1000, "loss": 1.5761, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.656976298823284e-05, "epoch": 0.48, "percentage": 48.0, "elapsed_time": "0:17:17", "remaining_time": "0:18:43"}
{"current_steps": 490, "total_steps": 1000, "loss": 1.4935, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.578526897695321e-05, "epoch": 0.49, "percentage": 49.0, "elapsed_time": "0:17:38", "remaining_time": "0:18:21"}
{"current_steps": 500, "total_steps": 1000, "loss": 1.5955, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.5e-05, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "0:18:00", "remaining_time": "0:18:00"}
{"current_steps": 510, "total_steps": 1000, "loss": 1.555, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4214731023046793e-05, "epoch": 0.51, "percentage": 51.0, "elapsed_time": "0:18:22", "remaining_time": "0:17:39"}
{"current_steps": 520, "total_steps": 1000, "loss": 1.5394, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3430237011767167e-05, "epoch": 0.52, "percentage": 52.0, "elapsed_time": "0:18:44", "remaining_time": "0:17:18"}
{"current_steps": 530, "total_steps": 1000, "loss": 1.6694, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2647292167037144e-05, "epoch": 0.53, "percentage": 53.0, "elapsed_time": "0:19:06", "remaining_time": "0:16:56"}
{"current_steps": 540, "total_steps": 1000, "loss": 1.542, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.186666916089239e-05, "epoch": 0.54, "percentage": 54.0, "elapsed_time": "0:19:27", "remaining_time": "0:16:34"}
{"current_steps": 550, "total_steps": 1000, "loss": 1.5596, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.1089138373994223e-05, "epoch": 0.55, "percentage": 55.0, "elapsed_time": "0:19:48", "remaining_time": "0:16:12"}
{"current_steps": 560, "total_steps": 1000, "loss": 1.5421, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.031546713535688e-05, "epoch": 0.56, "percentage": 56.0, "elapsed_time": "0:20:10", "remaining_time": "0:15:51"}
{"current_steps": 570, "total_steps": 1000, "loss": 1.4972, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9546418965086442e-05, "epoch": 0.57, "percentage": 57.0, "elapsed_time": "0:20:32", "remaining_time": "0:15:29"}
{"current_steps": 580, "total_steps": 1000, "loss": 1.5185, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8782752820878634e-05, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "0:20:54", "remaining_time": "0:15:08"}
{"current_steps": 590, "total_steps": 1000, "loss": 1.6447, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.802522234901927e-05, "epoch": 0.59, "percentage": 59.0, "elapsed_time": "0:21:15", "remaining_time": "0:14:46"}
{"current_steps": 600, "total_steps": 1000, "loss": 1.5495, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7274575140626318e-05, "epoch": 0.6, "percentage": 60.0, "elapsed_time": "0:21:37", "remaining_time": "0:14:25"}
{"current_steps": 610, "total_steps": 1000, "loss": 1.5969, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6531551993867717e-05, "epoch": 0.61, "percentage": 61.0, "elapsed_time": "0:21:58", "remaining_time": "0:14:03"}
{"current_steps": 620, "total_steps": 1000, "loss": 1.525, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5796886182883053e-05, "epoch": 0.62, "percentage": 62.0, "elapsed_time": "0:22:20", "remaining_time": "0:13:41"}
{"current_steps": 630, "total_steps": 1000, "loss": 1.5483, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5071302734130489e-05, "epoch": 0.63, "percentage": 63.0, "elapsed_time": "0:22:42", "remaining_time": "0:13:20"}
{"current_steps": 640, "total_steps": 1000, "loss": 1.513, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4355517710873184e-05, "epoch": 0.64, "percentage": 64.0, "elapsed_time": "0:23:04", "remaining_time": "0:12:58"}
{"current_steps": 650, "total_steps": 1000, "loss": 1.6179, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3650237506511331e-05, "epoch": 0.65, "percentage": 65.0, "elapsed_time": "0:23:25", "remaining_time": "0:12:36"}
{"current_steps": 660, "total_steps": 1000, "loss": 1.5573, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2956158147457115e-05, "epoch": 0.66, "percentage": 66.0, "elapsed_time": "0:23:47", "remaining_time": "0:12:15"}
{"current_steps": 670, "total_steps": 1000, "loss": 1.5965, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2273964606240718e-05, "epoch": 0.67, "percentage": 67.0, "elapsed_time": "0:24:08", "remaining_time": "0:11:53"}
{"current_steps": 680, "total_steps": 1000, "loss": 1.5351, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1604330125525079e-05, "epoch": 0.68, "percentage": 68.0, "elapsed_time": "0:24:30", "remaining_time": "0:11:32"}
{"current_steps": 690, "total_steps": 1000, "loss": 1.5327, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0947915553696742e-05, "epoch": 0.69, "percentage": 69.0, "elapsed_time": "0:24:52", "remaining_time": "0:11:10"}
{"current_steps": 700, "total_steps": 1000, "loss": 1.5258, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0305368692688174e-05, "epoch": 0.7, "percentage": 70.0, "elapsed_time": "0:25:13", "remaining_time": "0:10:48"}
{"current_steps": 710, "total_steps": 1000, "loss": 1.4896, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.677323658675594e-06, "epoch": 0.71, "percentage": 71.0, "elapsed_time": "0:25:35", "remaining_time": "0:10:27"}
{"current_steps": 720, "total_steps": 1000, "loss": 1.5334, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.064400256282757e-06, "epoch": 0.72, "percentage": 72.0, "elapsed_time": "0:25:57", "remaining_time": "0:10:05"}
{"current_steps": 730, "total_steps": 1000, "loss": 1.5586, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.467203366908707e-06, "epoch": 0.73, "percentage": 73.0, "elapsed_time": "0:26:18", "remaining_time": "0:09:43"}
{"current_steps": 740, "total_steps": 1000, "loss": 1.5456, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.886322351782783e-06, "epoch": 0.74, "percentage": 74.0, "elapsed_time": "0:26:40", "remaining_time": "0:09:22"}
{"current_steps": 750, "total_steps": 1000, "loss": 1.6154, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.3223304703363135e-06, "epoch": 0.75, "percentage": 75.0, "elapsed_time": "0:27:02", "remaining_time": "0:09:00"}
{"current_steps": 760, "total_steps": 1000, "loss": 1.6238, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.775784314464717e-06, "epoch": 0.76, "percentage": 76.0, "elapsed_time": "0:27:23", "remaining_time": "0:08:38"}
{"current_steps": 770, "total_steps": 1000, "loss": 1.6143, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.247223259238511e-06, "epoch": 0.77, "percentage": 77.0, "elapsed_time": "0:27:44", "remaining_time": "0:08:17"}
{"current_steps": 780, "total_steps": 1000, "loss": 1.5645, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.737168930605272e-06, "epoch": 0.78, "percentage": 78.0, "elapsed_time": "0:28:06", "remaining_time": "0:07:55"}
{"current_steps": 790, "total_steps": 1000, "loss": 1.599, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.24612469060774e-06, "epoch": 0.79, "percentage": 79.0, "elapsed_time": "0:28:28", "remaining_time": "0:07:34"}
{"current_steps": 800, "total_steps": 1000, "loss": 1.5936, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7745751406263165e-06, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "0:28:50", "remaining_time": "0:07:12"}
{"current_steps": 810, "total_steps": 1000, "loss": 1.5839, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.322985643135952e-06, "epoch": 0.81, "percentage": 81.0, "elapsed_time": "0:29:12", "remaining_time": "0:06:51"}
{"current_steps": 820, "total_steps": 1000, "loss": 1.6365, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.891801862449629e-06, "epoch": 0.82, "percentage": 82.0, "elapsed_time": "0:29:33", "remaining_time": "0:06:29"}
{"current_steps": 830, "total_steps": 1000, "loss": 1.6002, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4814493249014116e-06, "epoch": 0.83, "percentage": 83.0, "elapsed_time": "0:29:54", "remaining_time": "0:06:07"}
{"current_steps": 840, "total_steps": 1000, "loss": 1.5553, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.092332998903416e-06, "epoch": 0.84, "percentage": 84.0, "elapsed_time": "0:30:16", "remaining_time": "0:05:46"}
{"current_steps": 850, "total_steps": 1000, "loss": 1.5059, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7248368952908053e-06, "epoch": 0.85, "percentage": 85.0, "elapsed_time": "0:30:38", "remaining_time": "0:05:24"}
{"current_steps": 860, "total_steps": 1000, "loss": 1.5607, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.379323688349516e-06, "epoch": 0.86, "percentage": 86.0, "elapsed_time": "0:31:00", "remaining_time": "0:05:02"}
{"current_steps": 870, "total_steps": 1000, "loss": 1.5616, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0561343579004715e-06, "epoch": 0.87, "percentage": 87.0, "elapsed_time": "0:31:22", "remaining_time": "0:04:41"}
{"current_steps": 880, "total_steps": 1000, "loss": 1.5769, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7555878527937164e-06, "epoch": 0.88, "percentage": 88.0, "elapsed_time": "0:31:43", "remaining_time": "0:04:19"}
{"current_steps": 890, "total_steps": 1000, "loss": 1.5796, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4779807761443636e-06, "epoch": 0.89, "percentage": 89.0, "elapsed_time": "0:32:05", "remaining_time": "0:03:57"}
{"current_steps": 900, "total_steps": 1000, "loss": 1.5477, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2235870926211619e-06, "epoch": 0.9, "percentage": 90.0, "elapsed_time": "0:32:26", "remaining_time": "0:03:36"}
{"current_steps": 910, "total_steps": 1000, "loss": 1.5246, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.926578580764234e-07, "epoch": 0.91, "percentage": 91.0, "elapsed_time": "0:32:48", "remaining_time": "0:03:14"}
{"current_steps": 920, "total_steps": 1000, "loss": 1.5501, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.854209717842231e-07, "epoch": 0.92, "percentage": 92.0, "elapsed_time": "0:33:09", "remaining_time": "0:02:53"}
{"current_steps": 930, "total_steps": 1000, "loss": 1.6663, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.020809515313142e-07, "epoch": 0.93, "percentage": 93.0, "elapsed_time": "0:33:31", "remaining_time": "0:02:31"}
{"current_steps": 940, "total_steps": 1000, "loss": 1.5585, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.4281873178278475e-07, "epoch": 0.94, "percentage": 94.0, "elapsed_time": "0:33:53", "remaining_time": "0:02:09"}
{"current_steps": 950, "total_steps": 1000, "loss": 1.4972, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.077914851215585e-07, "epoch": 0.95, "percentage": 95.0, "elapsed_time": "0:34:15", "remaining_time": "0:01:48"}
{"current_steps": 960, "total_steps": 1000, "loss": 1.5653, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9713246713805588e-07, "epoch": 0.96, "percentage": 96.0, "elapsed_time": "0:34:37", "remaining_time": "0:01:26"}
{"current_steps": 970, "total_steps": 1000, "loss": 1.6213, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.109508849230001e-07, "epoch": 0.97, "percentage": 97.0, "elapsed_time": "0:34:58", "remaining_time": "0:01:04"}
{"current_steps": 980, "total_steps": 1000, "loss": 1.5936, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.9331789293211026e-08, "epoch": 0.98, "percentage": 98.0, "elapsed_time": "0:35:20", "remaining_time": "0:00:43"}
{"current_steps": 990, "total_steps": 1000, "loss": 1.5483, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.233599085671e-08, "epoch": 0.99, "percentage": 99.0, "elapsed_time": "0:35:40", "remaining_time": "0:00:21"}
{"current_steps": 1000, "total_steps": 1000, "loss": 1.5628, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:36:02", "remaining_time": "0:00:00"}
{"current_steps": 1000, "total_steps": 1000, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:36:02", "remaining_time": "0:00:00"}