top_1_ranking_stackexchange / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 2
51b8fe2 verified
{"current_steps": 10, "total_steps": 150, "loss": 0.812, "lr": 5e-06, "epoch": 0.19950124688279303, "percentage": 6.67, "elapsed_time": "0:09:39", "remaining_time": "2:15:07"}
{"current_steps": 20, "total_steps": 150, "loss": 0.6885, "lr": 5e-06, "epoch": 0.39900249376558605, "percentage": 13.33, "elapsed_time": "0:19:13", "remaining_time": "2:04:56"}
{"current_steps": 30, "total_steps": 150, "loss": 0.6424, "lr": 5e-06, "epoch": 0.5985037406483791, "percentage": 20.0, "elapsed_time": "0:28:47", "remaining_time": "1:55:10"}
{"current_steps": 40, "total_steps": 150, "loss": 0.6225, "lr": 5e-06, "epoch": 0.7980049875311721, "percentage": 26.67, "elapsed_time": "0:38:21", "remaining_time": "1:45:29"}
{"current_steps": 50, "total_steps": 150, "loss": 0.6165, "lr": 5e-06, "epoch": 0.9975062344139651, "percentage": 33.33, "elapsed_time": "0:47:56", "remaining_time": "1:35:52"}
{"current_steps": 50, "total_steps": 150, "eval_loss": 0.6011843085289001, "epoch": 0.9975062344139651, "percentage": 33.33, "elapsed_time": "0:48:57", "remaining_time": "1:37:55"}
{"current_steps": 60, "total_steps": 150, "loss": 0.6217, "lr": 5e-06, "epoch": 1.1970074812967582, "percentage": 40.0, "elapsed_time": "0:59:33", "remaining_time": "1:29:20"}
{"current_steps": 70, "total_steps": 150, "loss": 0.555, "lr": 5e-06, "epoch": 1.3965087281795512, "percentage": 46.67, "elapsed_time": "1:09:08", "remaining_time": "1:19:01"}
{"current_steps": 80, "total_steps": 150, "loss": 0.5496, "lr": 5e-06, "epoch": 1.5960099750623442, "percentage": 53.33, "elapsed_time": "1:18:43", "remaining_time": "1:08:52"}
{"current_steps": 90, "total_steps": 150, "loss": 0.5567, "lr": 5e-06, "epoch": 1.7955112219451372, "percentage": 60.0, "elapsed_time": "1:28:17", "remaining_time": "0:58:51"}
{"current_steps": 100, "total_steps": 150, "loss": 0.5416, "lr": 5e-06, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:37:52", "remaining_time": "0:48:56"}
{"current_steps": 100, "total_steps": 150, "eval_loss": 0.5647123456001282, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:39:00", "remaining_time": "0:49:30"}
{"current_steps": 110, "total_steps": 150, "loss": 0.5452, "lr": 5e-06, "epoch": 2.1945137157107233, "percentage": 73.33, "elapsed_time": "1:49:35", "remaining_time": "0:39:51"}
{"current_steps": 120, "total_steps": 150, "loss": 0.4933, "lr": 5e-06, "epoch": 2.3940149625935163, "percentage": 80.0, "elapsed_time": "1:59:09", "remaining_time": "0:29:47"}
{"current_steps": 130, "total_steps": 150, "loss": 0.4865, "lr": 5e-06, "epoch": 2.5935162094763093, "percentage": 86.67, "elapsed_time": "2:08:44", "remaining_time": "0:19:48"}
{"current_steps": 140, "total_steps": 150, "loss": 0.4884, "lr": 5e-06, "epoch": 2.7930174563591024, "percentage": 93.33, "elapsed_time": "2:18:20", "remaining_time": "0:09:52"}
{"current_steps": 150, "total_steps": 150, "loss": 0.4848, "lr": 5e-06, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:27:55", "remaining_time": "0:00:00"}
{"current_steps": 150, "total_steps": 150, "eval_loss": 0.5612708926200867, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:30:03", "remaining_time": "0:00:00"}
{"current_steps": 150, "total_steps": 150, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:31:18", "remaining_time": "0:00:00"}