|
{"current_steps": 10, "total_steps": 1350, "loss": 1.7454, "lr": 7.4074074074074075e-06, "epoch": 0.022222222222222223, "percentage": 0.74, "elapsed_time": "0:00:02", "remaining_time": "0:04:44"} |
|
{"current_steps": 20, "total_steps": 1350, "loss": 1.5071, "lr": 1.4814814814814815e-05, "epoch": 0.044444444444444446, "percentage": 1.48, "elapsed_time": "0:00:03", "remaining_time": "0:04:08"} |
|
{"current_steps": 30, "total_steps": 1350, "loss": 1.6012, "lr": 2.2222222222222223e-05, "epoch": 0.06666666666666667, "percentage": 2.22, "elapsed_time": "0:00:05", "remaining_time": "0:04:02"} |
|
{"current_steps": 40, "total_steps": 1350, "loss": 1.543, "lr": 2.8888888888888888e-05, "epoch": 0.08888888888888889, "percentage": 2.96, "elapsed_time": "0:00:07", "remaining_time": "0:03:55"} |
|
{"current_steps": 50, "total_steps": 1350, "loss": 1.6806, "lr": 3.62962962962963e-05, "epoch": 0.1111111111111111, "percentage": 3.7, "elapsed_time": "0:00:08", "remaining_time": "0:03:49"} |
|
{"current_steps": 60, "total_steps": 1350, "loss": 1.4376, "lr": 4.3703703703703705e-05, "epoch": 0.13333333333333333, "percentage": 4.44, "elapsed_time": "0:00:10", "remaining_time": "0:03:45"} |
|
{"current_steps": 70, "total_steps": 1350, "loss": 1.5629, "lr": 5.111111111111111e-05, "epoch": 0.15555555555555556, "percentage": 5.19, "elapsed_time": "0:00:12", "remaining_time": "0:03:41"} |
|
{"current_steps": 80, "total_steps": 1350, "loss": 1.5502, "lr": 5.851851851851852e-05, "epoch": 0.17777777777777778, "percentage": 5.93, "elapsed_time": "0:00:13", "remaining_time": "0:03:38"} |
|
{"current_steps": 90, "total_steps": 1350, "loss": 1.5744, "lr": 6.592592592592593e-05, "epoch": 0.2, "percentage": 6.67, "elapsed_time": "0:00:15", "remaining_time": "0:03:36"} |
|
{"current_steps": 100, "total_steps": 1350, "loss": 1.4887, "lr": 7.333333333333333e-05, "epoch": 0.2222222222222222, "percentage": 7.41, "elapsed_time": "0:00:17", "remaining_time": "0:03:35"} |
|
{"current_steps": 110, "total_steps": 1350, "loss": 1.4432, "lr": 8.074074074074075e-05, "epoch": 0.24444444444444444, "percentage": 8.15, "elapsed_time": "0:00:18", "remaining_time": "0:03:32"} |
|
{"current_steps": 120, "total_steps": 1350, "loss": 1.7349, "lr": 8.814814814814815e-05, "epoch": 0.26666666666666666, "percentage": 8.89, "elapsed_time": "0:00:20", "remaining_time": "0:03:31"} |
|
{"current_steps": 130, "total_steps": 1350, "loss": 1.8419, "lr": 9.555555555555557e-05, "epoch": 0.28888888888888886, "percentage": 9.63, "elapsed_time": "0:00:22", "remaining_time": "0:03:28"} |
|
{"current_steps": 140, "total_steps": 1350, "loss": 1.7434, "lr": 9.999732574196451e-05, "epoch": 0.3111111111111111, "percentage": 10.37, "elapsed_time": "0:00:23", "remaining_time": "0:03:26"} |
|
{"current_steps": 150, "total_steps": 1350, "loss": 1.7345, "lr": 9.996724362426075e-05, "epoch": 0.3333333333333333, "percentage": 11.11, "elapsed_time": "0:00:25", "remaining_time": "0:03:24"} |
|
{"current_steps": 160, "total_steps": 1350, "loss": 1.6652, "lr": 9.990375674425109e-05, "epoch": 0.35555555555555557, "percentage": 11.85, "elapsed_time": "0:00:27", "remaining_time": "0:03:21"} |
|
{"current_steps": 170, "total_steps": 1350, "loss": 1.6247, "lr": 9.980690754502393e-05, "epoch": 0.37777777777777777, "percentage": 12.59, "elapsed_time": "0:00:28", "remaining_time": "0:03:19"} |
|
{"current_steps": 180, "total_steps": 1350, "loss": 1.9226, "lr": 9.96767607734863e-05, "epoch": 0.4, "percentage": 13.33, "elapsed_time": "0:00:30", "remaining_time": "0:03:17"} |
|
{"current_steps": 190, "total_steps": 1350, "loss": 1.9507, "lr": 9.951340343707852e-05, "epoch": 0.4222222222222222, "percentage": 14.07, "elapsed_time": "0:00:31", "remaining_time": "0:03:15"} |
|
{"current_steps": 200, "total_steps": 1350, "loss": 1.5901, "lr": 9.931694474560686e-05, "epoch": 0.4444444444444444, "percentage": 14.81, "elapsed_time": "0:00:33", "remaining_time": "0:03:13"} |
|
{"current_steps": 210, "total_steps": 1350, "loss": 1.7762, "lr": 9.908751603823301e-05, "epoch": 0.4666666666666667, "percentage": 15.56, "elapsed_time": "0:00:35", "remaining_time": "0:03:11"} |
|
{"current_steps": 220, "total_steps": 1350, "loss": 1.7833, "lr": 9.882527069566965e-05, "epoch": 0.4888888888888889, "percentage": 16.3, "elapsed_time": "0:00:36", "remaining_time": "0:03:09"} |
|
{"current_steps": 230, "total_steps": 1350, "loss": 1.5891, "lr": 9.853038403764021e-05, "epoch": 0.5111111111111111, "percentage": 17.04, "elapsed_time": "0:00:38", "remaining_time": "0:03:06"} |
|
{"current_steps": 240, "total_steps": 1350, "loss": 1.7261, "lr": 9.820305320567192e-05, "epoch": 0.5333333333333333, "percentage": 17.78, "elapsed_time": "0:00:40", "remaining_time": "0:03:08"} |
|
{"current_steps": 250, "total_steps": 1350, "loss": 1.6448, "lr": 9.784349703130007e-05, "epoch": 0.5555555555555556, "percentage": 18.52, "elapsed_time": "0:00:42", "remaining_time": "0:03:06"} |
|
{"current_steps": 260, "total_steps": 1350, "loss": 1.9097, "lr": 9.745195588977192e-05, "epoch": 0.5777777777777777, "percentage": 19.26, "elapsed_time": "0:00:44", "remaining_time": "0:03:04"} |
|
{"current_steps": 270, "total_steps": 1350, "loss": 1.6173, "lr": 9.702869153934782e-05, "epoch": 0.6, "percentage": 20.0, "elapsed_time": "0:00:45", "remaining_time": "0:03:02"} |
|
{"current_steps": 280, "total_steps": 1350, "loss": 1.8324, "lr": 9.657398694630712e-05, "epoch": 0.6222222222222222, "percentage": 20.74, "elapsed_time": "0:00:47", "remaining_time": "0:03:00"} |
|
{"current_steps": 290, "total_steps": 1350, "loss": 1.818, "lr": 9.608814609577585e-05, "epoch": 0.6444444444444445, "percentage": 21.48, "elapsed_time": "0:00:48", "remaining_time": "0:02:58"} |
|
{"current_steps": 300, "total_steps": 1350, "loss": 1.618, "lr": 9.557149378850254e-05, "epoch": 0.6666666666666666, "percentage": 22.22, "elapsed_time": "0:00:50", "remaining_time": "0:02:56"} |
|
{"current_steps": 310, "total_steps": 1350, "loss": 1.6228, "lr": 9.502437542371812e-05, "epoch": 0.6888888888888889, "percentage": 22.96, "elapsed_time": "0:00:52", "remaining_time": "0:02:54"} |
|
{"current_steps": 320, "total_steps": 1350, "loss": 1.7307, "lr": 9.444715676822501e-05, "epoch": 0.7111111111111111, "percentage": 23.7, "elapsed_time": "0:00:53", "remaining_time": "0:02:52"} |
|
{"current_steps": 330, "total_steps": 1350, "loss": 1.7338, "lr": 9.384022371187003e-05, "epoch": 0.7333333333333333, "percentage": 24.44, "elapsed_time": "0:00:55", "remaining_time": "0:02:51"} |
|
{"current_steps": 340, "total_steps": 1350, "loss": 1.4941, "lr": 9.320398200956403e-05, "epoch": 0.7555555555555555, "percentage": 25.19, "elapsed_time": "0:00:57", "remaining_time": "0:02:49"} |
|
{"current_steps": 350, "total_steps": 1350, "loss": 1.9377, "lr": 9.253885701002134e-05, "epoch": 0.7777777777777778, "percentage": 25.93, "elapsed_time": "0:00:58", "remaining_time": "0:02:47"} |
|
{"current_steps": 360, "total_steps": 1350, "loss": 1.5295, "lr": 9.184529337140002e-05, "epoch": 0.8, "percentage": 26.67, "elapsed_time": "0:01:00", "remaining_time": "0:02:45"} |
|
{"current_steps": 370, "total_steps": 1350, "loss": 1.688, "lr": 9.112375476403312e-05, "epoch": 0.8222222222222222, "percentage": 27.41, "elapsed_time": "0:01:01", "remaining_time": "0:02:44"} |
|
{"current_steps": 380, "total_steps": 1350, "loss": 1.7526, "lr": 9.037472356044962e-05, "epoch": 0.8444444444444444, "percentage": 28.15, "elapsed_time": "0:01:04", "remaining_time": "0:02:43"} |
|
{"current_steps": 390, "total_steps": 1350, "loss": 1.5125, "lr": 8.959870051289241e-05, "epoch": 0.8666666666666667, "percentage": 28.89, "elapsed_time": "0:01:06", "remaining_time": "0:02:42"} |
|
{"current_steps": 400, "total_steps": 1350, "loss": 1.6507, "lr": 8.879620441854872e-05, "epoch": 0.8888888888888888, "percentage": 29.63, "elapsed_time": "0:01:07", "remaining_time": "0:02:41"} |
|
{"current_steps": 410, "total_steps": 1350, "loss": 1.6118, "lr": 8.796777177271708e-05, "epoch": 0.9111111111111111, "percentage": 30.37, "elapsed_time": "0:01:09", "remaining_time": "0:02:40"} |
|
{"current_steps": 420, "total_steps": 1350, "loss": 1.6589, "lr": 8.711395641014228e-05, "epoch": 0.9333333333333333, "percentage": 31.11, "elapsed_time": "0:01:11", "remaining_time": "0:02:38"} |
|
{"current_steps": 430, "total_steps": 1350, "loss": 1.6891, "lr": 8.623532913475847e-05, "epoch": 0.9555555555555556, "percentage": 31.85, "elapsed_time": "0:01:13", "remaining_time": "0:02:37"} |
|
{"current_steps": 440, "total_steps": 1350, "loss": 1.5275, "lr": 8.533247733808776e-05, "epoch": 0.9777777777777777, "percentage": 32.59, "elapsed_time": "0:01:15", "remaining_time": "0:02:35"} |
|
{"current_steps": 450, "total_steps": 1350, "loss": 1.7984, "lr": 8.440600460654958e-05, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:01:17", "remaining_time": "0:02:34"} |
|
{"current_steps": 460, "total_steps": 1350, "loss": 0.9174, "lr": 8.345653031794292e-05, "epoch": 1.0222222222222221, "percentage": 34.07, "elapsed_time": "0:01:19", "remaining_time": "0:02:32"} |
|
{"current_steps": 470, "total_steps": 1350, "loss": 1.3878, "lr": 8.248468922737188e-05, "epoch": 1.0444444444444445, "percentage": 34.81, "elapsed_time": "0:01:20", "remaining_time": "0:02:31"} |
|
{"current_steps": 480, "total_steps": 1350, "loss": 1.1277, "lr": 8.149113104289063e-05, "epoch": 1.0666666666666667, "percentage": 35.56, "elapsed_time": "0:01:22", "remaining_time": "0:02:29"} |
|
{"current_steps": 490, "total_steps": 1350, "loss": 1.0124, "lr": 8.047651999115217e-05, "epoch": 1.0888888888888888, "percentage": 36.3, "elapsed_time": "0:01:24", "remaining_time": "0:02:28"} |
|
{"current_steps": 500, "total_steps": 1350, "loss": 1.0102, "lr": 7.944153437335057e-05, "epoch": 1.1111111111111112, "percentage": 37.04, "elapsed_time": "0:01:26", "remaining_time": "0:02:26"} |
|
{"current_steps": 500, "total_steps": 1350, "eval_loss": 1.7722898721694946, "epoch": 1.1111111111111112, "percentage": 37.04, "elapsed_time": "0:01:30", "remaining_time": "0:02:33"} |
|
{"current_steps": 510, "total_steps": 1350, "loss": 1.1386, "lr": 7.838686611175421e-05, "epoch": 1.1333333333333333, "percentage": 37.78, "elapsed_time": "0:01:38", "remaining_time": "0:02:41"} |
|
{"current_steps": 520, "total_steps": 1350, "loss": 1.0376, "lr": 7.73132202871327e-05, "epoch": 1.1555555555555554, "percentage": 38.52, "elapsed_time": "0:01:39", "remaining_time": "0:02:39"} |
|
{"current_steps": 530, "total_steps": 1350, "loss": 1.2585, "lr": 7.6221314667387e-05, "epoch": 1.1777777777777778, "percentage": 39.26, "elapsed_time": "0:01:41", "remaining_time": "0:02:37"} |
|
{"current_steps": 540, "total_steps": 1350, "loss": 1.2203, "lr": 7.511187922769768e-05, "epoch": 1.2, "percentage": 40.0, "elapsed_time": "0:01:43", "remaining_time": "0:02:35"} |
|
{"current_steps": 550, "total_steps": 1350, "loss": 1.1651, "lr": 7.398565566251232e-05, "epoch": 1.2222222222222223, "percentage": 40.74, "elapsed_time": "0:01:45", "remaining_time": "0:02:33"} |
|
{"current_steps": 560, "total_steps": 1350, "loss": 1.1229, "lr": 7.284339688969809e-05, "epoch": 1.2444444444444445, "percentage": 41.48, "elapsed_time": "0:01:47", "remaining_time": "0:02:31"} |
|
{"current_steps": 570, "total_steps": 1350, "loss": 1.1348, "lr": 7.168586654719117e-05, "epoch": 1.2666666666666666, "percentage": 42.22, "elapsed_time": "0:01:48", "remaining_time": "0:02:28"} |
|
{"current_steps": 580, "total_steps": 1350, "loss": 1.1637, "lr": 7.051383848247942e-05, "epoch": 1.2888888888888888, "percentage": 42.96, "elapsed_time": "0:01:50", "remaining_time": "0:02:26"} |
|
{"current_steps": 590, "total_steps": 1350, "loss": 1.0358, "lr": 6.944726507547169e-05, "epoch": 1.3111111111111111, "percentage": 43.7, "elapsed_time": "0:01:52", "remaining_time": "0:02:24"} |
|
{"current_steps": 600, "total_steps": 1350, "loss": 1.0499, "lr": 6.824985757903016e-05, "epoch": 1.3333333333333333, "percentage": 44.44, "elapsed_time": "0:01:53", "remaining_time": "0:02:22"} |
|
{"current_steps": 610, "total_steps": 1350, "loss": 0.9614, "lr": 6.704024944652537e-05, "epoch": 1.3555555555555556, "percentage": 45.19, "elapsed_time": "0:01:55", "remaining_time": "0:02:20"} |
|
{"current_steps": 620, "total_steps": 1350, "loss": 1.2387, "lr": 6.581924934117782e-05, "epoch": 1.3777777777777778, "percentage": 45.93, "elapsed_time": "0:01:57", "remaining_time": "0:02:18"} |
|
{"current_steps": 630, "total_steps": 1350, "loss": 0.9807, "lr": 6.458767354212036e-05, "epoch": 1.4, "percentage": 46.67, "elapsed_time": "0:01:59", "remaining_time": "0:02:16"} |
|
{"current_steps": 640, "total_steps": 1350, "loss": 1.047, "lr": 6.334634539868836e-05, "epoch": 1.4222222222222223, "percentage": 47.41, "elapsed_time": "0:02:00", "remaining_time": "0:02:13"} |
|
{"current_steps": 650, "total_steps": 1350, "loss": 1.1423, "lr": 6.22214975761865e-05, "epoch": 1.4444444444444444, "percentage": 48.15, "elapsed_time": "0:02:02", "remaining_time": "0:02:11"} |
|
{"current_steps": 660, "total_steps": 1350, "loss": 1.1181, "lr": 6.096393120939516e-05, "epoch": 1.4666666666666668, "percentage": 48.89, "elapsed_time": "0:02:03", "remaining_time": "0:02:09"} |
|
{"current_steps": 670, "total_steps": 1350, "loss": 0.8642, "lr": 5.969903509036172e-05, "epoch": 1.488888888888889, "percentage": 49.63, "elapsed_time": "0:02:05", "remaining_time": "0:02:07"} |
|
{"current_steps": 680, "total_steps": 1350, "loss": 0.9609, "lr": 5.842765484416237e-05, "epoch": 1.511111111111111, "percentage": 50.37, "elapsed_time": "0:02:07", "remaining_time": "0:02:05"} |
|
{"current_steps": 690, "total_steps": 1350, "loss": 0.9543, "lr": 5.715064043072771e-05, "epoch": 1.5333333333333332, "percentage": 51.11, "elapsed_time": "0:02:08", "remaining_time": "0:02:03"} |
|
{"current_steps": 700, "total_steps": 1350, "loss": 1.3545, "lr": 5.586884557661638e-05, "epoch": 1.5555555555555556, "percentage": 51.85, "elapsed_time": "0:02:10", "remaining_time": "0:02:01"} |
|
{"current_steps": 710, "total_steps": 1350, "loss": 1.1898, "lr": 5.458312720427037e-05, "epoch": 1.5777777777777777, "percentage": 52.59, "elapsed_time": "0:02:12", "remaining_time": "0:01:59"} |
|
{"current_steps": 720, "total_steps": 1350, "loss": 0.9212, "lr": 5.329434485913393e-05, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "0:02:14", "remaining_time": "0:01:57"} |
|
{"current_steps": 730, "total_steps": 1350, "loss": 1.0051, "lr": 5.200336013501898e-05, "epoch": 1.6222222222222222, "percentage": 54.07, "elapsed_time": "0:02:16", "remaining_time": "0:01:55"} |
|
{"current_steps": 740, "total_steps": 1350, "loss": 0.9947, "lr": 5.07110360981009e-05, "epoch": 1.6444444444444444, "percentage": 54.81, "elapsed_time": "0:02:17", "remaining_time": "0:01:53"} |
|
{"current_steps": 750, "total_steps": 1350, "loss": 1.2966, "lr": 4.941823670993016e-05, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "0:02:19", "remaining_time": "0:01:51"} |
|
{"current_steps": 760, "total_steps": 1350, "loss": 0.9482, "lr": 4.8125826249845375e-05, "epoch": 1.6888888888888889, "percentage": 56.3, "elapsed_time": "0:02:21", "remaining_time": "0:01:49"} |
|
{"current_steps": 770, "total_steps": 1350, "loss": 1.1203, "lr": 4.683466873717379e-05, "epoch": 1.7111111111111112, "percentage": 57.04, "elapsed_time": "0:02:23", "remaining_time": "0:01:48"} |
|
{"current_steps": 780, "total_steps": 1350, "loss": 0.9876, "lr": 4.55456273536057e-05, "epoch": 1.7333333333333334, "percentage": 57.78, "elapsed_time": "0:02:25", "remaining_time": "0:01:46"} |
|
{"current_steps": 790, "total_steps": 1350, "loss": 0.9708, "lr": 4.4259563866128754e-05, "epoch": 1.7555555555555555, "percentage": 58.52, "elapsed_time": "0:02:26", "remaining_time": "0:01:44"} |
|
{"current_steps": 800, "total_steps": 1350, "loss": 1.1659, "lr": 4.297733805090819e-05, "epoch": 1.7777777777777777, "percentage": 59.26, "elapsed_time": "0:02:28", "remaining_time": "0:01:42"} |
|
{"current_steps": 810, "total_steps": 1350, "loss": 1.0767, "lr": 4.169980711849781e-05, "epoch": 1.8, "percentage": 60.0, "elapsed_time": "0:02:30", "remaining_time": "0:01:40"} |
|
{"current_steps": 820, "total_steps": 1350, "loss": 0.9197, "lr": 4.0427825140766306e-05, "epoch": 1.8222222222222222, "percentage": 60.74, "elapsed_time": "0:02:32", "remaining_time": "0:01:38"} |
|
{"current_steps": 830, "total_steps": 1350, "loss": 1.0032, "lr": 3.916224247992184e-05, "epoch": 1.8444444444444446, "percentage": 61.48, "elapsed_time": "0:02:33", "remaining_time": "0:01:36"} |
|
{"current_steps": 840, "total_steps": 1350, "loss": 0.9162, "lr": 3.790390522001662e-05, "epoch": 1.8666666666666667, "percentage": 62.22, "elapsed_time": "0:02:35", "remaining_time": "0:01:34"} |
|
{"current_steps": 850, "total_steps": 1350, "loss": 0.9894, "lr": 3.665365460131165e-05, "epoch": 1.8888888888888888, "percentage": 62.96, "elapsed_time": "0:02:37", "remaining_time": "0:01:32"} |
|
{"current_steps": 860, "total_steps": 1350, "loss": 1.0847, "lr": 3.541232645787964e-05, "epoch": 1.911111111111111, "percentage": 63.7, "elapsed_time": "0:02:38", "remaining_time": "0:01:30"} |
|
{"current_steps": 870, "total_steps": 1350, "loss": 1.0293, "lr": 3.418075065882217e-05, "epoch": 1.9333333333333333, "percentage": 64.44, "elapsed_time": "0:02:40", "remaining_time": "0:01:28"} |
|
{"current_steps": 880, "total_steps": 1350, "loss": 1.1167, "lr": 3.295975055347464e-05, "epoch": 1.9555555555555557, "percentage": 65.19, "elapsed_time": "0:02:42", "remaining_time": "0:01:26"} |
|
{"current_steps": 890, "total_steps": 1350, "loss": 0.9419, "lr": 3.175014242096985e-05, "epoch": 1.9777777777777779, "percentage": 65.93, "elapsed_time": "0:02:43", "remaining_time": "0:01:24"} |
|
{"current_steps": 900, "total_steps": 1350, "loss": 1.0782, "lr": 3.0552734924528306e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:02:45", "remaining_time": "0:01:22"} |
|
{"current_steps": 910, "total_steps": 1350, "loss": 0.7008, "lr": 2.936832857084003e-05, "epoch": 2.022222222222222, "percentage": 67.41, "elapsed_time": "0:02:47", "remaining_time": "0:01:20"} |
|
{"current_steps": 920, "total_steps": 1350, "loss": 0.5128, "lr": 2.8197715174899185e-05, "epoch": 2.0444444444444443, "percentage": 68.15, "elapsed_time": "0:02:48", "remaining_time": "0:01:18"} |
|
{"current_steps": 930, "total_steps": 1350, "loss": 0.4185, "lr": 2.7041677330649407e-05, "epoch": 2.066666666666667, "percentage": 68.89, "elapsed_time": "0:02:50", "remaining_time": "0:01:17"} |
|
{"current_steps": 940, "total_steps": 1350, "loss": 0.52, "lr": 2.590098788779396e-05, "epoch": 2.088888888888889, "percentage": 69.63, "elapsed_time": "0:02:52", "remaining_time": "0:01:15"} |
|
{"current_steps": 950, "total_steps": 1350, "loss": 0.7065, "lr": 2.4776409435119775e-05, "epoch": 2.111111111111111, "percentage": 70.37, "elapsed_time": "0:02:54", "remaining_time": "0:01:13"} |
|
{"current_steps": 960, "total_steps": 1350, "loss": 0.3988, "lr": 2.3668693790681634e-05, "epoch": 2.1333333333333333, "percentage": 71.11, "elapsed_time": "0:02:55", "remaining_time": "0:01:11"} |
|
{"current_steps": 970, "total_steps": 1350, "loss": 0.6353, "lr": 2.257858149918688e-05, "epoch": 2.1555555555555554, "percentage": 71.85, "elapsed_time": "0:02:57", "remaining_time": "0:01:09"} |
|
{"current_steps": 980, "total_steps": 1350, "loss": 0.4815, "lr": 2.15068013369166e-05, "epoch": 2.1777777777777776, "percentage": 72.59, "elapsed_time": "0:02:59", "remaining_time": "0:01:07"} |
|
{"current_steps": 990, "total_steps": 1350, "loss": 0.5903, "lr": 2.0454069824514444e-05, "epoch": 2.2, "percentage": 73.33, "elapsed_time": "0:03:01", "remaining_time": "0:01:05"} |
|
{"current_steps": 1000, "total_steps": 1350, "loss": 0.5375, "lr": 1.942109074796888e-05, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "0:03:02", "remaining_time": "0:01:03"} |
|
{"current_steps": 1000, "total_steps": 1350, "eval_loss": 1.9768437147140503, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "0:03:06", "remaining_time": "0:01:05"} |
|
{"current_steps": 1010, "total_steps": 1350, "loss": 0.4914, "lr": 1.8408554688108786e-05, "epoch": 2.2444444444444445, "percentage": 74.81, "elapsed_time": "0:03:12", "remaining_time": "0:01:04"} |
|
{"current_steps": 1020, "total_steps": 1350, "loss": 0.6643, "lr": 1.7417138558927244e-05, "epoch": 2.2666666666666666, "percentage": 75.56, "elapsed_time": "0:03:14", "remaining_time": "0:01:02"} |
|
{"current_steps": 1030, "total_steps": 1350, "loss": 0.4727, "lr": 1.6447505155042088e-05, "epoch": 2.2888888888888888, "percentage": 76.3, "elapsed_time": "0:03:16", "remaining_time": "0:01:01"} |
|
{"current_steps": 1040, "total_steps": 1350, "loss": 0.5654, "lr": 1.5500302708595648e-05, "epoch": 2.311111111111111, "percentage": 77.04, "elapsed_time": "0:03:18", "remaining_time": "0:00:59"} |
|
{"current_steps": 1050, "total_steps": 1350, "loss": 0.4691, "lr": 1.4576164455890013e-05, "epoch": 2.3333333333333335, "percentage": 77.78, "elapsed_time": "0:03:19", "remaining_time": "0:00:57"} |
|
{"current_steps": 1060, "total_steps": 1350, "loss": 0.5061, "lr": 1.3675708214047578e-05, "epoch": 2.3555555555555556, "percentage": 78.52, "elapsed_time": "0:03:21", "remaining_time": "0:00:55"} |
|
{"current_steps": 1070, "total_steps": 1350, "loss": 0.4352, "lr": 1.2799535967979747e-05, "epoch": 2.3777777777777778, "percentage": 79.26, "elapsed_time": "0:03:23", "remaining_time": "0:00:53"} |
|
{"current_steps": 1080, "total_steps": 1350, "loss": 0.5483, "lr": 1.194823346793998e-05, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "0:03:24", "remaining_time": "0:00:51"} |
|
{"current_steps": 1090, "total_steps": 1350, "loss": 0.4424, "lr": 1.1122369837930363e-05, "epoch": 2.422222222222222, "percentage": 80.74, "elapsed_time": "0:03:26", "remaining_time": "0:00:49"} |
|
{"current_steps": 1100, "total_steps": 1350, "loss": 0.4717, "lr": 1.0322497195223285e-05, "epoch": 2.4444444444444446, "percentage": 81.48, "elapsed_time": "0:03:28", "remaining_time": "0:00:47"} |
|
{"current_steps": 1110, "total_steps": 1350, "loss": 0.4239, "lr": 9.549150281252633e-06, "epoch": 2.466666666666667, "percentage": 82.22, "elapsed_time": "0:03:30", "remaining_time": "0:00:45"} |
|
{"current_steps": 1120, "total_steps": 1350, "loss": 0.6657, "lr": 8.802846104121477e-06, "epoch": 2.488888888888889, "percentage": 82.96, "elapsed_time": "0:03:31", "remaining_time": "0:00:43"} |
|
{"current_steps": 1130, "total_steps": 1350, "loss": 0.4603, "lr": 8.084083592964942e-06, "epoch": 2.511111111111111, "percentage": 83.7, "elapsed_time": "0:03:33", "remaining_time": "0:00:41"} |
|
{"current_steps": 1140, "total_steps": 1350, "loss": 0.4783, "lr": 7.393343264399438e-06, "epoch": 2.533333333333333, "percentage": 84.44, "elapsed_time": "0:03:35", "remaining_time": "0:00:39"} |
|
{"current_steps": 1150, "total_steps": 1350, "loss": 0.5769, "lr": 6.7310869012814585e-06, "epoch": 2.5555555555555554, "percentage": 85.19, "elapsed_time": "0:03:36", "remaining_time": "0:00:37"} |
|
{"current_steps": 1160, "total_steps": 1350, "loss": 0.6047, "lr": 6.097757243990321e-06, "epoch": 2.5777777777777775, "percentage": 85.93, "elapsed_time": "0:03:38", "remaining_time": "0:00:35"} |
|
{"current_steps": 1170, "total_steps": 1350, "loss": 0.3204, "lr": 5.493777694441521e-06, "epoch": 2.6, "percentage": 86.67, "elapsed_time": "0:03:40", "remaining_time": "0:00:33"} |
|
{"current_steps": 1180, "total_steps": 1350, "loss": 0.4655, "lr": 4.919552033028513e-06, "epoch": 2.6222222222222222, "percentage": 87.41, "elapsed_time": "0:03:42", "remaining_time": "0:00:31"} |
|
{"current_steps": 1190, "total_steps": 1350, "loss": 0.5527, "lr": 4.375464148682096e-06, "epoch": 2.6444444444444444, "percentage": 88.15, "elapsed_time": "0:03:43", "remaining_time": "0:00:30"} |
|
{"current_steps": 1200, "total_steps": 1350, "loss": 0.5065, "lr": 3.861877782227885e-06, "epoch": 2.6666666666666665, "percentage": 88.89, "elapsed_time": "0:03:45", "remaining_time": "0:00:28"} |
|
{"current_steps": 1210, "total_steps": 1350, "loss": 0.4094, "lr": 3.3791362832135133e-06, "epoch": 2.688888888888889, "percentage": 89.63, "elapsed_time": "0:03:47", "remaining_time": "0:00:26"} |
|
{"current_steps": 1220, "total_steps": 1350, "loss": 0.6052, "lr": 2.9275623803680596e-06, "epoch": 2.7111111111111112, "percentage": 90.37, "elapsed_time": "0:03:49", "remaining_time": "0:00:24"} |
|
{"current_steps": 1230, "total_steps": 1350, "loss": 0.491, "lr": 2.5074579658471266e-06, "epoch": 2.7333333333333334, "percentage": 91.11, "elapsed_time": "0:03:51", "remaining_time": "0:00:22"} |
|
{"current_steps": 1240, "total_steps": 1350, "loss": 0.5293, "lr": 2.1191038934079643e-06, "epoch": 2.7555555555555555, "percentage": 91.85, "elapsed_time": "0:03:53", "remaining_time": "0:00:20"} |
|
{"current_steps": 1250, "total_steps": 1350, "loss": 0.5024, "lr": 1.7627597906493654e-06, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "0:03:55", "remaining_time": "0:00:18"} |
|
{"current_steps": 1260, "total_steps": 1350, "loss": 0.4411, "lr": 1.438663885441982e-06, "epoch": 2.8, "percentage": 93.33, "elapsed_time": "0:03:56", "remaining_time": "0:00:16"} |
|
{"current_steps": 1270, "total_steps": 1350, "loss": 0.616, "lr": 1.1470328466651304e-06, "epoch": 2.822222222222222, "percentage": 94.07, "elapsed_time": "0:03:58", "remaining_time": "0:00:15"} |
|
{"current_steps": 1280, "total_steps": 1350, "loss": 0.5948, "lr": 8.880616393563967e-07, "epoch": 2.8444444444444446, "percentage": 94.81, "elapsed_time": "0:04:00", "remaining_time": "0:00:13"} |
|
{"current_steps": 1290, "total_steps": 1350, "loss": 0.4361, "lr": 6.61923394371039e-07, "epoch": 2.8666666666666667, "percentage": 95.56, "elapsed_time": "0:04:01", "remaining_time": "0:00:11"} |
|
{"current_steps": 1300, "total_steps": 1350, "loss": 0.4553, "lr": 4.6876929263829915e-07, "epoch": 2.888888888888889, "percentage": 96.3, "elapsed_time": "0:04:03", "remaining_time": "0:00:09"} |
|
{"current_steps": 1310, "total_steps": 1350, "loss": 0.407, "lr": 3.087284640918786e-07, "epoch": 2.911111111111111, "percentage": 97.04, "elapsed_time": "0:04:05", "remaining_time": "0:00:07"} |
|
{"current_steps": 1320, "total_steps": 1350, "loss": 0.4567, "lr": 1.819079013423153e-07, "epoch": 2.9333333333333336, "percentage": 97.78, "elapsed_time": "0:04:06", "remaining_time": "0:00:05"} |
|
{"current_steps": 1330, "total_steps": 1350, "loss": 0.5011, "lr": 8.839238814886685e-08, "epoch": 2.9555555555555557, "percentage": 98.52, "elapsed_time": "0:04:08", "remaining_time": "0:00:03"} |
|
{"current_steps": 1340, "total_steps": 1350, "loss": 0.5416, "lr": 2.824444273875071e-08, "epoch": 2.977777777777778, "percentage": 99.26, "elapsed_time": "0:04:10", "remaining_time": "0:00:01"} |
|
{"current_steps": 1350, "total_steps": 1350, "loss": 0.4591, "lr": 1.5042760116212861e-09, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:04:12", "remaining_time": "0:00:00"} |
|
{"current_steps": 1350, "total_steps": 1350, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:04:15", "remaining_time": "0:00:00"} |
|
|