diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,9990 @@ +{ + "best_metric": 6.867476942316711, + "best_model_checkpoint": "./checkpoint-37000", + "epoch": 401.50564617314933, + "eval_steps": 1000, + "global_step": 40000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.25, + "learning_rate": 5.000000000000001e-07, + "loss": 0.887, + "step": 25 + }, + { + "epoch": 0.5, + "learning_rate": 1.0000000000000002e-06, + "loss": 0.5318, + "step": 50 + }, + { + "epoch": 0.75, + "learning_rate": 1.5e-06, + "loss": 0.349, + "step": 75 + }, + { + "epoch": 1.0, + "learning_rate": 2.0000000000000003e-06, + "loss": 0.2908, + "step": 100 + }, + { + "epoch": 1.25, + "learning_rate": 2.5e-06, + "loss": 0.2495, + "step": 125 + }, + { + "epoch": 1.51, + "learning_rate": 3e-06, + "loss": 0.227, + "step": 150 + }, + { + "epoch": 1.76, + "learning_rate": 3.5e-06, + "loss": 0.2084, + "step": 175 + }, + { + "epoch": 2.01, + "learning_rate": 4.000000000000001e-06, + "loss": 0.1904, + "step": 200 + }, + { + "epoch": 2.26, + "learning_rate": 4.5e-06, + "loss": 0.1543, + "step": 225 + }, + { + "epoch": 2.51, + "learning_rate": 5e-06, + "loss": 0.147, + "step": 250 + }, + { + "epoch": 2.76, + "learning_rate": 5.500000000000001e-06, + "loss": 0.141, + "step": 275 + }, + { + "epoch": 3.01, + "learning_rate": 6e-06, + "loss": 0.1351, + "step": 300 + }, + { + "epoch": 3.26, + "learning_rate": 6.5000000000000004e-06, + "loss": 0.0963, + "step": 325 + }, + { + "epoch": 3.51, + "learning_rate": 7e-06, + "loss": 0.0932, + "step": 350 + }, + { + "epoch": 3.76, + "learning_rate": 7.500000000000001e-06, + "loss": 0.0977, + "step": 375 + }, + { + "epoch": 4.02, + "learning_rate": 8.000000000000001e-06, + "loss": 0.0942, + "step": 400 + }, + { + "epoch": 4.27, + "learning_rate": 8.5e-06, + "loss": 0.0607, + "step": 425 + }, + { + "epoch": 4.52, + "learning_rate": 9e-06, + "loss": 0.0603, + "step": 450 + }, + { + "epoch": 4.77, + "learning_rate": 9.5e-06, + "loss": 0.0646, + "step": 475 + }, + { + "epoch": 5.02, + "learning_rate": 1e-05, + "loss": 0.063, + "step": 500 + }, + { + "epoch": 5.27, + "learning_rate": 9.99367088607595e-06, + "loss": 0.0376, + "step": 525 + }, + { + "epoch": 5.52, + "learning_rate": 9.9873417721519e-06, + "loss": 0.0401, + "step": 550 + }, + { + "epoch": 5.77, + "learning_rate": 9.981012658227849e-06, + "loss": 0.0411, + "step": 575 + }, + { + "epoch": 6.02, + "learning_rate": 9.974683544303799e-06, + "loss": 0.0404, + "step": 600 + }, + { + "epoch": 6.27, + "learning_rate": 9.968354430379748e-06, + "loss": 0.025, + "step": 625 + }, + { + "epoch": 6.52, + "learning_rate": 9.962025316455697e-06, + "loss": 0.0242, + "step": 650 + }, + { + "epoch": 6.78, + "learning_rate": 9.955696202531647e-06, + "loss": 0.0261, + "step": 675 + }, + { + "epoch": 7.03, + "learning_rate": 9.949367088607596e-06, + "loss": 0.0235, + "step": 700 + }, + { + "epoch": 7.28, + "learning_rate": 9.943037974683544e-06, + "loss": 0.0147, + "step": 725 + }, + { + "epoch": 7.53, + "learning_rate": 9.936708860759493e-06, + "loss": 0.0161, + "step": 750 + }, + { + "epoch": 7.78, + "learning_rate": 9.930379746835443e-06, + "loss": 0.0158, + "step": 775 + }, + { + "epoch": 8.03, + "learning_rate": 9.924050632911392e-06, + "loss": 0.0154, + "step": 800 + }, + { + "epoch": 8.28, + "learning_rate": 9.917721518987342e-06, + "loss": 0.0098, + "step": 825 + }, + { + "epoch": 8.53, + "learning_rate": 9.911392405063291e-06, + "loss": 0.0101, + "step": 850 + }, + { + "epoch": 8.78, + "learning_rate": 9.90506329113924e-06, + "loss": 0.011, + "step": 875 + }, + { + "epoch": 9.03, + "learning_rate": 9.89873417721519e-06, + "loss": 0.0112, + "step": 900 + }, + { + "epoch": 9.28, + "learning_rate": 9.892405063291141e-06, + "loss": 0.007, + "step": 925 + }, + { + "epoch": 9.54, + "learning_rate": 9.88607594936709e-06, + "loss": 0.0074, + "step": 950 + }, + { + "epoch": 9.79, + "learning_rate": 9.87974683544304e-06, + "loss": 0.0076, + "step": 975 + }, + { + "epoch": 10.04, + "learning_rate": 9.87341772151899e-06, + "loss": 0.0095, + "step": 1000 + }, + { + "epoch": 10.04, + "eval_loss": 0.20232713222503662, + "eval_runtime": 2823.9879, + "eval_samples_per_second": 4.512, + "eval_steps_per_second": 0.282, + "eval_wer": 9.680318899484133, + "step": 1000 + }, + { + "epoch": 10.29, + "learning_rate": 9.867088607594937e-06, + "loss": 0.0068, + "step": 1025 + }, + { + "epoch": 10.54, + "learning_rate": 9.860759493670887e-06, + "loss": 0.0062, + "step": 1050 + }, + { + "epoch": 10.79, + "learning_rate": 9.854430379746836e-06, + "loss": 0.0065, + "step": 1075 + }, + { + "epoch": 11.04, + "learning_rate": 9.848101265822785e-06, + "loss": 0.0059, + "step": 1100 + }, + { + "epoch": 11.29, + "learning_rate": 9.841772151898735e-06, + "loss": 0.0041, + "step": 1125 + }, + { + "epoch": 11.54, + "learning_rate": 9.835443037974684e-06, + "loss": 0.0043, + "step": 1150 + }, + { + "epoch": 11.79, + "learning_rate": 9.829113924050634e-06, + "loss": 0.0043, + "step": 1175 + }, + { + "epoch": 12.05, + "learning_rate": 9.822784810126583e-06, + "loss": 0.0046, + "step": 1200 + }, + { + "epoch": 12.3, + "learning_rate": 9.816455696202533e-06, + "loss": 0.0042, + "step": 1225 + }, + { + "epoch": 12.55, + "learning_rate": 9.810126582278482e-06, + "loss": 0.004, + "step": 1250 + }, + { + "epoch": 12.8, + "learning_rate": 9.803797468354431e-06, + "loss": 0.004, + "step": 1275 + }, + { + "epoch": 13.05, + "learning_rate": 9.79746835443038e-06, + "loss": 0.0039, + "step": 1300 + }, + { + "epoch": 13.3, + "learning_rate": 9.79113924050633e-06, + "loss": 0.0031, + "step": 1325 + }, + { + "epoch": 13.55, + "learning_rate": 9.78481012658228e-06, + "loss": 0.0029, + "step": 1350 + }, + { + "epoch": 13.8, + "learning_rate": 9.778481012658229e-06, + "loss": 0.003, + "step": 1375 + }, + { + "epoch": 14.05, + "learning_rate": 9.772151898734179e-06, + "loss": 0.0032, + "step": 1400 + }, + { + "epoch": 14.3, + "learning_rate": 9.765822784810128e-06, + "loss": 0.003, + "step": 1425 + }, + { + "epoch": 14.55, + "learning_rate": 9.759493670886077e-06, + "loss": 0.0029, + "step": 1450 + }, + { + "epoch": 14.81, + "learning_rate": 9.753164556962025e-06, + "loss": 0.0031, + "step": 1475 + }, + { + "epoch": 15.06, + "learning_rate": 9.746835443037975e-06, + "loss": 0.004, + "step": 1500 + }, + { + "epoch": 15.31, + "learning_rate": 9.740506329113924e-06, + "loss": 0.0034, + "step": 1525 + }, + { + "epoch": 15.56, + "learning_rate": 9.734177215189873e-06, + "loss": 0.0037, + "step": 1550 + }, + { + "epoch": 15.81, + "learning_rate": 9.727848101265823e-06, + "loss": 0.0038, + "step": 1575 + }, + { + "epoch": 16.06, + "learning_rate": 9.721518987341772e-06, + "loss": 0.0045, + "step": 1600 + }, + { + "epoch": 16.31, + "learning_rate": 9.715189873417722e-06, + "loss": 0.0039, + "step": 1625 + }, + { + "epoch": 16.56, + "learning_rate": 9.708860759493671e-06, + "loss": 0.0038, + "step": 1650 + }, + { + "epoch": 16.81, + "learning_rate": 9.70253164556962e-06, + "loss": 0.0043, + "step": 1675 + }, + { + "epoch": 17.06, + "learning_rate": 9.69620253164557e-06, + "loss": 0.0046, + "step": 1700 + }, + { + "epoch": 17.31, + "learning_rate": 9.68987341772152e-06, + "loss": 0.0041, + "step": 1725 + }, + { + "epoch": 17.57, + "learning_rate": 9.68354430379747e-06, + "loss": 0.0034, + "step": 1750 + }, + { + "epoch": 17.82, + "learning_rate": 9.677215189873418e-06, + "loss": 0.004, + "step": 1775 + }, + { + "epoch": 18.07, + "learning_rate": 9.670886075949368e-06, + "loss": 0.0034, + "step": 1800 + }, + { + "epoch": 18.32, + "learning_rate": 9.664556962025317e-06, + "loss": 0.0029, + "step": 1825 + }, + { + "epoch": 18.57, + "learning_rate": 9.658227848101267e-06, + "loss": 0.0031, + "step": 1850 + }, + { + "epoch": 18.82, + "learning_rate": 9.651898734177216e-06, + "loss": 0.0033, + "step": 1875 + }, + { + "epoch": 19.07, + "learning_rate": 9.645569620253165e-06, + "loss": 0.0032, + "step": 1900 + }, + { + "epoch": 19.32, + "learning_rate": 9.639240506329115e-06, + "loss": 0.0026, + "step": 1925 + }, + { + "epoch": 19.57, + "learning_rate": 9.632911392405064e-06, + "loss": 0.0031, + "step": 1950 + }, + { + "epoch": 19.82, + "learning_rate": 9.626582278481014e-06, + "loss": 0.0039, + "step": 1975 + }, + { + "epoch": 20.08, + "learning_rate": 9.620253164556963e-06, + "loss": 0.0032, + "step": 2000 + }, + { + "epoch": 20.08, + "eval_loss": 0.21532024443149567, + "eval_runtime": 2792.5976, + "eval_samples_per_second": 4.563, + "eval_steps_per_second": 0.285, + "eval_wer": 9.052094731905582, + "step": 2000 + }, + { + "epoch": 20.33, + "learning_rate": 9.613924050632913e-06, + "loss": 0.0026, + "step": 2025 + }, + { + "epoch": 20.58, + "learning_rate": 9.607594936708862e-06, + "loss": 0.0022, + "step": 2050 + }, + { + "epoch": 20.83, + "learning_rate": 9.601265822784811e-06, + "loss": 0.0028, + "step": 2075 + }, + { + "epoch": 21.08, + "learning_rate": 9.59493670886076e-06, + "loss": 0.0025, + "step": 2100 + }, + { + "epoch": 21.33, + "learning_rate": 9.58860759493671e-06, + "loss": 0.0022, + "step": 2125 + }, + { + "epoch": 21.58, + "learning_rate": 9.58227848101266e-06, + "loss": 0.002, + "step": 2150 + }, + { + "epoch": 21.83, + "learning_rate": 9.575949367088609e-06, + "loss": 0.0026, + "step": 2175 + }, + { + "epoch": 22.08, + "learning_rate": 9.569620253164559e-06, + "loss": 0.0027, + "step": 2200 + }, + { + "epoch": 22.33, + "learning_rate": 9.563291139240506e-06, + "loss": 0.0018, + "step": 2225 + }, + { + "epoch": 22.58, + "learning_rate": 9.556962025316456e-06, + "loss": 0.002, + "step": 2250 + }, + { + "epoch": 22.84, + "learning_rate": 9.550632911392405e-06, + "loss": 0.003, + "step": 2275 + }, + { + "epoch": 23.09, + "learning_rate": 9.544303797468355e-06, + "loss": 0.0022, + "step": 2300 + }, + { + "epoch": 23.34, + "learning_rate": 9.537974683544304e-06, + "loss": 0.002, + "step": 2325 + }, + { + "epoch": 23.59, + "learning_rate": 9.531645569620253e-06, + "loss": 0.0019, + "step": 2350 + }, + { + "epoch": 23.84, + "learning_rate": 9.525316455696203e-06, + "loss": 0.0026, + "step": 2375 + }, + { + "epoch": 24.09, + "learning_rate": 9.518987341772152e-06, + "loss": 0.0022, + "step": 2400 + }, + { + "epoch": 24.34, + "learning_rate": 9.512658227848102e-06, + "loss": 0.0019, + "step": 2425 + }, + { + "epoch": 24.59, + "learning_rate": 9.506329113924051e-06, + "loss": 0.0025, + "step": 2450 + }, + { + "epoch": 24.84, + "learning_rate": 9.5e-06, + "loss": 0.0027, + "step": 2475 + }, + { + "epoch": 25.09, + "learning_rate": 9.49367088607595e-06, + "loss": 0.0023, + "step": 2500 + }, + { + "epoch": 25.35, + "learning_rate": 9.4873417721519e-06, + "loss": 0.0019, + "step": 2525 + }, + { + "epoch": 25.6, + "learning_rate": 9.481012658227849e-06, + "loss": 0.0018, + "step": 2550 + }, + { + "epoch": 25.85, + "learning_rate": 9.474683544303798e-06, + "loss": 0.0021, + "step": 2575 + }, + { + "epoch": 26.1, + "learning_rate": 9.468354430379748e-06, + "loss": 0.0022, + "step": 2600 + }, + { + "epoch": 26.35, + "learning_rate": 9.462025316455697e-06, + "loss": 0.0025, + "step": 2625 + }, + { + "epoch": 26.6, + "learning_rate": 9.455696202531647e-06, + "loss": 0.0022, + "step": 2650 + }, + { + "epoch": 26.85, + "learning_rate": 9.449367088607596e-06, + "loss": 0.0024, + "step": 2675 + }, + { + "epoch": 27.1, + "learning_rate": 9.443037974683545e-06, + "loss": 0.0028, + "step": 2700 + }, + { + "epoch": 27.35, + "learning_rate": 9.436708860759495e-06, + "loss": 0.0025, + "step": 2725 + }, + { + "epoch": 27.6, + "learning_rate": 9.430379746835444e-06, + "loss": 0.0026, + "step": 2750 + }, + { + "epoch": 27.85, + "learning_rate": 9.424050632911394e-06, + "loss": 0.0026, + "step": 2775 + }, + { + "epoch": 28.11, + "learning_rate": 9.417721518987343e-06, + "loss": 0.0024, + "step": 2800 + }, + { + "epoch": 28.36, + "learning_rate": 9.411392405063293e-06, + "loss": 0.0025, + "step": 2825 + }, + { + "epoch": 28.61, + "learning_rate": 9.405063291139242e-06, + "loss": 0.0023, + "step": 2850 + }, + { + "epoch": 28.86, + "learning_rate": 9.398734177215191e-06, + "loss": 0.0027, + "step": 2875 + }, + { + "epoch": 29.11, + "learning_rate": 9.39240506329114e-06, + "loss": 0.0025, + "step": 2900 + }, + { + "epoch": 29.36, + "learning_rate": 9.38607594936709e-06, + "loss": 0.0026, + "step": 2925 + }, + { + "epoch": 29.61, + "learning_rate": 9.379746835443038e-06, + "loss": 0.0021, + "step": 2950 + }, + { + "epoch": 29.86, + "learning_rate": 9.373417721518987e-06, + "loss": 0.0025, + "step": 2975 + }, + { + "epoch": 30.11, + "learning_rate": 9.367088607594937e-06, + "loss": 0.0023, + "step": 3000 + }, + { + "epoch": 30.11, + "eval_loss": 0.22344575822353363, + "eval_runtime": 2793.5917, + "eval_samples_per_second": 4.561, + "eval_steps_per_second": 0.285, + "eval_wer": 8.86450680006253, + "step": 3000 + }, + { + "epoch": 30.36, + "learning_rate": 9.360759493670886e-06, + "loss": 0.0017, + "step": 3025 + }, + { + "epoch": 30.61, + "learning_rate": 9.354430379746836e-06, + "loss": 0.0018, + "step": 3050 + }, + { + "epoch": 30.87, + "learning_rate": 9.348101265822785e-06, + "loss": 0.0019, + "step": 3075 + }, + { + "epoch": 31.12, + "learning_rate": 9.341772151898735e-06, + "loss": 0.0017, + "step": 3100 + }, + { + "epoch": 31.37, + "learning_rate": 9.335443037974684e-06, + "loss": 0.0013, + "step": 3125 + }, + { + "epoch": 31.62, + "learning_rate": 9.329113924050633e-06, + "loss": 0.0016, + "step": 3150 + }, + { + "epoch": 31.87, + "learning_rate": 9.322784810126583e-06, + "loss": 0.0018, + "step": 3175 + }, + { + "epoch": 32.12, + "learning_rate": 9.316455696202532e-06, + "loss": 0.0016, + "step": 3200 + }, + { + "epoch": 32.37, + "learning_rate": 9.310126582278482e-06, + "loss": 0.0017, + "step": 3225 + }, + { + "epoch": 32.62, + "learning_rate": 9.303797468354431e-06, + "loss": 0.0014, + "step": 3250 + }, + { + "epoch": 32.87, + "learning_rate": 9.29746835443038e-06, + "loss": 0.0016, + "step": 3275 + }, + { + "epoch": 33.12, + "learning_rate": 9.29113924050633e-06, + "loss": 0.0013, + "step": 3300 + }, + { + "epoch": 33.38, + "learning_rate": 9.28481012658228e-06, + "loss": 0.0012, + "step": 3325 + }, + { + "epoch": 33.63, + "learning_rate": 9.278481012658229e-06, + "loss": 0.0011, + "step": 3350 + }, + { + "epoch": 33.88, + "learning_rate": 9.272151898734178e-06, + "loss": 0.0018, + "step": 3375 + }, + { + "epoch": 34.13, + "learning_rate": 9.265822784810128e-06, + "loss": 0.0019, + "step": 3400 + }, + { + "epoch": 34.38, + "learning_rate": 9.259493670886077e-06, + "loss": 0.0015, + "step": 3425 + }, + { + "epoch": 34.63, + "learning_rate": 9.253164556962027e-06, + "loss": 0.002, + "step": 3450 + }, + { + "epoch": 34.88, + "learning_rate": 9.246835443037976e-06, + "loss": 0.0023, + "step": 3475 + }, + { + "epoch": 35.13, + "learning_rate": 9.240506329113925e-06, + "loss": 0.0025, + "step": 3500 + }, + { + "epoch": 35.38, + "learning_rate": 9.234177215189875e-06, + "loss": 0.0023, + "step": 3525 + }, + { + "epoch": 35.63, + "learning_rate": 9.227848101265824e-06, + "loss": 0.0026, + "step": 3550 + }, + { + "epoch": 35.88, + "learning_rate": 9.221518987341774e-06, + "loss": 0.0029, + "step": 3575 + }, + { + "epoch": 36.14, + "learning_rate": 9.215189873417723e-06, + "loss": 0.0022, + "step": 3600 + }, + { + "epoch": 36.39, + "learning_rate": 9.208860759493673e-06, + "loss": 0.0024, + "step": 3625 + }, + { + "epoch": 36.64, + "learning_rate": 9.202531645569622e-06, + "loss": 0.0021, + "step": 3650 + }, + { + "epoch": 36.89, + "learning_rate": 9.196202531645571e-06, + "loss": 0.0021, + "step": 3675 + }, + { + "epoch": 37.14, + "learning_rate": 9.189873417721519e-06, + "loss": 0.0017, + "step": 3700 + }, + { + "epoch": 37.39, + "learning_rate": 9.183544303797469e-06, + "loss": 0.0013, + "step": 3725 + }, + { + "epoch": 37.64, + "learning_rate": 9.177215189873418e-06, + "loss": 0.0024, + "step": 3750 + }, + { + "epoch": 37.89, + "learning_rate": 9.170886075949367e-06, + "loss": 0.0029, + "step": 3775 + }, + { + "epoch": 38.14, + "learning_rate": 9.164556962025317e-06, + "loss": 0.0019, + "step": 3800 + }, + { + "epoch": 38.39, + "learning_rate": 9.158227848101266e-06, + "loss": 0.0016, + "step": 3825 + }, + { + "epoch": 38.64, + "learning_rate": 9.151898734177216e-06, + "loss": 0.0019, + "step": 3850 + }, + { + "epoch": 38.9, + "learning_rate": 9.145569620253165e-06, + "loss": 0.0028, + "step": 3875 + }, + { + "epoch": 39.15, + "learning_rate": 9.139240506329115e-06, + "loss": 0.003, + "step": 3900 + }, + { + "epoch": 39.4, + "learning_rate": 9.132911392405064e-06, + "loss": 0.0028, + "step": 3925 + }, + { + "epoch": 39.65, + "learning_rate": 9.126582278481013e-06, + "loss": 0.0027, + "step": 3950 + }, + { + "epoch": 39.9, + "learning_rate": 9.120253164556963e-06, + "loss": 0.0029, + "step": 3975 + }, + { + "epoch": 40.15, + "learning_rate": 9.113924050632912e-06, + "loss": 0.0023, + "step": 4000 + }, + { + "epoch": 40.15, + "eval_loss": 0.22782479226589203, + "eval_runtime": 2785.8527, + "eval_samples_per_second": 4.574, + "eval_steps_per_second": 0.286, + "eval_wer": 8.436571830545567, + "step": 4000 + }, + { + "epoch": 40.4, + "learning_rate": 9.107594936708862e-06, + "loss": 0.0026, + "step": 4025 + }, + { + "epoch": 40.65, + "learning_rate": 9.101265822784811e-06, + "loss": 0.0032, + "step": 4050 + }, + { + "epoch": 40.9, + "learning_rate": 9.09493670886076e-06, + "loss": 0.0028, + "step": 4075 + }, + { + "epoch": 41.15, + "learning_rate": 9.08860759493671e-06, + "loss": 0.0023, + "step": 4100 + }, + { + "epoch": 41.41, + "learning_rate": 9.08227848101266e-06, + "loss": 0.0016, + "step": 4125 + }, + { + "epoch": 41.66, + "learning_rate": 9.075949367088607e-06, + "loss": 0.002, + "step": 4150 + }, + { + "epoch": 41.91, + "learning_rate": 9.069620253164557e-06, + "loss": 0.002, + "step": 4175 + }, + { + "epoch": 42.16, + "learning_rate": 9.063291139240506e-06, + "loss": 0.0013, + "step": 4200 + }, + { + "epoch": 42.41, + "learning_rate": 9.056962025316457e-06, + "loss": 0.0016, + "step": 4225 + }, + { + "epoch": 42.66, + "learning_rate": 9.050632911392407e-06, + "loss": 0.002, + "step": 4250 + }, + { + "epoch": 42.91, + "learning_rate": 9.044303797468356e-06, + "loss": 0.0018, + "step": 4275 + }, + { + "epoch": 43.16, + "learning_rate": 9.037974683544305e-06, + "loss": 0.0012, + "step": 4300 + }, + { + "epoch": 43.41, + "learning_rate": 9.031645569620255e-06, + "loss": 0.0015, + "step": 4325 + }, + { + "epoch": 43.66, + "learning_rate": 9.025316455696204e-06, + "loss": 0.0012, + "step": 4350 + }, + { + "epoch": 43.91, + "learning_rate": 9.018987341772154e-06, + "loss": 0.0024, + "step": 4375 + }, + { + "epoch": 44.17, + "learning_rate": 9.012658227848103e-06, + "loss": 0.0019, + "step": 4400 + }, + { + "epoch": 44.42, + "learning_rate": 9.00632911392405e-06, + "loss": 0.0013, + "step": 4425 + }, + { + "epoch": 44.67, + "learning_rate": 9e-06, + "loss": 0.0014, + "step": 4450 + }, + { + "epoch": 44.92, + "learning_rate": 8.99367088607595e-06, + "loss": 0.0018, + "step": 4475 + }, + { + "epoch": 45.17, + "learning_rate": 8.987341772151899e-06, + "loss": 0.0018, + "step": 4500 + }, + { + "epoch": 45.42, + "learning_rate": 8.981012658227849e-06, + "loss": 0.0014, + "step": 4525 + }, + { + "epoch": 45.67, + "learning_rate": 8.974683544303798e-06, + "loss": 0.0018, + "step": 4550 + }, + { + "epoch": 45.92, + "learning_rate": 8.968354430379747e-06, + "loss": 0.0018, + "step": 4575 + }, + { + "epoch": 46.17, + "learning_rate": 8.962025316455697e-06, + "loss": 0.0012, + "step": 4600 + }, + { + "epoch": 46.42, + "learning_rate": 8.955696202531646e-06, + "loss": 0.0013, + "step": 4625 + }, + { + "epoch": 46.68, + "learning_rate": 8.949367088607596e-06, + "loss": 0.0013, + "step": 4650 + }, + { + "epoch": 46.93, + "learning_rate": 8.943037974683545e-06, + "loss": 0.0011, + "step": 4675 + }, + { + "epoch": 47.18, + "learning_rate": 8.936708860759495e-06, + "loss": 0.0008, + "step": 4700 + }, + { + "epoch": 47.43, + "learning_rate": 8.930379746835444e-06, + "loss": 0.0009, + "step": 4725 + }, + { + "epoch": 47.68, + "learning_rate": 8.924050632911393e-06, + "loss": 0.0009, + "step": 4750 + }, + { + "epoch": 47.93, + "learning_rate": 8.917721518987343e-06, + "loss": 0.001, + "step": 4775 + }, + { + "epoch": 48.18, + "learning_rate": 8.911392405063292e-06, + "loss": 0.0014, + "step": 4800 + }, + { + "epoch": 48.43, + "learning_rate": 8.905063291139242e-06, + "loss": 0.001, + "step": 4825 + }, + { + "epoch": 48.68, + "learning_rate": 8.898734177215191e-06, + "loss": 0.0013, + "step": 4850 + }, + { + "epoch": 48.93, + "learning_rate": 8.892405063291139e-06, + "loss": 0.0009, + "step": 4875 + }, + { + "epoch": 49.18, + "learning_rate": 8.886075949367088e-06, + "loss": 0.0007, + "step": 4900 + }, + { + "epoch": 49.44, + "learning_rate": 8.879746835443038e-06, + "loss": 0.0008, + "step": 4925 + }, + { + "epoch": 49.69, + "learning_rate": 8.873417721518987e-06, + "loss": 0.0007, + "step": 4950 + }, + { + "epoch": 49.94, + "learning_rate": 8.867088607594937e-06, + "loss": 0.0013, + "step": 4975 + }, + { + "epoch": 50.19, + "learning_rate": 8.860759493670886e-06, + "loss": 0.0012, + "step": 5000 + }, + { + "epoch": 50.19, + "eval_loss": 0.2259608805179596, + "eval_runtime": 2783.4754, + "eval_samples_per_second": 4.578, + "eval_steps_per_second": 0.286, + "eval_wer": 7.991050492418321, + "step": 5000 + }, + { + "epoch": 50.44, + "learning_rate": 8.854430379746835e-06, + "loss": 0.0012, + "step": 5025 + }, + { + "epoch": 50.69, + "learning_rate": 8.848101265822786e-06, + "loss": 0.0014, + "step": 5050 + }, + { + "epoch": 50.94, + "learning_rate": 8.841772151898736e-06, + "loss": 0.0012, + "step": 5075 + }, + { + "epoch": 51.19, + "learning_rate": 8.835443037974685e-06, + "loss": 0.0011, + "step": 5100 + }, + { + "epoch": 51.44, + "learning_rate": 8.829113924050635e-06, + "loss": 0.0013, + "step": 5125 + }, + { + "epoch": 51.69, + "learning_rate": 8.822784810126584e-06, + "loss": 0.0013, + "step": 5150 + }, + { + "epoch": 51.94, + "learning_rate": 8.816455696202532e-06, + "loss": 0.0015, + "step": 5175 + }, + { + "epoch": 52.2, + "learning_rate": 8.810126582278481e-06, + "loss": 0.0013, + "step": 5200 + }, + { + "epoch": 52.45, + "learning_rate": 8.80379746835443e-06, + "loss": 0.001, + "step": 5225 + }, + { + "epoch": 52.7, + "learning_rate": 8.79746835443038e-06, + "loss": 0.0015, + "step": 5250 + }, + { + "epoch": 52.95, + "learning_rate": 8.79113924050633e-06, + "loss": 0.0017, + "step": 5275 + }, + { + "epoch": 53.2, + "learning_rate": 8.784810126582279e-06, + "loss": 0.0024, + "step": 5300 + }, + { + "epoch": 53.45, + "learning_rate": 8.778481012658229e-06, + "loss": 0.0027, + "step": 5325 + }, + { + "epoch": 53.7, + "learning_rate": 8.772151898734178e-06, + "loss": 0.0023, + "step": 5350 + }, + { + "epoch": 53.95, + "learning_rate": 8.765822784810127e-06, + "loss": 0.0023, + "step": 5375 + }, + { + "epoch": 54.2, + "learning_rate": 8.759493670886077e-06, + "loss": 0.0023, + "step": 5400 + }, + { + "epoch": 54.45, + "learning_rate": 8.753164556962026e-06, + "loss": 0.0017, + "step": 5425 + }, + { + "epoch": 54.71, + "learning_rate": 8.746835443037976e-06, + "loss": 0.0014, + "step": 5450 + }, + { + "epoch": 54.96, + "learning_rate": 8.740506329113925e-06, + "loss": 0.0018, + "step": 5475 + }, + { + "epoch": 55.21, + "learning_rate": 8.734177215189874e-06, + "loss": 0.0013, + "step": 5500 + }, + { + "epoch": 55.46, + "learning_rate": 8.727848101265824e-06, + "loss": 0.0017, + "step": 5525 + }, + { + "epoch": 55.71, + "learning_rate": 8.721518987341773e-06, + "loss": 0.0018, + "step": 5550 + }, + { + "epoch": 55.96, + "learning_rate": 8.715189873417723e-06, + "loss": 0.0015, + "step": 5575 + }, + { + "epoch": 56.21, + "learning_rate": 8.708860759493672e-06, + "loss": 0.001, + "step": 5600 + }, + { + "epoch": 56.46, + "learning_rate": 8.70253164556962e-06, + "loss": 0.0009, + "step": 5625 + }, + { + "epoch": 56.71, + "learning_rate": 8.69620253164557e-06, + "loss": 0.001, + "step": 5650 + }, + { + "epoch": 56.96, + "learning_rate": 8.689873417721519e-06, + "loss": 0.0015, + "step": 5675 + }, + { + "epoch": 57.21, + "learning_rate": 8.683544303797468e-06, + "loss": 0.0016, + "step": 5700 + }, + { + "epoch": 57.47, + "learning_rate": 8.677215189873418e-06, + "loss": 0.0014, + "step": 5725 + }, + { + "epoch": 57.72, + "learning_rate": 8.670886075949367e-06, + "loss": 0.0013, + "step": 5750 + }, + { + "epoch": 57.97, + "learning_rate": 8.664556962025317e-06, + "loss": 0.0015, + "step": 5775 + }, + { + "epoch": 58.22, + "learning_rate": 8.658227848101266e-06, + "loss": 0.0016, + "step": 5800 + }, + { + "epoch": 58.47, + "learning_rate": 8.651898734177215e-06, + "loss": 0.0017, + "step": 5825 + }, + { + "epoch": 58.72, + "learning_rate": 8.645569620253166e-06, + "loss": 0.0015, + "step": 5850 + }, + { + "epoch": 58.97, + "learning_rate": 8.639240506329116e-06, + "loss": 0.0012, + "step": 5875 + }, + { + "epoch": 59.22, + "learning_rate": 8.632911392405064e-06, + "loss": 0.0013, + "step": 5900 + }, + { + "epoch": 59.47, + "learning_rate": 8.626582278481013e-06, + "loss": 0.0008, + "step": 5925 + }, + { + "epoch": 59.72, + "learning_rate": 8.620253164556963e-06, + "loss": 0.0007, + "step": 5950 + }, + { + "epoch": 59.97, + "learning_rate": 8.613924050632912e-06, + "loss": 0.0007, + "step": 5975 + }, + { + "epoch": 60.23, + "learning_rate": 8.607594936708861e-06, + "loss": 0.0005, + "step": 6000 + }, + { + "epoch": 60.23, + "eval_loss": 0.24347658455371857, + "eval_runtime": 2781.2525, + "eval_samples_per_second": 4.581, + "eval_steps_per_second": 0.287, + "eval_wer": 7.906049710801938, + "step": 6000 + }, + { + "epoch": 60.48, + "learning_rate": 8.60126582278481e-06, + "loss": 0.0006, + "step": 6025 + }, + { + "epoch": 60.73, + "learning_rate": 8.59493670886076e-06, + "loss": 0.0006, + "step": 6050 + }, + { + "epoch": 60.98, + "learning_rate": 8.58860759493671e-06, + "loss": 0.0005, + "step": 6075 + }, + { + "epoch": 61.23, + "learning_rate": 8.582278481012659e-06, + "loss": 0.0004, + "step": 6100 + }, + { + "epoch": 61.48, + "learning_rate": 8.575949367088608e-06, + "loss": 0.0005, + "step": 6125 + }, + { + "epoch": 61.73, + "learning_rate": 8.569620253164558e-06, + "loss": 0.0005, + "step": 6150 + }, + { + "epoch": 61.98, + "learning_rate": 8.563291139240507e-06, + "loss": 0.0006, + "step": 6175 + }, + { + "epoch": 62.23, + "learning_rate": 8.556962025316457e-06, + "loss": 0.0004, + "step": 6200 + }, + { + "epoch": 62.48, + "learning_rate": 8.550632911392406e-06, + "loss": 0.0003, + "step": 6225 + }, + { + "epoch": 62.74, + "learning_rate": 8.544303797468356e-06, + "loss": 0.0002, + "step": 6250 + }, + { + "epoch": 62.99, + "learning_rate": 8.537974683544305e-06, + "loss": 0.0003, + "step": 6275 + }, + { + "epoch": 63.24, + "learning_rate": 8.531645569620254e-06, + "loss": 0.0001, + "step": 6300 + }, + { + "epoch": 63.49, + "learning_rate": 8.525316455696204e-06, + "loss": 0.0002, + "step": 6325 + }, + { + "epoch": 63.74, + "learning_rate": 8.518987341772152e-06, + "loss": 0.0001, + "step": 6350 + }, + { + "epoch": 63.99, + "learning_rate": 8.512658227848101e-06, + "loss": 0.0002, + "step": 6375 + }, + { + "epoch": 64.24, + "learning_rate": 8.50632911392405e-06, + "loss": 0.0004, + "step": 6400 + }, + { + "epoch": 64.49, + "learning_rate": 8.5e-06, + "loss": 0.0003, + "step": 6425 + }, + { + "epoch": 64.74, + "learning_rate": 8.49367088607595e-06, + "loss": 0.0004, + "step": 6450 + }, + { + "epoch": 64.99, + "learning_rate": 8.487341772151899e-06, + "loss": 0.0004, + "step": 6475 + }, + { + "epoch": 65.24, + "learning_rate": 8.481012658227848e-06, + "loss": 0.0007, + "step": 6500 + }, + { + "epoch": 65.5, + "learning_rate": 8.474683544303798e-06, + "loss": 0.0007, + "step": 6525 + }, + { + "epoch": 65.75, + "learning_rate": 8.468354430379747e-06, + "loss": 0.001, + "step": 6550 + }, + { + "epoch": 66.0, + "learning_rate": 8.462025316455696e-06, + "loss": 0.0012, + "step": 6575 + }, + { + "epoch": 66.25, + "learning_rate": 8.455696202531646e-06, + "loss": 0.0014, + "step": 6600 + }, + { + "epoch": 66.5, + "learning_rate": 8.449367088607595e-06, + "loss": 0.0025, + "step": 6625 + }, + { + "epoch": 66.75, + "learning_rate": 8.443037974683545e-06, + "loss": 0.0024, + "step": 6650 + }, + { + "epoch": 67.0, + "learning_rate": 8.436708860759494e-06, + "loss": 0.0025, + "step": 6675 + }, + { + "epoch": 67.25, + "learning_rate": 8.430379746835444e-06, + "loss": 0.0024, + "step": 6700 + }, + { + "epoch": 67.5, + "learning_rate": 8.424050632911393e-06, + "loss": 0.0035, + "step": 6725 + }, + { + "epoch": 67.75, + "learning_rate": 8.417721518987342e-06, + "loss": 0.0028, + "step": 6750 + }, + { + "epoch": 68.01, + "learning_rate": 8.411392405063292e-06, + "loss": 0.0033, + "step": 6775 + }, + { + "epoch": 68.26, + "learning_rate": 8.405063291139241e-06, + "loss": 0.0026, + "step": 6800 + }, + { + "epoch": 68.51, + "learning_rate": 8.39873417721519e-06, + "loss": 0.0027, + "step": 6825 + }, + { + "epoch": 68.76, + "learning_rate": 8.39240506329114e-06, + "loss": 0.0029, + "step": 6850 + }, + { + "epoch": 69.01, + "learning_rate": 8.38607594936709e-06, + "loss": 0.0029, + "step": 6875 + }, + { + "epoch": 69.26, + "learning_rate": 8.379746835443039e-06, + "loss": 0.0022, + "step": 6900 + }, + { + "epoch": 69.51, + "learning_rate": 8.373417721518988e-06, + "loss": 0.0015, + "step": 6925 + }, + { + "epoch": 69.76, + "learning_rate": 8.367088607594938e-06, + "loss": 0.0018, + "step": 6950 + }, + { + "epoch": 70.01, + "learning_rate": 8.360759493670887e-06, + "loss": 0.002, + "step": 6975 + }, + { + "epoch": 70.26, + "learning_rate": 8.354430379746837e-06, + "loss": 0.0013, + "step": 7000 + }, + { + "epoch": 70.26, + "eval_loss": 0.2253977358341217, + "eval_runtime": 2781.6008, + "eval_samples_per_second": 4.581, + "eval_steps_per_second": 0.287, + "eval_wer": 7.848405502579333, + "step": 7000 + }, + { + "epoch": 70.51, + "learning_rate": 8.348101265822786e-06, + "loss": 0.0015, + "step": 7025 + }, + { + "epoch": 70.77, + "learning_rate": 8.341772151898736e-06, + "loss": 0.0014, + "step": 7050 + }, + { + "epoch": 71.02, + "learning_rate": 8.335443037974685e-06, + "loss": 0.0014, + "step": 7075 + }, + { + "epoch": 71.27, + "learning_rate": 8.329113924050633e-06, + "loss": 0.001, + "step": 7100 + }, + { + "epoch": 71.52, + "learning_rate": 8.322784810126582e-06, + "loss": 0.0017, + "step": 7125 + }, + { + "epoch": 71.77, + "learning_rate": 8.316455696202532e-06, + "loss": 0.0015, + "step": 7150 + }, + { + "epoch": 72.02, + "learning_rate": 8.310126582278481e-06, + "loss": 0.0013, + "step": 7175 + }, + { + "epoch": 72.27, + "learning_rate": 8.30379746835443e-06, + "loss": 0.0012, + "step": 7200 + }, + { + "epoch": 72.52, + "learning_rate": 8.29746835443038e-06, + "loss": 0.001, + "step": 7225 + }, + { + "epoch": 72.77, + "learning_rate": 8.29113924050633e-06, + "loss": 0.0014, + "step": 7250 + }, + { + "epoch": 73.02, + "learning_rate": 8.284810126582279e-06, + "loss": 0.0015, + "step": 7275 + }, + { + "epoch": 73.27, + "learning_rate": 8.278481012658228e-06, + "loss": 0.0015, + "step": 7300 + }, + { + "epoch": 73.53, + "learning_rate": 8.272151898734178e-06, + "loss": 0.001, + "step": 7325 + }, + { + "epoch": 73.78, + "learning_rate": 8.265822784810127e-06, + "loss": 0.0011, + "step": 7350 + }, + { + "epoch": 74.03, + "learning_rate": 8.259493670886076e-06, + "loss": 0.0013, + "step": 7375 + }, + { + "epoch": 74.28, + "learning_rate": 8.253164556962026e-06, + "loss": 0.0007, + "step": 7400 + }, + { + "epoch": 74.53, + "learning_rate": 8.246835443037975e-06, + "loss": 0.0006, + "step": 7425 + }, + { + "epoch": 74.78, + "learning_rate": 8.240506329113925e-06, + "loss": 0.0007, + "step": 7450 + }, + { + "epoch": 75.03, + "learning_rate": 8.234177215189874e-06, + "loss": 0.0007, + "step": 7475 + }, + { + "epoch": 75.28, + "learning_rate": 8.227848101265824e-06, + "loss": 0.0008, + "step": 7500 + }, + { + "epoch": 75.53, + "learning_rate": 8.221518987341773e-06, + "loss": 0.0007, + "step": 7525 + }, + { + "epoch": 75.78, + "learning_rate": 8.215189873417722e-06, + "loss": 0.0005, + "step": 7550 + }, + { + "epoch": 76.04, + "learning_rate": 8.208860759493672e-06, + "loss": 0.0006, + "step": 7575 + }, + { + "epoch": 76.29, + "learning_rate": 8.202531645569621e-06, + "loss": 0.0005, + "step": 7600 + }, + { + "epoch": 76.54, + "learning_rate": 8.19620253164557e-06, + "loss": 0.0005, + "step": 7625 + }, + { + "epoch": 76.79, + "learning_rate": 8.18987341772152e-06, + "loss": 0.0004, + "step": 7650 + }, + { + "epoch": 77.04, + "learning_rate": 8.18354430379747e-06, + "loss": 0.0003, + "step": 7675 + }, + { + "epoch": 77.29, + "learning_rate": 8.177215189873419e-06, + "loss": 0.0004, + "step": 7700 + }, + { + "epoch": 77.54, + "learning_rate": 8.170886075949368e-06, + "loss": 0.0005, + "step": 7725 + }, + { + "epoch": 77.79, + "learning_rate": 8.164556962025318e-06, + "loss": 0.0007, + "step": 7750 + }, + { + "epoch": 78.04, + "learning_rate": 8.158227848101267e-06, + "loss": 0.0007, + "step": 7775 + }, + { + "epoch": 78.29, + "learning_rate": 8.151898734177217e-06, + "loss": 0.0004, + "step": 7800 + }, + { + "epoch": 78.54, + "learning_rate": 8.145569620253164e-06, + "loss": 0.0005, + "step": 7825 + }, + { + "epoch": 78.8, + "learning_rate": 8.139240506329114e-06, + "loss": 0.0004, + "step": 7850 + }, + { + "epoch": 79.05, + "learning_rate": 8.132911392405063e-06, + "loss": 0.0004, + "step": 7875 + }, + { + "epoch": 79.3, + "learning_rate": 8.126582278481013e-06, + "loss": 0.0005, + "step": 7900 + }, + { + "epoch": 79.55, + "learning_rate": 8.120253164556962e-06, + "loss": 0.0003, + "step": 7925 + }, + { + "epoch": 79.8, + "learning_rate": 8.113924050632912e-06, + "loss": 0.0005, + "step": 7950 + }, + { + "epoch": 80.05, + "learning_rate": 8.107594936708861e-06, + "loss": 0.0006, + "step": 7975 + }, + { + "epoch": 80.3, + "learning_rate": 8.10126582278481e-06, + "loss": 0.0004, + "step": 8000 + }, + { + "epoch": 80.3, + "eval_loss": 0.23669902980327606, + "eval_runtime": 2781.0884, + "eval_samples_per_second": 4.582, + "eval_steps_per_second": 0.287, + "eval_wer": 7.482999843676723, + "step": 8000 + }, + { + "epoch": 80.55, + "learning_rate": 8.09493670886076e-06, + "loss": 0.0007, + "step": 8025 + }, + { + "epoch": 80.8, + "learning_rate": 8.08860759493671e-06, + "loss": 0.0012, + "step": 8050 + }, + { + "epoch": 81.05, + "learning_rate": 8.082278481012659e-06, + "loss": 0.0011, + "step": 8075 + }, + { + "epoch": 81.3, + "learning_rate": 8.075949367088608e-06, + "loss": 0.0011, + "step": 8100 + }, + { + "epoch": 81.56, + "learning_rate": 8.069620253164558e-06, + "loss": 0.0009, + "step": 8125 + }, + { + "epoch": 81.81, + "learning_rate": 8.063291139240507e-06, + "loss": 0.001, + "step": 8150 + }, + { + "epoch": 82.06, + "learning_rate": 8.056962025316456e-06, + "loss": 0.0008, + "step": 8175 + }, + { + "epoch": 82.31, + "learning_rate": 8.050632911392406e-06, + "loss": 0.0006, + "step": 8200 + }, + { + "epoch": 82.56, + "learning_rate": 8.044303797468355e-06, + "loss": 0.0004, + "step": 8225 + }, + { + "epoch": 82.81, + "learning_rate": 8.037974683544305e-06, + "loss": 0.0005, + "step": 8250 + }, + { + "epoch": 83.06, + "learning_rate": 8.031645569620252e-06, + "loss": 0.0005, + "step": 8275 + }, + { + "epoch": 83.31, + "learning_rate": 8.025316455696202e-06, + "loss": 0.0005, + "step": 8300 + }, + { + "epoch": 83.56, + "learning_rate": 8.018987341772153e-06, + "loss": 0.0006, + "step": 8325 + }, + { + "epoch": 83.81, + "learning_rate": 8.012658227848102e-06, + "loss": 0.0005, + "step": 8350 + }, + { + "epoch": 84.07, + "learning_rate": 8.006329113924052e-06, + "loss": 0.0005, + "step": 8375 + }, + { + "epoch": 84.32, + "learning_rate": 8.000000000000001e-06, + "loss": 0.0005, + "step": 8400 + }, + { + "epoch": 84.57, + "learning_rate": 7.99367088607595e-06, + "loss": 0.0005, + "step": 8425 + }, + { + "epoch": 84.82, + "learning_rate": 7.9873417721519e-06, + "loss": 0.0009, + "step": 8450 + }, + { + "epoch": 85.07, + "learning_rate": 7.98101265822785e-06, + "loss": 0.0008, + "step": 8475 + }, + { + "epoch": 85.32, + "learning_rate": 7.974683544303799e-06, + "loss": 0.0006, + "step": 8500 + }, + { + "epoch": 85.57, + "learning_rate": 7.968354430379748e-06, + "loss": 0.0008, + "step": 8525 + }, + { + "epoch": 85.82, + "learning_rate": 7.962025316455698e-06, + "loss": 0.0014, + "step": 8550 + }, + { + "epoch": 86.07, + "learning_rate": 7.955696202531646e-06, + "loss": 0.0011, + "step": 8575 + }, + { + "epoch": 86.32, + "learning_rate": 7.949367088607595e-06, + "loss": 0.001, + "step": 8600 + }, + { + "epoch": 86.57, + "learning_rate": 7.943037974683544e-06, + "loss": 0.0014, + "step": 8625 + }, + { + "epoch": 86.83, + "learning_rate": 7.936708860759494e-06, + "loss": 0.0017, + "step": 8650 + }, + { + "epoch": 87.08, + "learning_rate": 7.930632911392405e-06, + "loss": 0.0015, + "step": 8675 + }, + { + "epoch": 87.33, + "learning_rate": 7.924303797468355e-06, + "loss": 0.0019, + "step": 8700 + }, + { + "epoch": 87.58, + "learning_rate": 7.917974683544304e-06, + "loss": 0.0023, + "step": 8725 + }, + { + "epoch": 87.83, + "learning_rate": 7.911645569620254e-06, + "loss": 0.0023, + "step": 8750 + }, + { + "epoch": 88.08, + "learning_rate": 7.905316455696203e-06, + "loss": 0.0017, + "step": 8775 + }, + { + "epoch": 88.33, + "learning_rate": 7.898987341772153e-06, + "loss": 0.0017, + "step": 8800 + }, + { + "epoch": 88.58, + "learning_rate": 7.892658227848102e-06, + "loss": 0.0014, + "step": 8825 + }, + { + "epoch": 88.83, + "learning_rate": 7.886329113924051e-06, + "loss": 0.0018, + "step": 8850 + }, + { + "epoch": 89.08, + "learning_rate": 7.88e-06, + "loss": 0.0016, + "step": 8875 + }, + { + "epoch": 89.34, + "learning_rate": 7.87367088607595e-06, + "loss": 0.0015, + "step": 8900 + }, + { + "epoch": 89.59, + "learning_rate": 7.8673417721519e-06, + "loss": 0.001, + "step": 8925 + }, + { + "epoch": 89.84, + "learning_rate": 7.861012658227849e-06, + "loss": 0.0009, + "step": 8950 + }, + { + "epoch": 90.09, + "learning_rate": 7.854683544303798e-06, + "loss": 0.0009, + "step": 8975 + }, + { + "epoch": 90.34, + "learning_rate": 7.848354430379748e-06, + "loss": 0.0008, + "step": 9000 + }, + { + "epoch": 90.34, + "eval_loss": 0.22892530262470245, + "eval_runtime": 2781.5915, + "eval_samples_per_second": 4.581, + "eval_steps_per_second": 0.287, + "eval_wer": 7.441964983586057, + "step": 9000 + }, + { + "epoch": 90.59, + "learning_rate": 7.842025316455697e-06, + "loss": 0.0004, + "step": 9025 + }, + { + "epoch": 90.84, + "learning_rate": 7.835696202531647e-06, + "loss": 0.0005, + "step": 9050 + }, + { + "epoch": 91.09, + "learning_rate": 7.829367088607596e-06, + "loss": 0.001, + "step": 9075 + }, + { + "epoch": 91.34, + "learning_rate": 7.823037974683546e-06, + "loss": 0.0009, + "step": 9100 + }, + { + "epoch": 91.59, + "learning_rate": 7.816708860759495e-06, + "loss": 0.0006, + "step": 9125 + }, + { + "epoch": 91.84, + "learning_rate": 7.810379746835443e-06, + "loss": 0.0007, + "step": 9150 + }, + { + "epoch": 92.1, + "learning_rate": 7.804050632911392e-06, + "loss": 0.0006, + "step": 9175 + }, + { + "epoch": 92.35, + "learning_rate": 7.797721518987342e-06, + "loss": 0.0006, + "step": 9200 + }, + { + "epoch": 92.6, + "learning_rate": 7.791392405063291e-06, + "loss": 0.0007, + "step": 9225 + }, + { + "epoch": 92.85, + "learning_rate": 7.78506329113924e-06, + "loss": 0.0009, + "step": 9250 + }, + { + "epoch": 93.1, + "learning_rate": 7.77873417721519e-06, + "loss": 0.0005, + "step": 9275 + }, + { + "epoch": 93.35, + "learning_rate": 7.77240506329114e-06, + "loss": 0.0003, + "step": 9300 + }, + { + "epoch": 93.6, + "learning_rate": 7.766075949367089e-06, + "loss": 0.0003, + "step": 9325 + }, + { + "epoch": 93.85, + "learning_rate": 7.759746835443038e-06, + "loss": 0.0005, + "step": 9350 + }, + { + "epoch": 94.1, + "learning_rate": 7.753417721518988e-06, + "loss": 0.0005, + "step": 9375 + }, + { + "epoch": 94.35, + "learning_rate": 7.747088607594937e-06, + "loss": 0.0004, + "step": 9400 + }, + { + "epoch": 94.6, + "learning_rate": 7.740759493670887e-06, + "loss": 0.0005, + "step": 9425 + }, + { + "epoch": 94.86, + "learning_rate": 7.734430379746836e-06, + "loss": 0.0004, + "step": 9450 + }, + { + "epoch": 95.11, + "learning_rate": 7.728101265822785e-06, + "loss": 0.0004, + "step": 9475 + }, + { + "epoch": 95.36, + "learning_rate": 7.721772151898735e-06, + "loss": 0.0004, + "step": 9500 + }, + { + "epoch": 95.61, + "learning_rate": 7.715443037974684e-06, + "loss": 0.0003, + "step": 9525 + }, + { + "epoch": 95.86, + "learning_rate": 7.709113924050634e-06, + "loss": 0.0004, + "step": 9550 + }, + { + "epoch": 96.11, + "learning_rate": 7.702784810126583e-06, + "loss": 0.0002, + "step": 9575 + }, + { + "epoch": 96.36, + "learning_rate": 7.696455696202532e-06, + "loss": 0.0003, + "step": 9600 + }, + { + "epoch": 96.61, + "learning_rate": 7.690126582278482e-06, + "loss": 0.0007, + "step": 9625 + }, + { + "epoch": 96.86, + "learning_rate": 7.683797468354431e-06, + "loss": 0.0005, + "step": 9650 + }, + { + "epoch": 97.11, + "learning_rate": 7.67746835443038e-06, + "loss": 0.0005, + "step": 9675 + }, + { + "epoch": 97.37, + "learning_rate": 7.67113924050633e-06, + "loss": 0.0006, + "step": 9700 + }, + { + "epoch": 97.62, + "learning_rate": 7.66481012658228e-06, + "loss": 0.0009, + "step": 9725 + }, + { + "epoch": 97.87, + "learning_rate": 7.658481012658229e-06, + "loss": 0.0006, + "step": 9750 + }, + { + "epoch": 98.12, + "learning_rate": 7.652151898734178e-06, + "loss": 0.0009, + "step": 9775 + }, + { + "epoch": 98.37, + "learning_rate": 7.645822784810128e-06, + "loss": 0.0008, + "step": 9800 + }, + { + "epoch": 98.62, + "learning_rate": 7.639493670886077e-06, + "loss": 0.0012, + "step": 9825 + }, + { + "epoch": 98.87, + "learning_rate": 7.633164556962027e-06, + "loss": 0.0015, + "step": 9850 + }, + { + "epoch": 99.12, + "learning_rate": 7.626835443037975e-06, + "loss": 0.0012, + "step": 9875 + }, + { + "epoch": 99.37, + "learning_rate": 7.620506329113925e-06, + "loss": 0.0008, + "step": 9900 + }, + { + "epoch": 99.62, + "learning_rate": 7.614177215189874e-06, + "loss": 0.0007, + "step": 9925 + }, + { + "epoch": 99.87, + "learning_rate": 7.607848101265824e-06, + "loss": 0.0008, + "step": 9950 + }, + { + "epoch": 100.13, + "learning_rate": 7.601518987341773e-06, + "loss": 0.0008, + "step": 9975 + }, + { + "epoch": 100.38, + "learning_rate": 7.5951898734177225e-06, + "loss": 0.0007, + "step": 10000 + }, + { + "epoch": 100.38, + "eval_loss": 0.23848006129264832, + "eval_runtime": 2777.6649, + "eval_samples_per_second": 4.587, + "eval_steps_per_second": 0.287, + "eval_wer": 7.531850867594185, + "step": 10000 + }, + { + "epoch": 100.63, + "learning_rate": 7.588860759493671e-06, + "loss": 0.0008, + "step": 10025 + }, + { + "epoch": 100.88, + "learning_rate": 7.5825316455696205e-06, + "loss": 0.0007, + "step": 10050 + }, + { + "epoch": 101.13, + "learning_rate": 7.57620253164557e-06, + "loss": 0.0006, + "step": 10075 + }, + { + "epoch": 101.38, + "learning_rate": 7.569873417721519e-06, + "loss": 0.0005, + "step": 10100 + }, + { + "epoch": 101.63, + "learning_rate": 7.563544303797469e-06, + "loss": 0.0009, + "step": 10125 + }, + { + "epoch": 101.88, + "learning_rate": 7.557215189873418e-06, + "loss": 0.0006, + "step": 10150 + }, + { + "epoch": 102.13, + "learning_rate": 7.550886075949368e-06, + "loss": 0.0008, + "step": 10175 + }, + { + "epoch": 102.38, + "learning_rate": 7.544556962025317e-06, + "loss": 0.0007, + "step": 10200 + }, + { + "epoch": 102.63, + "learning_rate": 7.538227848101266e-06, + "loss": 0.0006, + "step": 10225 + }, + { + "epoch": 102.89, + "learning_rate": 7.531898734177215e-06, + "loss": 0.0007, + "step": 10250 + }, + { + "epoch": 103.14, + "learning_rate": 7.5255696202531645e-06, + "loss": 0.001, + "step": 10275 + }, + { + "epoch": 103.39, + "learning_rate": 7.519240506329114e-06, + "loss": 0.0007, + "step": 10300 + }, + { + "epoch": 103.64, + "learning_rate": 7.512911392405063e-06, + "loss": 0.0008, + "step": 10325 + }, + { + "epoch": 103.89, + "learning_rate": 7.506582278481013e-06, + "loss": 0.0012, + "step": 10350 + }, + { + "epoch": 104.14, + "learning_rate": 7.500253164556963e-06, + "loss": 0.0009, + "step": 10375 + }, + { + "epoch": 104.39, + "learning_rate": 7.4939240506329125e-06, + "loss": 0.0008, + "step": 10400 + }, + { + "epoch": 104.64, + "learning_rate": 7.487594936708862e-06, + "loss": 0.0005, + "step": 10425 + }, + { + "epoch": 104.89, + "learning_rate": 7.481265822784811e-06, + "loss": 0.0007, + "step": 10450 + }, + { + "epoch": 105.14, + "learning_rate": 7.474936708860761e-06, + "loss": 0.0007, + "step": 10475 + }, + { + "epoch": 105.4, + "learning_rate": 7.46860759493671e-06, + "loss": 0.0007, + "step": 10500 + }, + { + "epoch": 105.65, + "learning_rate": 7.462278481012659e-06, + "loss": 0.0006, + "step": 10525 + }, + { + "epoch": 105.9, + "learning_rate": 7.455949367088608e-06, + "loss": 0.0005, + "step": 10550 + }, + { + "epoch": 106.15, + "learning_rate": 7.449620253164558e-06, + "loss": 0.0002, + "step": 10575 + }, + { + "epoch": 106.4, + "learning_rate": 7.443291139240507e-06, + "loss": 0.0002, + "step": 10600 + }, + { + "epoch": 106.65, + "learning_rate": 7.4369620253164565e-06, + "loss": 0.0003, + "step": 10625 + }, + { + "epoch": 106.9, + "learning_rate": 7.430632911392406e-06, + "loss": 0.0003, + "step": 10650 + }, + { + "epoch": 107.15, + "learning_rate": 7.424303797468355e-06, + "loss": 0.0003, + "step": 10675 + }, + { + "epoch": 107.4, + "learning_rate": 7.417974683544305e-06, + "loss": 0.0003, + "step": 10700 + }, + { + "epoch": 107.65, + "learning_rate": 7.411645569620254e-06, + "loss": 0.0003, + "step": 10725 + }, + { + "epoch": 107.9, + "learning_rate": 7.405316455696203e-06, + "loss": 0.0007, + "step": 10750 + }, + { + "epoch": 108.16, + "learning_rate": 7.398987341772152e-06, + "loss": 0.0004, + "step": 10775 + }, + { + "epoch": 108.41, + "learning_rate": 7.392658227848102e-06, + "loss": 0.0002, + "step": 10800 + }, + { + "epoch": 108.66, + "learning_rate": 7.386329113924051e-06, + "loss": 0.0002, + "step": 10825 + }, + { + "epoch": 108.91, + "learning_rate": 7.3800000000000005e-06, + "loss": 0.0005, + "step": 10850 + }, + { + "epoch": 109.16, + "learning_rate": 7.37367088607595e-06, + "loss": 0.0007, + "step": 10875 + }, + { + "epoch": 109.41, + "learning_rate": 7.367341772151899e-06, + "loss": 0.0009, + "step": 10900 + }, + { + "epoch": 109.66, + "learning_rate": 7.361012658227849e-06, + "loss": 0.0011, + "step": 10925 + }, + { + "epoch": 109.91, + "learning_rate": 7.354683544303798e-06, + "loss": 0.0013, + "step": 10950 + }, + { + "epoch": 110.16, + "learning_rate": 7.348354430379747e-06, + "loss": 0.0009, + "step": 10975 + }, + { + "epoch": 110.41, + "learning_rate": 7.342025316455696e-06, + "loss": 0.001, + "step": 11000 + }, + { + "epoch": 110.41, + "eval_loss": 0.22928227484226227, + "eval_runtime": 2789.8685, + "eval_samples_per_second": 4.567, + "eval_steps_per_second": 0.286, + "eval_wer": 7.632483976864155, + "step": 11000 + }, + { + "epoch": 110.66, + "learning_rate": 7.335696202531646e-06, + "loss": 0.0007, + "step": 11025 + }, + { + "epoch": 110.92, + "learning_rate": 7.329367088607595e-06, + "loss": 0.001, + "step": 11050 + }, + { + "epoch": 111.17, + "learning_rate": 7.3230379746835445e-06, + "loss": 0.001, + "step": 11075 + }, + { + "epoch": 111.42, + "learning_rate": 7.316708860759494e-06, + "loss": 0.001, + "step": 11100 + }, + { + "epoch": 111.67, + "learning_rate": 7.310379746835443e-06, + "loss": 0.0009, + "step": 11125 + }, + { + "epoch": 111.92, + "learning_rate": 7.304050632911393e-06, + "loss": 0.0011, + "step": 11150 + }, + { + "epoch": 112.17, + "learning_rate": 7.297721518987342e-06, + "loss": 0.0007, + "step": 11175 + }, + { + "epoch": 112.42, + "learning_rate": 7.2913924050632925e-06, + "loss": 0.0007, + "step": 11200 + }, + { + "epoch": 112.67, + "learning_rate": 7.285063291139242e-06, + "loss": 0.0007, + "step": 11225 + }, + { + "epoch": 112.92, + "learning_rate": 7.278734177215191e-06, + "loss": 0.0008, + "step": 11250 + }, + { + "epoch": 113.17, + "learning_rate": 7.27240506329114e-06, + "loss": 0.0008, + "step": 11275 + }, + { + "epoch": 113.43, + "learning_rate": 7.266075949367089e-06, + "loss": 0.0006, + "step": 11300 + }, + { + "epoch": 113.68, + "learning_rate": 7.259746835443039e-06, + "loss": 0.0006, + "step": 11325 + }, + { + "epoch": 113.93, + "learning_rate": 7.253417721518988e-06, + "loss": 0.0007, + "step": 11350 + }, + { + "epoch": 114.18, + "learning_rate": 7.247088607594938e-06, + "loss": 0.0004, + "step": 11375 + }, + { + "epoch": 114.43, + "learning_rate": 7.240759493670887e-06, + "loss": 0.0004, + "step": 11400 + }, + { + "epoch": 114.68, + "learning_rate": 7.2344303797468365e-06, + "loss": 0.0004, + "step": 11425 + }, + { + "epoch": 114.93, + "learning_rate": 7.228101265822786e-06, + "loss": 0.0008, + "step": 11450 + }, + { + "epoch": 115.18, + "learning_rate": 7.221772151898735e-06, + "loss": 0.001, + "step": 11475 + }, + { + "epoch": 115.43, + "learning_rate": 7.215443037974684e-06, + "loss": 0.0008, + "step": 11500 + }, + { + "epoch": 115.68, + "learning_rate": 7.209113924050633e-06, + "loss": 0.0007, + "step": 11525 + }, + { + "epoch": 115.93, + "learning_rate": 7.202784810126583e-06, + "loss": 0.0007, + "step": 11550 + }, + { + "epoch": 116.19, + "learning_rate": 7.196455696202532e-06, + "loss": 0.0007, + "step": 11575 + }, + { + "epoch": 116.44, + "learning_rate": 7.190126582278482e-06, + "loss": 0.0009, + "step": 11600 + }, + { + "epoch": 116.69, + "learning_rate": 7.183797468354431e-06, + "loss": 0.001, + "step": 11625 + }, + { + "epoch": 116.94, + "learning_rate": 7.1774683544303805e-06, + "loss": 0.0006, + "step": 11650 + }, + { + "epoch": 117.19, + "learning_rate": 7.17113924050633e-06, + "loss": 0.0008, + "step": 11675 + }, + { + "epoch": 117.44, + "learning_rate": 7.164810126582279e-06, + "loss": 0.0008, + "step": 11700 + }, + { + "epoch": 117.69, + "learning_rate": 7.158481012658228e-06, + "loss": 0.0005, + "step": 11725 + }, + { + "epoch": 117.94, + "learning_rate": 7.152151898734177e-06, + "loss": 0.0004, + "step": 11750 + }, + { + "epoch": 118.19, + "learning_rate": 7.145822784810127e-06, + "loss": 0.0003, + "step": 11775 + }, + { + "epoch": 118.44, + "learning_rate": 7.139493670886076e-06, + "loss": 0.0002, + "step": 11800 + }, + { + "epoch": 118.7, + "learning_rate": 7.133164556962026e-06, + "loss": 0.0002, + "step": 11825 + }, + { + "epoch": 118.95, + "learning_rate": 7.126835443037975e-06, + "loss": 0.0003, + "step": 11850 + }, + { + "epoch": 119.2, + "learning_rate": 7.1205063291139245e-06, + "loss": 0.0008, + "step": 11875 + }, + { + "epoch": 119.45, + "learning_rate": 7.114177215189874e-06, + "loss": 0.0003, + "step": 11900 + }, + { + "epoch": 119.7, + "learning_rate": 7.107848101265823e-06, + "loss": 0.0001, + "step": 11925 + }, + { + "epoch": 119.95, + "learning_rate": 7.101518987341772e-06, + "loss": 0.0003, + "step": 11950 + }, + { + "epoch": 120.2, + "learning_rate": 7.095189873417721e-06, + "loss": 0.0003, + "step": 11975 + }, + { + "epoch": 120.45, + "learning_rate": 7.088860759493671e-06, + "loss": 0.0001, + "step": 12000 + }, + { + "epoch": 120.45, + "eval_loss": 0.2473139613866806, + "eval_runtime": 2824.4756, + "eval_samples_per_second": 4.511, + "eval_steps_per_second": 0.282, + "eval_wer": 7.142996717211194, + "step": 12000 + }, + { + "epoch": 120.7, + "learning_rate": 7.082531645569621e-06, + "loss": 0.0003, + "step": 12025 + }, + { + "epoch": 120.95, + "learning_rate": 7.0762025316455705e-06, + "loss": 0.0003, + "step": 12050 + }, + { + "epoch": 121.2, + "learning_rate": 7.06987341772152e-06, + "loss": 0.0002, + "step": 12075 + }, + { + "epoch": 121.46, + "learning_rate": 7.063544303797469e-06, + "loss": 0.0002, + "step": 12100 + }, + { + "epoch": 121.71, + "learning_rate": 7.057215189873419e-06, + "loss": 0.0001, + "step": 12125 + }, + { + "epoch": 121.96, + "learning_rate": 7.050886075949368e-06, + "loss": 0.0001, + "step": 12150 + }, + { + "epoch": 122.21, + "learning_rate": 7.044556962025318e-06, + "loss": 0.0003, + "step": 12175 + }, + { + "epoch": 122.46, + "learning_rate": 7.038227848101267e-06, + "loss": 0.0003, + "step": 12200 + }, + { + "epoch": 122.71, + "learning_rate": 7.031898734177216e-06, + "loss": 0.0004, + "step": 12225 + }, + { + "epoch": 122.96, + "learning_rate": 7.025569620253165e-06, + "loss": 0.0009, + "step": 12250 + }, + { + "epoch": 123.21, + "learning_rate": 7.0192405063291145e-06, + "loss": 0.0007, + "step": 12275 + }, + { + "epoch": 123.46, + "learning_rate": 7.012911392405064e-06, + "loss": 0.0007, + "step": 12300 + }, + { + "epoch": 123.71, + "learning_rate": 7.006582278481013e-06, + "loss": 0.0005, + "step": 12325 + }, + { + "epoch": 123.96, + "learning_rate": 7.000253164556963e-06, + "loss": 0.0007, + "step": 12350 + }, + { + "epoch": 124.22, + "learning_rate": 6.993924050632912e-06, + "loss": 0.0008, + "step": 12375 + }, + { + "epoch": 124.47, + "learning_rate": 6.987594936708862e-06, + "loss": 0.0007, + "step": 12400 + }, + { + "epoch": 124.72, + "learning_rate": 6.981265822784811e-06, + "loss": 0.0007, + "step": 12425 + }, + { + "epoch": 124.97, + "learning_rate": 6.97493670886076e-06, + "loss": 0.0007, + "step": 12450 + }, + { + "epoch": 125.22, + "learning_rate": 6.968607594936709e-06, + "loss": 0.0006, + "step": 12475 + }, + { + "epoch": 125.47, + "learning_rate": 6.9622784810126585e-06, + "loss": 0.0004, + "step": 12500 + }, + { + "epoch": 125.72, + "learning_rate": 6.955949367088608e-06, + "loss": 0.0005, + "step": 12525 + }, + { + "epoch": 125.97, + "learning_rate": 6.949620253164557e-06, + "loss": 0.0011, + "step": 12550 + }, + { + "epoch": 126.22, + "learning_rate": 6.943291139240507e-06, + "loss": 0.001, + "step": 12575 + }, + { + "epoch": 126.47, + "learning_rate": 6.936962025316456e-06, + "loss": 0.0009, + "step": 12600 + }, + { + "epoch": 126.73, + "learning_rate": 6.930632911392406e-06, + "loss": 0.0008, + "step": 12625 + }, + { + "epoch": 126.98, + "learning_rate": 6.924303797468355e-06, + "loss": 0.0011, + "step": 12650 + }, + { + "epoch": 127.23, + "learning_rate": 6.917974683544304e-06, + "loss": 0.0006, + "step": 12675 + }, + { + "epoch": 127.48, + "learning_rate": 6.911645569620253e-06, + "loss": 0.0005, + "step": 12700 + }, + { + "epoch": 127.73, + "learning_rate": 6.9053164556962025e-06, + "loss": 0.0008, + "step": 12725 + }, + { + "epoch": 127.98, + "learning_rate": 6.898987341772152e-06, + "loss": 0.0006, + "step": 12750 + }, + { + "epoch": 128.23, + "learning_rate": 6.892658227848101e-06, + "loss": 0.0004, + "step": 12775 + }, + { + "epoch": 128.48, + "learning_rate": 6.886329113924051e-06, + "loss": 0.0005, + "step": 12800 + }, + { + "epoch": 128.73, + "learning_rate": 6.88e-06, + "loss": 0.0004, + "step": 12825 + }, + { + "epoch": 128.98, + "learning_rate": 6.8736708860759505e-06, + "loss": 0.0003, + "step": 12850 + }, + { + "epoch": 129.23, + "learning_rate": 6.8673417721519e-06, + "loss": 0.0001, + "step": 12875 + }, + { + "epoch": 129.49, + "learning_rate": 6.861012658227849e-06, + "loss": 0.0002, + "step": 12900 + }, + { + "epoch": 129.74, + "learning_rate": 6.854683544303799e-06, + "loss": 0.0003, + "step": 12925 + }, + { + "epoch": 129.99, + "learning_rate": 6.848354430379748e-06, + "loss": 0.0002, + "step": 12950 + }, + { + "epoch": 130.24, + "learning_rate": 6.842025316455697e-06, + "loss": 0.0002, + "step": 12975 + }, + { + "epoch": 130.49, + "learning_rate": 6.835696202531646e-06, + "loss": 0.0001, + "step": 13000 + }, + { + "epoch": 130.49, + "eval_loss": 0.24884945154190063, + "eval_runtime": 2827.5774, + "eval_samples_per_second": 4.506, + "eval_steps_per_second": 0.282, + "eval_wer": 7.186962638736907, + "step": 13000 + }, + { + "epoch": 130.74, + "learning_rate": 6.829367088607596e-06, + "loss": 0.0001, + "step": 13025 + }, + { + "epoch": 130.99, + "learning_rate": 6.823037974683545e-06, + "loss": 0.0001, + "step": 13050 + }, + { + "epoch": 131.24, + "learning_rate": 6.8167088607594945e-06, + "loss": 0.0001, + "step": 13075 + }, + { + "epoch": 131.49, + "learning_rate": 6.810379746835444e-06, + "loss": 0.0002, + "step": 13100 + }, + { + "epoch": 131.74, + "learning_rate": 6.804050632911393e-06, + "loss": 0.0003, + "step": 13125 + }, + { + "epoch": 131.99, + "learning_rate": 6.797974683544304e-06, + "loss": 0.0007, + "step": 13150 + }, + { + "epoch": 132.25, + "learning_rate": 6.791645569620253e-06, + "loss": 0.0003, + "step": 13175 + }, + { + "epoch": 132.5, + "learning_rate": 6.785316455696203e-06, + "loss": 0.0002, + "step": 13200 + }, + { + "epoch": 132.75, + "learning_rate": 6.778987341772153e-06, + "loss": 0.0005, + "step": 13225 + }, + { + "epoch": 133.0, + "learning_rate": 6.7726582278481025e-06, + "loss": 0.0005, + "step": 13250 + }, + { + "epoch": 133.25, + "learning_rate": 6.766329113924052e-06, + "loss": 0.0006, + "step": 13275 + }, + { + "epoch": 133.5, + "learning_rate": 6.760000000000001e-06, + "loss": 0.0012, + "step": 13300 + }, + { + "epoch": 133.75, + "learning_rate": 6.75367088607595e-06, + "loss": 0.0011, + "step": 13325 + }, + { + "epoch": 134.0, + "learning_rate": 6.747594936708861e-06, + "loss": 0.0009, + "step": 13350 + }, + { + "epoch": 134.25, + "learning_rate": 6.741265822784811e-06, + "loss": 0.0008, + "step": 13375 + }, + { + "epoch": 134.5, + "learning_rate": 6.734936708860759e-06, + "loss": 0.0007, + "step": 13400 + }, + { + "epoch": 134.76, + "learning_rate": 6.728607594936709e-06, + "loss": 0.0008, + "step": 13425 + }, + { + "epoch": 135.01, + "learning_rate": 6.722278481012658e-06, + "loss": 0.0011, + "step": 13450 + }, + { + "epoch": 135.26, + "learning_rate": 6.715949367088608e-06, + "loss": 0.0015, + "step": 13475 + }, + { + "epoch": 135.51, + "learning_rate": 6.709620253164557e-06, + "loss": 0.0014, + "step": 13500 + }, + { + "epoch": 135.76, + "learning_rate": 6.7032911392405065e-06, + "loss": 0.0012, + "step": 13525 + }, + { + "epoch": 136.01, + "learning_rate": 6.696962025316456e-06, + "loss": 0.0012, + "step": 13550 + }, + { + "epoch": 136.26, + "learning_rate": 6.690632911392405e-06, + "loss": 0.001, + "step": 13575 + }, + { + "epoch": 136.51, + "learning_rate": 6.684303797468355e-06, + "loss": 0.0008, + "step": 13600 + }, + { + "epoch": 136.76, + "learning_rate": 6.677974683544305e-06, + "loss": 0.0007, + "step": 13625 + }, + { + "epoch": 137.01, + "learning_rate": 6.6716455696202545e-06, + "loss": 0.0007, + "step": 13650 + }, + { + "epoch": 137.26, + "learning_rate": 6.665316455696204e-06, + "loss": 0.0004, + "step": 13675 + }, + { + "epoch": 137.52, + "learning_rate": 6.6589873417721525e-06, + "loss": 0.0005, + "step": 13700 + }, + { + "epoch": 137.77, + "learning_rate": 6.652658227848102e-06, + "loss": 0.0004, + "step": 13725 + }, + { + "epoch": 138.02, + "learning_rate": 6.646329113924051e-06, + "loss": 0.0004, + "step": 13750 + }, + { + "epoch": 138.27, + "learning_rate": 6.640000000000001e-06, + "loss": 0.0002, + "step": 13775 + }, + { + "epoch": 138.52, + "learning_rate": 6.63367088607595e-06, + "loss": 0.0002, + "step": 13800 + }, + { + "epoch": 138.77, + "learning_rate": 6.6273417721519e-06, + "loss": 0.0002, + "step": 13825 + }, + { + "epoch": 139.02, + "learning_rate": 6.621012658227849e-06, + "loss": 0.0003, + "step": 13850 + }, + { + "epoch": 139.27, + "learning_rate": 6.6146835443037985e-06, + "loss": 0.0005, + "step": 13875 + }, + { + "epoch": 139.52, + "learning_rate": 6.608354430379748e-06, + "loss": 0.0002, + "step": 13900 + }, + { + "epoch": 139.77, + "learning_rate": 6.6020253164556965e-06, + "loss": 0.0003, + "step": 13925 + }, + { + "epoch": 140.03, + "learning_rate": 6.595696202531646e-06, + "loss": 0.0002, + "step": 13950 + }, + { + "epoch": 140.28, + "learning_rate": 6.589367088607595e-06, + "loss": 0.0001, + "step": 13975 + }, + { + "epoch": 140.53, + "learning_rate": 6.583037974683545e-06, + "loss": 0.0004, + "step": 14000 + }, + { + "epoch": 140.53, + "eval_loss": 0.23976704478263855, + "eval_runtime": 2824.3974, + "eval_samples_per_second": 4.511, + "eval_steps_per_second": 0.282, + "eval_wer": 7.183054556823511, + "step": 14000 + }, + { + "epoch": 140.78, + "learning_rate": 6.576708860759494e-06, + "loss": 0.0003, + "step": 14025 + }, + { + "epoch": 141.03, + "learning_rate": 6.570379746835444e-06, + "loss": 0.0004, + "step": 14050 + }, + { + "epoch": 141.28, + "learning_rate": 6.564050632911393e-06, + "loss": 0.0002, + "step": 14075 + }, + { + "epoch": 141.53, + "learning_rate": 6.5577215189873425e-06, + "loss": 0.0001, + "step": 14100 + }, + { + "epoch": 141.78, + "learning_rate": 6.551392405063292e-06, + "loss": 0.0002, + "step": 14125 + }, + { + "epoch": 142.03, + "learning_rate": 6.5450632911392405e-06, + "loss": 0.0003, + "step": 14150 + }, + { + "epoch": 142.28, + "learning_rate": 6.53873417721519e-06, + "loss": 0.0005, + "step": 14175 + }, + { + "epoch": 142.53, + "learning_rate": 6.532405063291139e-06, + "loss": 0.0003, + "step": 14200 + }, + { + "epoch": 142.79, + "learning_rate": 6.526075949367089e-06, + "loss": 0.0004, + "step": 14225 + }, + { + "epoch": 143.04, + "learning_rate": 6.519746835443038e-06, + "loss": 0.0003, + "step": 14250 + }, + { + "epoch": 143.29, + "learning_rate": 6.513417721518988e-06, + "loss": 0.0002, + "step": 14275 + }, + { + "epoch": 143.54, + "learning_rate": 6.507088607594937e-06, + "loss": 0.0003, + "step": 14300 + }, + { + "epoch": 143.79, + "learning_rate": 6.5007594936708865e-06, + "loss": 0.0003, + "step": 14325 + }, + { + "epoch": 144.04, + "learning_rate": 6.494430379746836e-06, + "loss": 0.0003, + "step": 14350 + }, + { + "epoch": 144.29, + "learning_rate": 6.4881012658227845e-06, + "loss": 0.0004, + "step": 14375 + }, + { + "epoch": 144.54, + "learning_rate": 6.481772151898734e-06, + "loss": 0.0003, + "step": 14400 + }, + { + "epoch": 144.79, + "learning_rate": 6.475443037974683e-06, + "loss": 0.0004, + "step": 14425 + }, + { + "epoch": 145.04, + "learning_rate": 6.469113924050634e-06, + "loss": 0.0004, + "step": 14450 + }, + { + "epoch": 145.29, + "learning_rate": 6.462784810126583e-06, + "loss": 0.0002, + "step": 14475 + }, + { + "epoch": 145.55, + "learning_rate": 6.4564556962025325e-06, + "loss": 0.0002, + "step": 14500 + }, + { + "epoch": 145.8, + "learning_rate": 6.450126582278482e-06, + "loss": 0.0002, + "step": 14525 + }, + { + "epoch": 146.05, + "learning_rate": 6.443797468354431e-06, + "loss": 0.0003, + "step": 14550 + }, + { + "epoch": 146.3, + "learning_rate": 6.437468354430381e-06, + "loss": 0.0003, + "step": 14575 + }, + { + "epoch": 146.55, + "learning_rate": 6.43113924050633e-06, + "loss": 0.0002, + "step": 14600 + }, + { + "epoch": 146.8, + "learning_rate": 6.42481012658228e-06, + "loss": 0.0002, + "step": 14625 + }, + { + "epoch": 147.05, + "learning_rate": 6.418481012658228e-06, + "loss": 0.0001, + "step": 14650 + }, + { + "epoch": 147.3, + "learning_rate": 6.412151898734178e-06, + "loss": 0.0001, + "step": 14675 + }, + { + "epoch": 147.55, + "learning_rate": 6.405822784810127e-06, + "loss": 0.0001, + "step": 14700 + }, + { + "epoch": 147.8, + "learning_rate": 6.3994936708860765e-06, + "loss": 0.0003, + "step": 14725 + }, + { + "epoch": 148.06, + "learning_rate": 6.393164556962026e-06, + "loss": 0.0002, + "step": 14750 + }, + { + "epoch": 148.31, + "learning_rate": 6.386835443037975e-06, + "loss": 0.0001, + "step": 14775 + }, + { + "epoch": 148.56, + "learning_rate": 6.380506329113925e-06, + "loss": 0.0001, + "step": 14800 + }, + { + "epoch": 148.81, + "learning_rate": 6.374177215189874e-06, + "loss": 0.0, + "step": 14825 + }, + { + "epoch": 149.06, + "learning_rate": 6.367848101265824e-06, + "loss": 0.0001, + "step": 14850 + }, + { + "epoch": 149.31, + "learning_rate": 6.361518987341772e-06, + "loss": 0.0, + "step": 14875 + }, + { + "epoch": 149.56, + "learning_rate": 6.355189873417722e-06, + "loss": 0.0, + "step": 14900 + }, + { + "epoch": 149.81, + "learning_rate": 6.348860759493671e-06, + "loss": 0.0001, + "step": 14925 + }, + { + "epoch": 150.06, + "learning_rate": 6.3425316455696205e-06, + "loss": 0.0001, + "step": 14950 + }, + { + "epoch": 150.31, + "learning_rate": 6.33620253164557e-06, + "loss": 0.0001, + "step": 14975 + }, + { + "epoch": 150.56, + "learning_rate": 6.329873417721519e-06, + "loss": 0.0, + "step": 15000 + }, + { + "epoch": 150.56, + "eval_loss": 0.2619960606098175, + "eval_runtime": 2808.3991, + "eval_samples_per_second": 4.537, + "eval_steps_per_second": 0.284, + "eval_wer": 7.058972956073159, + "step": 15000 + }, + { + "epoch": 150.82, + "learning_rate": 6.323544303797469e-06, + "loss": 0.0002, + "step": 15025 + }, + { + "epoch": 151.07, + "learning_rate": 6.317215189873418e-06, + "loss": 0.0, + "step": 15050 + }, + { + "epoch": 151.32, + "learning_rate": 6.310886075949368e-06, + "loss": 0.0, + "step": 15075 + }, + { + "epoch": 151.57, + "learning_rate": 6.304556962025316e-06, + "loss": 0.0001, + "step": 15100 + }, + { + "epoch": 151.82, + "learning_rate": 6.298227848101266e-06, + "loss": 0.0, + "step": 15125 + }, + { + "epoch": 152.07, + "learning_rate": 6.291898734177215e-06, + "loss": 0.0, + "step": 15150 + }, + { + "epoch": 152.32, + "learning_rate": 6.2855696202531645e-06, + "loss": 0.0, + "step": 15175 + }, + { + "epoch": 152.57, + "learning_rate": 6.279240506329114e-06, + "loss": 0.0003, + "step": 15200 + }, + { + "epoch": 152.82, + "learning_rate": 6.272911392405063e-06, + "loss": 0.0002, + "step": 15225 + }, + { + "epoch": 153.07, + "learning_rate": 6.266582278481013e-06, + "loss": 0.001, + "step": 15250 + }, + { + "epoch": 153.32, + "learning_rate": 6.260253164556963e-06, + "loss": 0.0012, + "step": 15275 + }, + { + "epoch": 153.58, + "learning_rate": 6.2539240506329125e-06, + "loss": 0.0017, + "step": 15300 + }, + { + "epoch": 153.83, + "learning_rate": 6.247594936708862e-06, + "loss": 0.0018, + "step": 15325 + }, + { + "epoch": 154.08, + "learning_rate": 6.241265822784811e-06, + "loss": 0.0011, + "step": 15350 + }, + { + "epoch": 154.33, + "learning_rate": 6.234936708860761e-06, + "loss": 0.0011, + "step": 15375 + }, + { + "epoch": 154.58, + "learning_rate": 6.228607594936709e-06, + "loss": 0.0019, + "step": 15400 + }, + { + "epoch": 154.83, + "learning_rate": 6.222278481012659e-06, + "loss": 0.0018, + "step": 15425 + }, + { + "epoch": 155.08, + "learning_rate": 6.215949367088608e-06, + "loss": 0.0016, + "step": 15450 + }, + { + "epoch": 155.33, + "learning_rate": 6.209620253164558e-06, + "loss": 0.001, + "step": 15475 + }, + { + "epoch": 155.58, + "learning_rate": 6.203291139240507e-06, + "loss": 0.0011, + "step": 15500 + }, + { + "epoch": 155.83, + "learning_rate": 6.1969620253164565e-06, + "loss": 0.001, + "step": 15525 + }, + { + "epoch": 156.09, + "learning_rate": 6.190632911392406e-06, + "loss": 0.001, + "step": 15550 + }, + { + "epoch": 156.34, + "learning_rate": 6.184303797468355e-06, + "loss": 0.0007, + "step": 15575 + }, + { + "epoch": 156.59, + "learning_rate": 6.177974683544305e-06, + "loss": 0.0008, + "step": 15600 + }, + { + "epoch": 156.84, + "learning_rate": 6.171898734177215e-06, + "loss": 0.0008, + "step": 15625 + }, + { + "epoch": 157.09, + "learning_rate": 6.165569620253165e-06, + "loss": 0.0006, + "step": 15650 + }, + { + "epoch": 157.34, + "learning_rate": 6.159240506329115e-06, + "loss": 0.0002, + "step": 15675 + }, + { + "epoch": 157.59, + "learning_rate": 6.1529113924050645e-06, + "loss": 0.0002, + "step": 15700 + }, + { + "epoch": 157.84, + "learning_rate": 6.146582278481014e-06, + "loss": 0.0003, + "step": 15725 + }, + { + "epoch": 158.09, + "learning_rate": 6.140253164556963e-06, + "loss": 0.0004, + "step": 15750 + }, + { + "epoch": 158.34, + "learning_rate": 6.133924050632912e-06, + "loss": 0.0002, + "step": 15775 + }, + { + "epoch": 158.59, + "learning_rate": 6.127594936708861e-06, + "loss": 0.0002, + "step": 15800 + }, + { + "epoch": 158.85, + "learning_rate": 6.121265822784811e-06, + "loss": 0.0003, + "step": 15825 + }, + { + "epoch": 159.1, + "learning_rate": 6.11493670886076e-06, + "loss": 0.0003, + "step": 15850 + }, + { + "epoch": 159.35, + "learning_rate": 6.10860759493671e-06, + "loss": 0.0002, + "step": 15875 + }, + { + "epoch": 159.6, + "learning_rate": 6.102278481012659e-06, + "loss": 0.0002, + "step": 15900 + }, + { + "epoch": 159.85, + "learning_rate": 6.0959493670886085e-06, + "loss": 0.0001, + "step": 15925 + }, + { + "epoch": 160.1, + "learning_rate": 6.089620253164558e-06, + "loss": 0.0001, + "step": 15950 + }, + { + "epoch": 160.35, + "learning_rate": 6.083291139240507e-06, + "loss": 0.0001, + "step": 15975 + }, + { + "epoch": 160.6, + "learning_rate": 6.076962025316456e-06, + "loss": 0.0001, + "step": 16000 + }, + { + "epoch": 160.6, + "eval_loss": 0.2546827495098114, + "eval_runtime": 2784.4693, + "eval_samples_per_second": 4.576, + "eval_steps_per_second": 0.286, + "eval_wer": 7.196732843520401, + "step": 16000 + }, + { + "epoch": 160.85, + "learning_rate": 6.070632911392405e-06, + "loss": 0.0005, + "step": 16025 + }, + { + "epoch": 161.1, + "learning_rate": 6.064303797468355e-06, + "loss": 0.0005, + "step": 16050 + }, + { + "epoch": 161.36, + "learning_rate": 6.057974683544304e-06, + "loss": 0.0004, + "step": 16075 + }, + { + "epoch": 161.61, + "learning_rate": 6.051645569620254e-06, + "loss": 0.0001, + "step": 16100 + }, + { + "epoch": 161.86, + "learning_rate": 6.045316455696203e-06, + "loss": 0.0001, + "step": 16125 + }, + { + "epoch": 162.11, + "learning_rate": 6.0389873417721525e-06, + "loss": 0.0001, + "step": 16150 + }, + { + "epoch": 162.36, + "learning_rate": 6.032658227848102e-06, + "loss": 0.0001, + "step": 16175 + }, + { + "epoch": 162.61, + "learning_rate": 6.0263291139240505e-06, + "loss": 0.0001, + "step": 16200 + }, + { + "epoch": 162.86, + "learning_rate": 6.02e-06, + "loss": 0.0001, + "step": 16225 + }, + { + "epoch": 163.11, + "learning_rate": 6.013670886075949e-06, + "loss": 0.0001, + "step": 16250 + }, + { + "epoch": 163.36, + "learning_rate": 6.007341772151899e-06, + "loss": 0.0, + "step": 16275 + }, + { + "epoch": 163.61, + "learning_rate": 6.001012658227848e-06, + "loss": 0.0, + "step": 16300 + }, + { + "epoch": 163.86, + "learning_rate": 5.994683544303798e-06, + "loss": 0.0001, + "step": 16325 + }, + { + "epoch": 164.12, + "learning_rate": 5.988354430379747e-06, + "loss": 0.0, + "step": 16350 + }, + { + "epoch": 164.37, + "learning_rate": 5.9820253164556965e-06, + "loss": 0.0, + "step": 16375 + }, + { + "epoch": 164.62, + "learning_rate": 5.975696202531646e-06, + "loss": 0.0002, + "step": 16400 + }, + { + "epoch": 164.87, + "learning_rate": 5.9693670886075945e-06, + "loss": 0.0, + "step": 16425 + }, + { + "epoch": 165.12, + "learning_rate": 5.963037974683544e-06, + "loss": 0.0, + "step": 16450 + }, + { + "epoch": 165.37, + "learning_rate": 5.956708860759493e-06, + "loss": 0.0, + "step": 16475 + }, + { + "epoch": 165.62, + "learning_rate": 5.950379746835444e-06, + "loss": 0.0, + "step": 16500 + }, + { + "epoch": 165.87, + "learning_rate": 5.944050632911393e-06, + "loss": 0.0, + "step": 16525 + }, + { + "epoch": 166.12, + "learning_rate": 5.9377215189873425e-06, + "loss": 0.0, + "step": 16550 + }, + { + "epoch": 166.37, + "learning_rate": 5.931392405063292e-06, + "loss": 0.0, + "step": 16575 + }, + { + "epoch": 166.62, + "learning_rate": 5.925063291139241e-06, + "loss": 0.0, + "step": 16600 + }, + { + "epoch": 166.88, + "learning_rate": 5.918734177215191e-06, + "loss": 0.0, + "step": 16625 + }, + { + "epoch": 167.13, + "learning_rate": 5.91240506329114e-06, + "loss": 0.0, + "step": 16650 + }, + { + "epoch": 167.38, + "learning_rate": 5.90607594936709e-06, + "loss": 0.0, + "step": 16675 + }, + { + "epoch": 167.63, + "learning_rate": 5.899746835443039e-06, + "loss": 0.0, + "step": 16700 + }, + { + "epoch": 167.88, + "learning_rate": 5.893417721518988e-06, + "loss": 0.0, + "step": 16725 + }, + { + "epoch": 168.13, + "learning_rate": 5.887088607594937e-06, + "loss": 0.0, + "step": 16750 + }, + { + "epoch": 168.38, + "learning_rate": 5.8807594936708865e-06, + "loss": 0.0, + "step": 16775 + }, + { + "epoch": 168.63, + "learning_rate": 5.874430379746836e-06, + "loss": 0.0, + "step": 16800 + }, + { + "epoch": 168.88, + "learning_rate": 5.868101265822785e-06, + "loss": 0.0, + "step": 16825 + }, + { + "epoch": 169.13, + "learning_rate": 5.861772151898735e-06, + "loss": 0.0, + "step": 16850 + }, + { + "epoch": 169.39, + "learning_rate": 5.855443037974684e-06, + "loss": 0.0, + "step": 16875 + }, + { + "epoch": 169.64, + "learning_rate": 5.849113924050634e-06, + "loss": 0.0, + "step": 16900 + }, + { + "epoch": 169.89, + "learning_rate": 5.842784810126583e-06, + "loss": 0.0, + "step": 16925 + }, + { + "epoch": 170.14, + "learning_rate": 5.836455696202532e-06, + "loss": 0.0, + "step": 16950 + }, + { + "epoch": 170.39, + "learning_rate": 5.830126582278481e-06, + "loss": 0.0, + "step": 16975 + }, + { + "epoch": 170.64, + "learning_rate": 5.8237974683544305e-06, + "loss": 0.0, + "step": 17000 + }, + { + "epoch": 170.64, + "eval_loss": 0.27676019072532654, + "eval_runtime": 2784.6513, + "eval_samples_per_second": 4.576, + "eval_steps_per_second": 0.286, + "eval_wer": 7.0736282632483976, + "step": 17000 + }, + { + "epoch": 170.89, + "learning_rate": 5.81746835443038e-06, + "loss": 0.0, + "step": 17025 + }, + { + "epoch": 171.14, + "learning_rate": 5.811139240506329e-06, + "loss": 0.0, + "step": 17050 + }, + { + "epoch": 171.39, + "learning_rate": 5.804810126582279e-06, + "loss": 0.0, + "step": 17075 + }, + { + "epoch": 171.64, + "learning_rate": 5.798481012658228e-06, + "loss": 0.0, + "step": 17100 + }, + { + "epoch": 171.89, + "learning_rate": 5.792151898734178e-06, + "loss": 0.0, + "step": 17125 + }, + { + "epoch": 172.15, + "learning_rate": 5.785822784810127e-06, + "loss": 0.0, + "step": 17150 + }, + { + "epoch": 172.4, + "learning_rate": 5.779493670886076e-06, + "loss": 0.0, + "step": 17175 + }, + { + "epoch": 172.65, + "learning_rate": 5.773164556962025e-06, + "loss": 0.0, + "step": 17200 + }, + { + "epoch": 172.9, + "learning_rate": 5.7668354430379745e-06, + "loss": 0.0, + "step": 17225 + }, + { + "epoch": 173.15, + "learning_rate": 5.760506329113924e-06, + "loss": 0.0, + "step": 17250 + }, + { + "epoch": 173.4, + "learning_rate": 5.754177215189873e-06, + "loss": 0.0, + "step": 17275 + }, + { + "epoch": 173.65, + "learning_rate": 5.747848101265823e-06, + "loss": 0.0, + "step": 17300 + }, + { + "epoch": 173.9, + "learning_rate": 5.741518987341773e-06, + "loss": 0.0, + "step": 17325 + }, + { + "epoch": 174.15, + "learning_rate": 5.7351898734177225e-06, + "loss": 0.0, + "step": 17350 + }, + { + "epoch": 174.4, + "learning_rate": 5.728860759493672e-06, + "loss": 0.0, + "step": 17375 + }, + { + "epoch": 174.65, + "learning_rate": 5.722531645569621e-06, + "loss": 0.0, + "step": 17400 + }, + { + "epoch": 174.91, + "learning_rate": 5.716202531645571e-06, + "loss": 0.0, + "step": 17425 + }, + { + "epoch": 175.16, + "learning_rate": 5.70987341772152e-06, + "loss": 0.0, + "step": 17450 + }, + { + "epoch": 175.41, + "learning_rate": 5.703544303797469e-06, + "loss": 0.0, + "step": 17475 + }, + { + "epoch": 175.66, + "learning_rate": 5.697215189873418e-06, + "loss": 0.0, + "step": 17500 + }, + { + "epoch": 175.91, + "learning_rate": 5.690886075949368e-06, + "loss": 0.0, + "step": 17525 + }, + { + "epoch": 176.16, + "learning_rate": 5.684556962025317e-06, + "loss": 0.0, + "step": 17550 + }, + { + "epoch": 176.41, + "learning_rate": 5.6782278481012665e-06, + "loss": 0.0, + "step": 17575 + }, + { + "epoch": 176.66, + "learning_rate": 5.671898734177216e-06, + "loss": 0.0, + "step": 17600 + }, + { + "epoch": 176.91, + "learning_rate": 5.665569620253165e-06, + "loss": 0.0, + "step": 17625 + }, + { + "epoch": 177.16, + "learning_rate": 5.659240506329115e-06, + "loss": 0.0, + "step": 17650 + }, + { + "epoch": 177.42, + "learning_rate": 5.652911392405064e-06, + "loss": 0.0, + "step": 17675 + }, + { + "epoch": 177.67, + "learning_rate": 5.646582278481013e-06, + "loss": 0.0, + "step": 17700 + }, + { + "epoch": 177.92, + "learning_rate": 5.640253164556962e-06, + "loss": 0.0, + "step": 17725 + }, + { + "epoch": 178.17, + "learning_rate": 5.633924050632912e-06, + "loss": 0.0, + "step": 17750 + }, + { + "epoch": 178.42, + "learning_rate": 5.627594936708861e-06, + "loss": 0.0, + "step": 17775 + }, + { + "epoch": 178.67, + "learning_rate": 5.6212658227848105e-06, + "loss": 0.0, + "step": 17800 + }, + { + "epoch": 178.92, + "learning_rate": 5.61493670886076e-06, + "loss": 0.0, + "step": 17825 + }, + { + "epoch": 179.17, + "learning_rate": 5.608607594936709e-06, + "loss": 0.0, + "step": 17850 + }, + { + "epoch": 179.42, + "learning_rate": 5.602278481012659e-06, + "loss": 0.0, + "step": 17875 + }, + { + "epoch": 179.67, + "learning_rate": 5.595949367088608e-06, + "loss": 0.0, + "step": 17900 + }, + { + "epoch": 179.92, + "learning_rate": 5.589620253164557e-06, + "loss": 0.0, + "step": 17925 + }, + { + "epoch": 180.18, + "learning_rate": 5.583291139240506e-06, + "loss": 0.0, + "step": 17950 + }, + { + "epoch": 180.43, + "learning_rate": 5.576962025316456e-06, + "loss": 0.0, + "step": 17975 + }, + { + "epoch": 180.68, + "learning_rate": 5.570632911392405e-06, + "loss": 0.0, + "step": 18000 + }, + { + "epoch": 180.68, + "eval_loss": 0.28781425952911377, + "eval_runtime": 2780.8898, + "eval_samples_per_second": 4.582, + "eval_steps_per_second": 0.287, + "eval_wer": 7.000351727372206, + "step": 18000 + }, + { + "epoch": 180.93, + "learning_rate": 5.5643037974683545e-06, + "loss": 0.0, + "step": 18025 + }, + { + "epoch": 181.18, + "learning_rate": 5.557974683544304e-06, + "loss": 0.0, + "step": 18050 + }, + { + "epoch": 181.43, + "learning_rate": 5.551645569620253e-06, + "loss": 0.0, + "step": 18075 + }, + { + "epoch": 181.68, + "learning_rate": 5.545316455696203e-06, + "loss": 0.0, + "step": 18100 + }, + { + "epoch": 181.93, + "learning_rate": 5.538987341772151e-06, + "loss": 0.0, + "step": 18125 + }, + { + "epoch": 182.18, + "learning_rate": 5.5326582278481025e-06, + "loss": 0.0, + "step": 18150 + }, + { + "epoch": 182.43, + "learning_rate": 5.526329113924052e-06, + "loss": 0.0, + "step": 18175 + }, + { + "epoch": 182.69, + "learning_rate": 5.5200000000000005e-06, + "loss": 0.0, + "step": 18200 + }, + { + "epoch": 182.94, + "learning_rate": 5.51367088607595e-06, + "loss": 0.0, + "step": 18225 + }, + { + "epoch": 183.19, + "learning_rate": 5.507341772151899e-06, + "loss": 0.0, + "step": 18250 + }, + { + "epoch": 183.44, + "learning_rate": 5.501012658227849e-06, + "loss": 0.0, + "step": 18275 + }, + { + "epoch": 183.69, + "learning_rate": 5.494683544303798e-06, + "loss": 0.0, + "step": 18300 + }, + { + "epoch": 183.94, + "learning_rate": 5.488354430379748e-06, + "loss": 0.0, + "step": 18325 + }, + { + "epoch": 184.19, + "learning_rate": 5.482025316455697e-06, + "loss": 0.0, + "step": 18350 + }, + { + "epoch": 184.44, + "learning_rate": 5.4756962025316465e-06, + "loss": 0.0, + "step": 18375 + }, + { + "epoch": 184.69, + "learning_rate": 5.469367088607596e-06, + "loss": 0.0, + "step": 18400 + }, + { + "epoch": 184.94, + "learning_rate": 5.4630379746835445e-06, + "loss": 0.0, + "step": 18425 + }, + { + "epoch": 185.19, + "learning_rate": 5.456708860759494e-06, + "loss": 0.0, + "step": 18450 + }, + { + "epoch": 185.45, + "learning_rate": 5.450379746835443e-06, + "loss": 0.0, + "step": 18475 + }, + { + "epoch": 185.7, + "learning_rate": 5.444050632911393e-06, + "loss": 0.0, + "step": 18500 + }, + { + "epoch": 185.95, + "learning_rate": 5.437721518987342e-06, + "loss": 0.0, + "step": 18525 + }, + { + "epoch": 186.2, + "learning_rate": 5.431392405063292e-06, + "loss": 0.0, + "step": 18550 + }, + { + "epoch": 186.45, + "learning_rate": 5.425063291139241e-06, + "loss": 0.0, + "step": 18575 + }, + { + "epoch": 186.7, + "learning_rate": 5.4187341772151905e-06, + "loss": 0.0, + "step": 18600 + }, + { + "epoch": 186.95, + "learning_rate": 5.41240506329114e-06, + "loss": 0.0, + "step": 18625 + }, + { + "epoch": 187.2, + "learning_rate": 5.4060759493670885e-06, + "loss": 0.0, + "step": 18650 + }, + { + "epoch": 187.45, + "learning_rate": 5.399746835443038e-06, + "loss": 0.0, + "step": 18675 + }, + { + "epoch": 187.7, + "learning_rate": 5.393417721518987e-06, + "loss": 0.0, + "step": 18700 + }, + { + "epoch": 187.95, + "learning_rate": 5.387088607594937e-06, + "loss": 0.0, + "step": 18725 + }, + { + "epoch": 188.21, + "learning_rate": 5.380759493670886e-06, + "loss": 0.0, + "step": 18750 + }, + { + "epoch": 188.46, + "learning_rate": 5.374430379746836e-06, + "loss": 0.0, + "step": 18775 + }, + { + "epoch": 188.71, + "learning_rate": 5.368101265822785e-06, + "loss": 0.0, + "step": 18800 + }, + { + "epoch": 188.96, + "learning_rate": 5.3617721518987345e-06, + "loss": 0.0, + "step": 18825 + }, + { + "epoch": 189.21, + "learning_rate": 5.355443037974684e-06, + "loss": 0.0, + "step": 18850 + }, + { + "epoch": 189.46, + "learning_rate": 5.3491139240506325e-06, + "loss": 0.0, + "step": 18875 + }, + { + "epoch": 189.71, + "learning_rate": 5.342784810126582e-06, + "loss": 0.0, + "step": 18900 + }, + { + "epoch": 189.96, + "learning_rate": 5.336455696202531e-06, + "loss": 0.0, + "step": 18925 + }, + { + "epoch": 190.21, + "learning_rate": 5.330126582278481e-06, + "loss": 0.0, + "step": 18950 + }, + { + "epoch": 190.46, + "learning_rate": 5.323797468354431e-06, + "loss": 0.0, + "step": 18975 + }, + { + "epoch": 190.72, + "learning_rate": 5.3174683544303805e-06, + "loss": 0.0, + "step": 19000 + }, + { + "epoch": 190.72, + "eval_loss": 0.2962440252304077, + "eval_runtime": 2778.8571, + "eval_samples_per_second": 4.585, + "eval_steps_per_second": 0.287, + "eval_wer": 6.946615601062998, + "step": 19000 + }, + { + "epoch": 190.97, + "learning_rate": 5.31113924050633e-06, + "loss": 0.0, + "step": 19025 + }, + { + "epoch": 191.22, + "learning_rate": 5.304810126582279e-06, + "loss": 0.0, + "step": 19050 + }, + { + "epoch": 191.47, + "learning_rate": 5.298481012658229e-06, + "loss": 0.0, + "step": 19075 + }, + { + "epoch": 191.72, + "learning_rate": 5.292151898734178e-06, + "loss": 0.0, + "step": 19100 + }, + { + "epoch": 191.97, + "learning_rate": 5.285822784810128e-06, + "loss": 0.0, + "step": 19125 + }, + { + "epoch": 192.22, + "learning_rate": 5.279493670886077e-06, + "loss": 0.0, + "step": 19150 + }, + { + "epoch": 192.47, + "learning_rate": 5.273164556962026e-06, + "loss": 0.0, + "step": 19175 + }, + { + "epoch": 192.72, + "learning_rate": 5.266835443037975e-06, + "loss": 0.0, + "step": 19200 + }, + { + "epoch": 192.97, + "learning_rate": 5.2605063291139245e-06, + "loss": 0.0, + "step": 19225 + }, + { + "epoch": 193.22, + "learning_rate": 5.254177215189874e-06, + "loss": 0.0, + "step": 19250 + }, + { + "epoch": 193.48, + "learning_rate": 5.247848101265823e-06, + "loss": 0.0, + "step": 19275 + }, + { + "epoch": 193.73, + "learning_rate": 5.241518987341773e-06, + "loss": 0.0, + "step": 19300 + }, + { + "epoch": 193.98, + "learning_rate": 5.235189873417722e-06, + "loss": 0.0, + "step": 19325 + }, + { + "epoch": 194.23, + "learning_rate": 5.228860759493672e-06, + "loss": 0.0, + "step": 19350 + }, + { + "epoch": 194.48, + "learning_rate": 5.222531645569621e-06, + "loss": 0.0, + "step": 19375 + }, + { + "epoch": 194.73, + "learning_rate": 5.21620253164557e-06, + "loss": 0.0, + "step": 19400 + }, + { + "epoch": 194.98, + "learning_rate": 5.209873417721519e-06, + "loss": 0.0, + "step": 19425 + }, + { + "epoch": 195.23, + "learning_rate": 5.2035443037974685e-06, + "loss": 0.0, + "step": 19450 + }, + { + "epoch": 195.48, + "learning_rate": 5.197215189873418e-06, + "loss": 0.0, + "step": 19475 + }, + { + "epoch": 195.73, + "learning_rate": 5.190886075949367e-06, + "loss": 0.0, + "step": 19500 + }, + { + "epoch": 195.98, + "learning_rate": 5.184556962025317e-06, + "loss": 0.0, + "step": 19525 + }, + { + "epoch": 196.24, + "learning_rate": 5.178227848101266e-06, + "loss": 0.0, + "step": 19550 + }, + { + "epoch": 196.49, + "learning_rate": 5.171898734177216e-06, + "loss": 0.0, + "step": 19575 + }, + { + "epoch": 196.74, + "learning_rate": 5.165569620253165e-06, + "loss": 0.0, + "step": 19600 + }, + { + "epoch": 196.99, + "learning_rate": 5.159240506329114e-06, + "loss": 0.0, + "step": 19625 + }, + { + "epoch": 197.24, + "learning_rate": 5.152911392405063e-06, + "loss": 0.0, + "step": 19650 + }, + { + "epoch": 197.49, + "learning_rate": 5.1465822784810125e-06, + "loss": 0.0, + "step": 19675 + }, + { + "epoch": 197.74, + "learning_rate": 5.140253164556962e-06, + "loss": 0.0, + "step": 19700 + }, + { + "epoch": 197.99, + "learning_rate": 5.133924050632911e-06, + "loss": 0.0, + "step": 19725 + }, + { + "epoch": 198.24, + "learning_rate": 5.127594936708861e-06, + "loss": 0.0, + "step": 19750 + }, + { + "epoch": 198.49, + "learning_rate": 5.12126582278481e-06, + "loss": 0.0, + "step": 19775 + }, + { + "epoch": 198.75, + "learning_rate": 5.1149367088607605e-06, + "loss": 0.0, + "step": 19800 + }, + { + "epoch": 199.0, + "learning_rate": 5.10860759493671e-06, + "loss": 0.0, + "step": 19825 + }, + { + "epoch": 199.25, + "learning_rate": 5.102278481012659e-06, + "loss": 0.001, + "step": 19850 + }, + { + "epoch": 199.5, + "learning_rate": 5.095949367088609e-06, + "loss": 0.0056, + "step": 19875 + }, + { + "epoch": 199.75, + "learning_rate": 5.089620253164557e-06, + "loss": 0.0061, + "step": 19900 + }, + { + "epoch": 200.0, + "learning_rate": 5.083291139240507e-06, + "loss": 0.0042, + "step": 19925 + }, + { + "epoch": 200.25, + "learning_rate": 5.076962025316456e-06, + "loss": 0.0026, + "step": 19950 + }, + { + "epoch": 200.5, + "learning_rate": 5.070886075949367e-06, + "loss": 0.002, + "step": 19975 + }, + { + "epoch": 200.75, + "learning_rate": 5.064556962025316e-06, + "loss": 0.0013, + "step": 20000 + }, + { + "epoch": 200.75, + "eval_loss": 0.2354433238506317, + "eval_runtime": 2781.1722, + "eval_samples_per_second": 4.582, + "eval_steps_per_second": 0.287, + "eval_wer": 7.604150382992028, + "step": 20000 + }, + { + "epoch": 201.0, + "learning_rate": 5.058227848101266e-06, + "loss": 0.0016, + "step": 20025 + }, + { + "epoch": 201.25, + "learning_rate": 5.051898734177215e-06, + "loss": 0.0008, + "step": 20050 + }, + { + "epoch": 201.51, + "learning_rate": 5.0455696202531645e-06, + "loss": 0.0005, + "step": 20075 + }, + { + "epoch": 201.76, + "learning_rate": 5.039240506329114e-06, + "loss": 0.0007, + "step": 20100 + }, + { + "epoch": 202.01, + "learning_rate": 5.032911392405063e-06, + "loss": 0.0004, + "step": 20125 + }, + { + "epoch": 202.26, + "learning_rate": 5.026582278481013e-06, + "loss": 0.0002, + "step": 20150 + }, + { + "epoch": 202.51, + "learning_rate": 5.020253164556963e-06, + "loss": 0.0001, + "step": 20175 + }, + { + "epoch": 202.76, + "learning_rate": 5.0139240506329125e-06, + "loss": 0.0002, + "step": 20200 + }, + { + "epoch": 203.01, + "learning_rate": 5.007594936708862e-06, + "loss": 0.0002, + "step": 20225 + }, + { + "epoch": 203.26, + "learning_rate": 5.001265822784811e-06, + "loss": 0.0001, + "step": 20250 + }, + { + "epoch": 203.51, + "learning_rate": 4.99493670886076e-06, + "loss": 0.0001, + "step": 20275 + }, + { + "epoch": 203.76, + "learning_rate": 4.988607594936709e-06, + "loss": 0.0001, + "step": 20300 + }, + { + "epoch": 204.02, + "learning_rate": 4.982278481012659e-06, + "loss": 0.0002, + "step": 20325 + }, + { + "epoch": 204.27, + "learning_rate": 4.975949367088607e-06, + "loss": 0.0001, + "step": 20350 + }, + { + "epoch": 204.52, + "learning_rate": 4.969620253164557e-06, + "loss": 0.0001, + "step": 20375 + }, + { + "epoch": 204.77, + "learning_rate": 4.963291139240507e-06, + "loss": 0.0001, + "step": 20400 + }, + { + "epoch": 205.02, + "learning_rate": 4.9569620253164565e-06, + "loss": 0.0001, + "step": 20425 + }, + { + "epoch": 205.27, + "learning_rate": 4.950632911392406e-06, + "loss": 0.0001, + "step": 20450 + }, + { + "epoch": 205.52, + "learning_rate": 4.944303797468355e-06, + "loss": 0.0001, + "step": 20475 + }, + { + "epoch": 205.77, + "learning_rate": 4.937974683544304e-06, + "loss": 0.0, + "step": 20500 + }, + { + "epoch": 206.02, + "learning_rate": 4.931645569620253e-06, + "loss": 0.0001, + "step": 20525 + }, + { + "epoch": 206.27, + "learning_rate": 4.925316455696203e-06, + "loss": 0.0, + "step": 20550 + }, + { + "epoch": 206.52, + "learning_rate": 4.918987341772152e-06, + "loss": 0.0, + "step": 20575 + }, + { + "epoch": 206.78, + "learning_rate": 4.912658227848102e-06, + "loss": 0.0, + "step": 20600 + }, + { + "epoch": 207.03, + "learning_rate": 4.906329113924051e-06, + "loss": 0.0, + "step": 20625 + }, + { + "epoch": 207.28, + "learning_rate": 4.9000000000000005e-06, + "loss": 0.0, + "step": 20650 + }, + { + "epoch": 207.53, + "learning_rate": 4.89367088607595e-06, + "loss": 0.0, + "step": 20675 + }, + { + "epoch": 207.78, + "learning_rate": 4.887341772151899e-06, + "loss": 0.0, + "step": 20700 + }, + { + "epoch": 208.03, + "learning_rate": 4.881012658227848e-06, + "loss": 0.0, + "step": 20725 + }, + { + "epoch": 208.28, + "learning_rate": 4.874683544303797e-06, + "loss": 0.0, + "step": 20750 + }, + { + "epoch": 208.53, + "learning_rate": 4.868354430379747e-06, + "loss": 0.0, + "step": 20775 + }, + { + "epoch": 208.78, + "learning_rate": 4.862025316455697e-06, + "loss": 0.0, + "step": 20800 + }, + { + "epoch": 209.03, + "learning_rate": 4.8556962025316465e-06, + "loss": 0.0, + "step": 20825 + }, + { + "epoch": 209.28, + "learning_rate": 4.849367088607596e-06, + "loss": 0.0, + "step": 20850 + }, + { + "epoch": 209.54, + "learning_rate": 4.8430379746835445e-06, + "loss": 0.0, + "step": 20875 + }, + { + "epoch": 209.79, + "learning_rate": 4.836708860759494e-06, + "loss": 0.0, + "step": 20900 + }, + { + "epoch": 210.04, + "learning_rate": 4.830379746835443e-06, + "loss": 0.0, + "step": 20925 + }, + { + "epoch": 210.29, + "learning_rate": 4.824050632911393e-06, + "loss": 0.0, + "step": 20950 + }, + { + "epoch": 210.54, + "learning_rate": 4.817721518987342e-06, + "loss": 0.0, + "step": 20975 + }, + { + "epoch": 210.79, + "learning_rate": 4.811392405063292e-06, + "loss": 0.0, + "step": 21000 + }, + { + "epoch": 210.79, + "eval_loss": 0.2719791829586029, + "eval_runtime": 2780.4356, + "eval_samples_per_second": 4.583, + "eval_steps_per_second": 0.287, + "eval_wer": 6.89483351571049, + "step": 21000 + }, + { + "epoch": 211.04, + "learning_rate": 4.805063291139241e-06, + "loss": 0.0, + "step": 21025 + }, + { + "epoch": 211.29, + "learning_rate": 4.7987341772151905e-06, + "loss": 0.0, + "step": 21050 + }, + { + "epoch": 211.54, + "learning_rate": 4.79240506329114e-06, + "loss": 0.0, + "step": 21075 + }, + { + "epoch": 211.79, + "learning_rate": 4.7860759493670885e-06, + "loss": 0.0, + "step": 21100 + }, + { + "epoch": 212.05, + "learning_rate": 4.779746835443038e-06, + "loss": 0.0, + "step": 21125 + }, + { + "epoch": 212.3, + "learning_rate": 4.773417721518987e-06, + "loss": 0.0, + "step": 21150 + }, + { + "epoch": 212.55, + "learning_rate": 4.767088607594937e-06, + "loss": 0.0, + "step": 21175 + }, + { + "epoch": 212.8, + "learning_rate": 4.760759493670886e-06, + "loss": 0.0, + "step": 21200 + }, + { + "epoch": 213.05, + "learning_rate": 4.754430379746836e-06, + "loss": 0.0, + "step": 21225 + }, + { + "epoch": 213.3, + "learning_rate": 4.748101265822785e-06, + "loss": 0.0, + "step": 21250 + }, + { + "epoch": 213.55, + "learning_rate": 4.7417721518987345e-06, + "loss": 0.0, + "step": 21275 + }, + { + "epoch": 213.8, + "learning_rate": 4.735443037974684e-06, + "loss": 0.0, + "step": 21300 + }, + { + "epoch": 214.05, + "learning_rate": 4.729113924050633e-06, + "loss": 0.0, + "step": 21325 + }, + { + "epoch": 214.3, + "learning_rate": 4.722784810126583e-06, + "loss": 0.0, + "step": 21350 + }, + { + "epoch": 214.55, + "learning_rate": 4.716455696202532e-06, + "loss": 0.0, + "step": 21375 + }, + { + "epoch": 214.81, + "learning_rate": 4.710126582278482e-06, + "loss": 0.0, + "step": 21400 + }, + { + "epoch": 215.06, + "learning_rate": 4.703797468354431e-06, + "loss": 0.0, + "step": 21425 + }, + { + "epoch": 215.31, + "learning_rate": 4.69746835443038e-06, + "loss": 0.0, + "step": 21450 + }, + { + "epoch": 215.56, + "learning_rate": 4.691139240506329e-06, + "loss": 0.0, + "step": 21475 + }, + { + "epoch": 215.81, + "learning_rate": 4.6848101265822785e-06, + "loss": 0.0, + "step": 21500 + }, + { + "epoch": 216.06, + "learning_rate": 4.678481012658228e-06, + "loss": 0.0, + "step": 21525 + }, + { + "epoch": 216.31, + "learning_rate": 4.672151898734177e-06, + "loss": 0.0, + "step": 21550 + }, + { + "epoch": 216.56, + "learning_rate": 4.665822784810127e-06, + "loss": 0.0, + "step": 21575 + }, + { + "epoch": 216.81, + "learning_rate": 4.659493670886076e-06, + "loss": 0.0, + "step": 21600 + }, + { + "epoch": 217.06, + "learning_rate": 4.653164556962026e-06, + "loss": 0.0, + "step": 21625 + }, + { + "epoch": 217.31, + "learning_rate": 4.646835443037975e-06, + "loss": 0.0, + "step": 21650 + }, + { + "epoch": 217.57, + "learning_rate": 4.6405063291139245e-06, + "loss": 0.0, + "step": 21675 + }, + { + "epoch": 217.82, + "learning_rate": 4.634177215189874e-06, + "loss": 0.0, + "step": 21700 + }, + { + "epoch": 218.07, + "learning_rate": 4.627848101265823e-06, + "loss": 0.0, + "step": 21725 + }, + { + "epoch": 218.32, + "learning_rate": 4.621518987341773e-06, + "loss": 0.0, + "step": 21750 + }, + { + "epoch": 218.57, + "learning_rate": 4.615189873417722e-06, + "loss": 0.0, + "step": 21775 + }, + { + "epoch": 218.82, + "learning_rate": 4.608860759493672e-06, + "loss": 0.0, + "step": 21800 + }, + { + "epoch": 219.07, + "learning_rate": 4.60253164556962e-06, + "loss": 0.0, + "step": 21825 + }, + { + "epoch": 219.32, + "learning_rate": 4.59620253164557e-06, + "loss": 0.0, + "step": 21850 + }, + { + "epoch": 219.57, + "learning_rate": 4.589873417721519e-06, + "loss": 0.0, + "step": 21875 + }, + { + "epoch": 219.82, + "learning_rate": 4.5835443037974685e-06, + "loss": 0.0, + "step": 21900 + }, + { + "epoch": 220.08, + "learning_rate": 4.577215189873418e-06, + "loss": 0.0, + "step": 21925 + }, + { + "epoch": 220.33, + "learning_rate": 4.570886075949367e-06, + "loss": 0.0, + "step": 21950 + }, + { + "epoch": 220.58, + "learning_rate": 4.564556962025317e-06, + "loss": 0.0, + "step": 21975 + }, + { + "epoch": 220.83, + "learning_rate": 4.558227848101266e-06, + "loss": 0.0, + "step": 22000 + }, + { + "epoch": 220.83, + "eval_loss": 0.2865145206451416, + "eval_runtime": 2791.2624, + "eval_samples_per_second": 4.565, + "eval_steps_per_second": 0.286, + "eval_wer": 6.898741597623887, + "step": 22000 + }, + { + "epoch": 221.08, + "learning_rate": 4.551898734177216e-06, + "loss": 0.0, + "step": 22025 + }, + { + "epoch": 221.33, + "learning_rate": 4.545569620253165e-06, + "loss": 0.0, + "step": 22050 + }, + { + "epoch": 221.58, + "learning_rate": 4.5392405063291145e-06, + "loss": 0.0, + "step": 22075 + }, + { + "epoch": 221.83, + "learning_rate": 4.532911392405064e-06, + "loss": 0.0, + "step": 22100 + }, + { + "epoch": 222.08, + "learning_rate": 4.526582278481013e-06, + "loss": 0.0, + "step": 22125 + }, + { + "epoch": 222.33, + "learning_rate": 4.520253164556963e-06, + "loss": 0.0, + "step": 22150 + }, + { + "epoch": 222.58, + "learning_rate": 4.513924050632912e-06, + "loss": 0.0, + "step": 22175 + }, + { + "epoch": 222.84, + "learning_rate": 4.507594936708861e-06, + "loss": 0.0, + "step": 22200 + }, + { + "epoch": 223.09, + "learning_rate": 4.50126582278481e-06, + "loss": 0.0, + "step": 22225 + }, + { + "epoch": 223.34, + "learning_rate": 4.49493670886076e-06, + "loss": 0.0, + "step": 22250 + }, + { + "epoch": 223.59, + "learning_rate": 4.488607594936709e-06, + "loss": 0.0, + "step": 22275 + }, + { + "epoch": 223.84, + "learning_rate": 4.4822784810126585e-06, + "loss": 0.0, + "step": 22300 + }, + { + "epoch": 224.09, + "learning_rate": 4.475949367088608e-06, + "loss": 0.0, + "step": 22325 + }, + { + "epoch": 224.34, + "learning_rate": 4.469620253164557e-06, + "loss": 0.0, + "step": 22350 + }, + { + "epoch": 224.59, + "learning_rate": 4.463291139240507e-06, + "loss": 0.0, + "step": 22375 + }, + { + "epoch": 224.84, + "learning_rate": 4.456962025316456e-06, + "loss": 0.0, + "step": 22400 + }, + { + "epoch": 225.09, + "learning_rate": 4.450632911392405e-06, + "loss": 0.0, + "step": 22425 + }, + { + "epoch": 225.35, + "learning_rate": 4.444303797468355e-06, + "loss": 0.0, + "step": 22450 + }, + { + "epoch": 225.6, + "learning_rate": 4.4379746835443045e-06, + "loss": 0.0, + "step": 22475 + }, + { + "epoch": 225.85, + "learning_rate": 4.431645569620254e-06, + "loss": 0.0, + "step": 22500 + }, + { + "epoch": 226.1, + "learning_rate": 4.425316455696203e-06, + "loss": 0.0, + "step": 22525 + }, + { + "epoch": 226.35, + "learning_rate": 4.418987341772153e-06, + "loss": 0.0, + "step": 22550 + }, + { + "epoch": 226.6, + "learning_rate": 4.412658227848101e-06, + "loss": 0.0, + "step": 22575 + }, + { + "epoch": 226.85, + "learning_rate": 4.406329113924051e-06, + "loss": 0.0, + "step": 22600 + }, + { + "epoch": 227.1, + "learning_rate": 4.4e-06, + "loss": 0.0, + "step": 22625 + }, + { + "epoch": 227.35, + "learning_rate": 4.39367088607595e-06, + "loss": 0.0, + "step": 22650 + }, + { + "epoch": 227.6, + "learning_rate": 4.387341772151899e-06, + "loss": 0.0, + "step": 22675 + }, + { + "epoch": 227.85, + "learning_rate": 4.3810126582278485e-06, + "loss": 0.0, + "step": 22700 + }, + { + "epoch": 228.11, + "learning_rate": 4.374683544303798e-06, + "loss": 0.0, + "step": 22725 + }, + { + "epoch": 228.36, + "learning_rate": 4.368354430379747e-06, + "loss": 0.0, + "step": 22750 + }, + { + "epoch": 228.61, + "learning_rate": 4.362025316455697e-06, + "loss": 0.0, + "step": 22775 + }, + { + "epoch": 228.86, + "learning_rate": 4.355696202531645e-06, + "loss": 0.0, + "step": 22800 + }, + { + "epoch": 229.11, + "learning_rate": 4.349367088607595e-06, + "loss": 0.0, + "step": 22825 + }, + { + "epoch": 229.36, + "learning_rate": 4.343037974683545e-06, + "loss": 0.0, + "step": 22850 + }, + { + "epoch": 229.61, + "learning_rate": 4.3367088607594945e-06, + "loss": 0.0, + "step": 22875 + }, + { + "epoch": 229.86, + "learning_rate": 4.330379746835444e-06, + "loss": 0.0, + "step": 22900 + }, + { + "epoch": 230.11, + "learning_rate": 4.3240506329113925e-06, + "loss": 0.0, + "step": 22925 + }, + { + "epoch": 230.36, + "learning_rate": 4.317721518987342e-06, + "loss": 0.0, + "step": 22950 + }, + { + "epoch": 230.61, + "learning_rate": 4.311392405063291e-06, + "loss": 0.0, + "step": 22975 + }, + { + "epoch": 230.87, + "learning_rate": 4.305063291139241e-06, + "loss": 0.0, + "step": 23000 + }, + { + "epoch": 230.87, + "eval_loss": 0.2953989505767822, + "eval_runtime": 2779.9715, + "eval_samples_per_second": 4.584, + "eval_steps_per_second": 0.287, + "eval_wer": 6.888971392840395, + "step": 23000 + }, + { + "epoch": 231.12, + "learning_rate": 4.29873417721519e-06, + "loss": 0.0, + "step": 23025 + }, + { + "epoch": 231.37, + "learning_rate": 4.29240506329114e-06, + "loss": 0.0, + "step": 23050 + }, + { + "epoch": 231.62, + "learning_rate": 4.286075949367089e-06, + "loss": 0.0, + "step": 23075 + }, + { + "epoch": 231.87, + "learning_rate": 4.2797468354430385e-06, + "loss": 0.0, + "step": 23100 + }, + { + "epoch": 232.12, + "learning_rate": 4.273417721518988e-06, + "loss": 0.0, + "step": 23125 + }, + { + "epoch": 232.37, + "learning_rate": 4.2670886075949365e-06, + "loss": 0.0, + "step": 23150 + }, + { + "epoch": 232.62, + "learning_rate": 4.260759493670886e-06, + "loss": 0.0, + "step": 23175 + }, + { + "epoch": 232.87, + "learning_rate": 4.254430379746835e-06, + "loss": 0.0, + "step": 23200 + }, + { + "epoch": 233.12, + "learning_rate": 4.248101265822785e-06, + "loss": 0.0, + "step": 23225 + }, + { + "epoch": 233.38, + "learning_rate": 4.241772151898734e-06, + "loss": 0.0, + "step": 23250 + }, + { + "epoch": 233.63, + "learning_rate": 4.2354430379746845e-06, + "loss": 0.0, + "step": 23275 + }, + { + "epoch": 233.88, + "learning_rate": 4.229113924050633e-06, + "loss": 0.0, + "step": 23300 + }, + { + "epoch": 234.13, + "learning_rate": 4.2227848101265825e-06, + "loss": 0.0, + "step": 23325 + }, + { + "epoch": 234.38, + "learning_rate": 4.216455696202532e-06, + "loss": 0.0, + "step": 23350 + }, + { + "epoch": 234.63, + "learning_rate": 4.210126582278481e-06, + "loss": 0.0, + "step": 23375 + }, + { + "epoch": 234.88, + "learning_rate": 4.203797468354431e-06, + "loss": 0.0, + "step": 23400 + }, + { + "epoch": 235.13, + "learning_rate": 4.19746835443038e-06, + "loss": 0.0, + "step": 23425 + }, + { + "epoch": 235.38, + "learning_rate": 4.19113924050633e-06, + "loss": 0.0, + "step": 23450 + }, + { + "epoch": 235.63, + "learning_rate": 4.184810126582279e-06, + "loss": 0.0, + "step": 23475 + }, + { + "epoch": 235.88, + "learning_rate": 4.1784810126582285e-06, + "loss": 0.0, + "step": 23500 + }, + { + "epoch": 236.14, + "learning_rate": 4.172151898734177e-06, + "loss": 0.0, + "step": 23525 + }, + { + "epoch": 236.39, + "learning_rate": 4.1658227848101265e-06, + "loss": 0.0, + "step": 23550 + }, + { + "epoch": 236.64, + "learning_rate": 4.159493670886076e-06, + "loss": 0.0, + "step": 23575 + }, + { + "epoch": 236.89, + "learning_rate": 4.153164556962025e-06, + "loss": 0.0, + "step": 23600 + }, + { + "epoch": 237.14, + "learning_rate": 4.146835443037975e-06, + "loss": 0.0, + "step": 23625 + }, + { + "epoch": 237.39, + "learning_rate": 4.140506329113924e-06, + "loss": 0.0, + "step": 23650 + }, + { + "epoch": 237.64, + "learning_rate": 4.134177215189874e-06, + "loss": 0.0, + "step": 23675 + }, + { + "epoch": 237.89, + "learning_rate": 4.127848101265823e-06, + "loss": 0.0, + "step": 23700 + }, + { + "epoch": 238.14, + "learning_rate": 4.1215189873417725e-06, + "loss": 0.0, + "step": 23725 + }, + { + "epoch": 238.39, + "learning_rate": 4.115189873417722e-06, + "loss": 0.0, + "step": 23750 + }, + { + "epoch": 238.64, + "learning_rate": 4.108860759493671e-06, + "loss": 0.0, + "step": 23775 + }, + { + "epoch": 238.9, + "learning_rate": 4.102531645569621e-06, + "loss": 0.0, + "step": 23800 + }, + { + "epoch": 239.15, + "learning_rate": 4.09620253164557e-06, + "loss": 0.0, + "step": 23825 + }, + { + "epoch": 239.4, + "learning_rate": 4.08987341772152e-06, + "loss": 0.0, + "step": 23850 + }, + { + "epoch": 239.65, + "learning_rate": 4.083544303797469e-06, + "loss": 0.0, + "step": 23875 + }, + { + "epoch": 239.9, + "learning_rate": 4.077215189873418e-06, + "loss": 0.0, + "step": 23900 + }, + { + "epoch": 240.15, + "learning_rate": 4.070886075949367e-06, + "loss": 0.0, + "step": 23925 + }, + { + "epoch": 240.4, + "learning_rate": 4.0645569620253165e-06, + "loss": 0.0, + "step": 23950 + }, + { + "epoch": 240.65, + "learning_rate": 4.058227848101266e-06, + "loss": 0.0, + "step": 23975 + }, + { + "epoch": 240.9, + "learning_rate": 4.051898734177215e-06, + "loss": 0.0, + "step": 24000 + }, + { + "epoch": 240.9, + "eval_loss": 0.3031490743160248, + "eval_runtime": 2780.7351, + "eval_samples_per_second": 4.582, + "eval_steps_per_second": 0.287, + "eval_wer": 6.88213224949195, + "step": 24000 + }, + { + "epoch": 241.15, + "learning_rate": 4.045569620253165e-06, + "loss": 0.0, + "step": 24025 + }, + { + "epoch": 241.41, + "learning_rate": 4.039240506329114e-06, + "loss": 0.0, + "step": 24050 + }, + { + "epoch": 241.66, + "learning_rate": 4.032911392405064e-06, + "loss": 0.0, + "step": 24075 + }, + { + "epoch": 241.91, + "learning_rate": 4.026582278481013e-06, + "loss": 0.0, + "step": 24100 + }, + { + "epoch": 242.16, + "learning_rate": 4.0202531645569625e-06, + "loss": 0.0, + "step": 24125 + }, + { + "epoch": 242.41, + "learning_rate": 4.013924050632912e-06, + "loss": 0.0, + "step": 24150 + }, + { + "epoch": 242.66, + "learning_rate": 4.007594936708861e-06, + "loss": 0.0, + "step": 24175 + }, + { + "epoch": 242.91, + "learning_rate": 4.001265822784811e-06, + "loss": 0.0, + "step": 24200 + }, + { + "epoch": 243.16, + "learning_rate": 3.99493670886076e-06, + "loss": 0.0, + "step": 24225 + }, + { + "epoch": 243.41, + "learning_rate": 3.98860759493671e-06, + "loss": 0.0, + "step": 24250 + }, + { + "epoch": 243.66, + "learning_rate": 3.982278481012658e-06, + "loss": 0.0, + "step": 24275 + }, + { + "epoch": 243.91, + "learning_rate": 3.975949367088608e-06, + "loss": 0.0, + "step": 24300 + }, + { + "epoch": 244.17, + "learning_rate": 3.969620253164557e-06, + "loss": 0.0, + "step": 24325 + }, + { + "epoch": 244.42, + "learning_rate": 3.9632911392405065e-06, + "loss": 0.0, + "step": 24350 + }, + { + "epoch": 244.67, + "learning_rate": 3.956962025316456e-06, + "loss": 0.0, + "step": 24375 + }, + { + "epoch": 244.92, + "learning_rate": 3.950632911392405e-06, + "loss": 0.0, + "step": 24400 + }, + { + "epoch": 245.17, + "learning_rate": 3.944303797468355e-06, + "loss": 0.0, + "step": 24425 + }, + { + "epoch": 245.42, + "learning_rate": 3.937974683544304e-06, + "loss": 0.0, + "step": 24450 + }, + { + "epoch": 245.67, + "learning_rate": 3.931645569620254e-06, + "loss": 0.0, + "step": 24475 + }, + { + "epoch": 245.92, + "learning_rate": 3.925316455696203e-06, + "loss": 0.0, + "step": 24500 + }, + { + "epoch": 246.17, + "learning_rate": 3.9189873417721525e-06, + "loss": 0.0, + "step": 24525 + }, + { + "epoch": 246.42, + "learning_rate": 3.912658227848102e-06, + "loss": 0.0, + "step": 24550 + }, + { + "epoch": 246.68, + "learning_rate": 3.906329113924051e-06, + "loss": 0.0, + "step": 24575 + }, + { + "epoch": 246.93, + "learning_rate": 3.900000000000001e-06, + "loss": 0.0, + "step": 24600 + }, + { + "epoch": 247.18, + "learning_rate": 3.89367088607595e-06, + "loss": 0.0, + "step": 24625 + }, + { + "epoch": 247.43, + "learning_rate": 3.887341772151899e-06, + "loss": 0.0, + "step": 24650 + }, + { + "epoch": 247.68, + "learning_rate": 3.881012658227848e-06, + "loss": 0.0, + "step": 24675 + }, + { + "epoch": 247.93, + "learning_rate": 3.874683544303798e-06, + "loss": 0.0, + "step": 24700 + }, + { + "epoch": 248.18, + "learning_rate": 3.868354430379747e-06, + "loss": 0.0, + "step": 24725 + }, + { + "epoch": 248.43, + "learning_rate": 3.8620253164556965e-06, + "loss": 0.0, + "step": 24750 + }, + { + "epoch": 248.68, + "learning_rate": 3.855696202531646e-06, + "loss": 0.0, + "step": 24775 + }, + { + "epoch": 248.93, + "learning_rate": 3.849367088607595e-06, + "loss": 0.0, + "step": 24800 + }, + { + "epoch": 249.18, + "learning_rate": 3.843037974683545e-06, + "loss": 0.0, + "step": 24825 + }, + { + "epoch": 249.44, + "learning_rate": 3.836708860759493e-06, + "loss": 0.0, + "step": 24850 + }, + { + "epoch": 249.69, + "learning_rate": 3.830379746835443e-06, + "loss": 0.0, + "step": 24875 + }, + { + "epoch": 249.94, + "learning_rate": 3.824050632911392e-06, + "loss": 0.0, + "step": 24900 + }, + { + "epoch": 250.19, + "learning_rate": 3.8177215189873425e-06, + "loss": 0.0, + "step": 24925 + }, + { + "epoch": 250.44, + "learning_rate": 3.8113924050632915e-06, + "loss": 0.0, + "step": 24950 + }, + { + "epoch": 250.69, + "learning_rate": 3.805063291139241e-06, + "loss": 0.0, + "step": 24975 + }, + { + "epoch": 250.94, + "learning_rate": 3.7987341772151903e-06, + "loss": 0.0, + "step": 25000 + }, + { + "epoch": 250.94, + "eval_loss": 0.3101833760738373, + "eval_runtime": 2782.1977, + "eval_samples_per_second": 4.58, + "eval_steps_per_second": 0.286, + "eval_wer": 6.877247147100203, + "step": 25000 + }, + { + "epoch": 251.19, + "learning_rate": 3.7924050632911398e-06, + "loss": 0.0, + "step": 25025 + }, + { + "epoch": 251.44, + "learning_rate": 3.786075949367089e-06, + "loss": 0.0, + "step": 25050 + }, + { + "epoch": 251.69, + "learning_rate": 3.779746835443038e-06, + "loss": 0.0, + "step": 25075 + }, + { + "epoch": 251.94, + "learning_rate": 3.7734177215189876e-06, + "loss": 0.0, + "step": 25100 + }, + { + "epoch": 252.2, + "learning_rate": 3.767088607594937e-06, + "loss": 0.0, + "step": 25125 + }, + { + "epoch": 252.45, + "learning_rate": 3.7607594936708865e-06, + "loss": 0.0, + "step": 25150 + }, + { + "epoch": 252.7, + "learning_rate": 3.7544303797468355e-06, + "loss": 0.0, + "step": 25175 + }, + { + "epoch": 252.95, + "learning_rate": 3.748101265822785e-06, + "loss": 0.0, + "step": 25200 + }, + { + "epoch": 253.2, + "learning_rate": 3.7417721518987344e-06, + "loss": 0.0, + "step": 25225 + }, + { + "epoch": 253.45, + "learning_rate": 3.7354430379746838e-06, + "loss": 0.0, + "step": 25250 + }, + { + "epoch": 253.7, + "learning_rate": 3.7291139240506328e-06, + "loss": 0.0, + "step": 25275 + }, + { + "epoch": 253.95, + "learning_rate": 3.722784810126582e-06, + "loss": 0.0, + "step": 25300 + }, + { + "epoch": 254.2, + "learning_rate": 3.716455696202532e-06, + "loss": 0.0, + "step": 25325 + }, + { + "epoch": 254.45, + "learning_rate": 3.7101265822784815e-06, + "loss": 0.0, + "step": 25350 + }, + { + "epoch": 254.71, + "learning_rate": 3.703797468354431e-06, + "loss": 0.0, + "step": 25375 + }, + { + "epoch": 254.96, + "learning_rate": 3.6974683544303803e-06, + "loss": 0.0, + "step": 25400 + }, + { + "epoch": 255.21, + "learning_rate": 3.6911392405063293e-06, + "loss": 0.0, + "step": 25425 + }, + { + "epoch": 255.46, + "learning_rate": 3.6848101265822788e-06, + "loss": 0.0, + "step": 25450 + }, + { + "epoch": 255.71, + "learning_rate": 3.678481012658228e-06, + "loss": 0.0, + "step": 25475 + }, + { + "epoch": 255.96, + "learning_rate": 3.6721518987341776e-06, + "loss": 0.0, + "step": 25500 + }, + { + "epoch": 256.21, + "learning_rate": 3.665822784810127e-06, + "loss": 0.0, + "step": 25525 + }, + { + "epoch": 256.46, + "learning_rate": 3.659493670886076e-06, + "loss": 0.0, + "step": 25550 + }, + { + "epoch": 256.71, + "learning_rate": 3.6531645569620255e-06, + "loss": 0.0, + "step": 25575 + }, + { + "epoch": 256.96, + "learning_rate": 3.646835443037975e-06, + "loss": 0.0, + "step": 25600 + }, + { + "epoch": 257.21, + "learning_rate": 3.6405063291139243e-06, + "loss": 0.0, + "step": 25625 + }, + { + "epoch": 257.47, + "learning_rate": 3.6341772151898734e-06, + "loss": 0.0, + "step": 25650 + }, + { + "epoch": 257.72, + "learning_rate": 3.6278481012658228e-06, + "loss": 0.0, + "step": 25675 + }, + { + "epoch": 257.97, + "learning_rate": 3.621518987341772e-06, + "loss": 0.0, + "step": 25700 + }, + { + "epoch": 258.22, + "learning_rate": 3.6151898734177216e-06, + "loss": 0.0, + "step": 25725 + }, + { + "epoch": 258.47, + "learning_rate": 3.6088607594936715e-06, + "loss": 0.0, + "step": 25750 + }, + { + "epoch": 258.72, + "learning_rate": 3.602531645569621e-06, + "loss": 0.0, + "step": 25775 + }, + { + "epoch": 258.97, + "learning_rate": 3.59620253164557e-06, + "loss": 0.0, + "step": 25800 + }, + { + "epoch": 259.22, + "learning_rate": 3.5898734177215193e-06, + "loss": 0.0, + "step": 25825 + }, + { + "epoch": 259.47, + "learning_rate": 3.5835443037974688e-06, + "loss": 0.0, + "step": 25850 + }, + { + "epoch": 259.72, + "learning_rate": 3.577215189873418e-06, + "loss": 0.0, + "step": 25875 + }, + { + "epoch": 259.97, + "learning_rate": 3.5708860759493676e-06, + "loss": 0.0, + "step": 25900 + }, + { + "epoch": 260.23, + "learning_rate": 3.5645569620253166e-06, + "loss": 0.0, + "step": 25925 + }, + { + "epoch": 260.48, + "learning_rate": 3.558227848101266e-06, + "loss": 0.0, + "step": 25950 + }, + { + "epoch": 260.73, + "learning_rate": 3.5518987341772155e-06, + "loss": 0.0, + "step": 25975 + }, + { + "epoch": 260.98, + "learning_rate": 3.545569620253165e-06, + "loss": 0.0, + "step": 26000 + }, + { + "epoch": 260.98, + "eval_loss": 0.3166370987892151, + "eval_runtime": 2780.7731, + "eval_samples_per_second": 4.582, + "eval_steps_per_second": 0.287, + "eval_wer": 6.889948413318743, + "step": 26000 + }, + { + "epoch": 261.23, + "learning_rate": 3.539240506329114e-06, + "loss": 0.0, + "step": 26025 + }, + { + "epoch": 261.48, + "learning_rate": 3.5329113924050633e-06, + "loss": 0.0, + "step": 26050 + }, + { + "epoch": 261.73, + "learning_rate": 3.5265822784810128e-06, + "loss": 0.0, + "step": 26075 + }, + { + "epoch": 261.98, + "learning_rate": 3.520253164556962e-06, + "loss": 0.0, + "step": 26100 + }, + { + "epoch": 262.23, + "learning_rate": 3.5139240506329116e-06, + "loss": 0.0, + "step": 26125 + }, + { + "epoch": 262.48, + "learning_rate": 3.5075949367088615e-06, + "loss": 0.0, + "step": 26150 + }, + { + "epoch": 262.74, + "learning_rate": 3.5012658227848105e-06, + "loss": 0.0, + "step": 26175 + }, + { + "epoch": 262.99, + "learning_rate": 3.49493670886076e-06, + "loss": 0.0, + "step": 26200 + }, + { + "epoch": 263.24, + "learning_rate": 3.4886075949367093e-06, + "loss": 0.0, + "step": 26225 + }, + { + "epoch": 263.49, + "learning_rate": 3.4822784810126588e-06, + "loss": 0.0, + "step": 26250 + }, + { + "epoch": 263.74, + "learning_rate": 3.4759493670886078e-06, + "loss": 0.0, + "step": 26275 + }, + { + "epoch": 263.99, + "learning_rate": 3.469620253164557e-06, + "loss": 0.0, + "step": 26300 + }, + { + "epoch": 264.24, + "learning_rate": 3.4632911392405066e-06, + "loss": 0.0, + "step": 26325 + }, + { + "epoch": 264.49, + "learning_rate": 3.456962025316456e-06, + "loss": 0.0, + "step": 26350 + }, + { + "epoch": 264.74, + "learning_rate": 3.4506329113924055e-06, + "loss": 0.0, + "step": 26375 + }, + { + "epoch": 264.99, + "learning_rate": 3.4443037974683545e-06, + "loss": 0.0, + "step": 26400 + }, + { + "epoch": 265.24, + "learning_rate": 3.437974683544304e-06, + "loss": 0.0, + "step": 26425 + }, + { + "epoch": 265.5, + "learning_rate": 3.4316455696202533e-06, + "loss": 0.0, + "step": 26450 + }, + { + "epoch": 265.75, + "learning_rate": 3.4253164556962028e-06, + "loss": 0.0, + "step": 26475 + }, + { + "epoch": 266.0, + "learning_rate": 3.4189873417721518e-06, + "loss": 0.0, + "step": 26500 + }, + { + "epoch": 266.25, + "learning_rate": 3.412658227848101e-06, + "loss": 0.0, + "step": 26525 + }, + { + "epoch": 266.5, + "learning_rate": 3.4063291139240506e-06, + "loss": 0.0, + "step": 26550 + }, + { + "epoch": 266.75, + "learning_rate": 3.4000000000000005e-06, + "loss": 0.0, + "step": 26575 + }, + { + "epoch": 267.0, + "learning_rate": 3.39367088607595e-06, + "loss": 0.0, + "step": 26600 + }, + { + "epoch": 267.25, + "learning_rate": 3.3873417721518993e-06, + "loss": 0.0, + "step": 26625 + }, + { + "epoch": 267.5, + "learning_rate": 3.3810126582278483e-06, + "loss": 0.0, + "step": 26650 + }, + { + "epoch": 267.75, + "learning_rate": 3.3746835443037978e-06, + "loss": 0.0, + "step": 26675 + }, + { + "epoch": 268.01, + "learning_rate": 3.368354430379747e-06, + "loss": 0.0, + "step": 26700 + }, + { + "epoch": 268.26, + "learning_rate": 3.3620253164556966e-06, + "loss": 0.0, + "step": 26725 + }, + { + "epoch": 268.51, + "learning_rate": 3.355696202531646e-06, + "loss": 0.0, + "step": 26750 + }, + { + "epoch": 268.76, + "learning_rate": 3.349367088607595e-06, + "loss": 0.0, + "step": 26775 + }, + { + "epoch": 269.01, + "learning_rate": 3.3430379746835445e-06, + "loss": 0.0, + "step": 26800 + }, + { + "epoch": 269.26, + "learning_rate": 3.336708860759494e-06, + "loss": 0.0, + "step": 26825 + }, + { + "epoch": 269.51, + "learning_rate": 3.3303797468354433e-06, + "loss": 0.0, + "step": 26850 + }, + { + "epoch": 269.76, + "learning_rate": 3.3240506329113923e-06, + "loss": 0.0, + "step": 26875 + }, + { + "epoch": 270.01, + "learning_rate": 3.3177215189873418e-06, + "loss": 0.0, + "step": 26900 + }, + { + "epoch": 270.26, + "learning_rate": 3.311392405063291e-06, + "loss": 0.0, + "step": 26925 + }, + { + "epoch": 270.51, + "learning_rate": 3.3050632911392406e-06, + "loss": 0.0, + "step": 26950 + }, + { + "epoch": 270.77, + "learning_rate": 3.2987341772151905e-06, + "loss": 0.0, + "step": 26975 + }, + { + "epoch": 271.02, + "learning_rate": 3.29240506329114e-06, + "loss": 0.0, + "step": 27000 + }, + { + "epoch": 271.02, + "eval_loss": 0.3233168423175812, + "eval_runtime": 2786.2635, + "eval_samples_per_second": 4.573, + "eval_steps_per_second": 0.286, + "eval_wer": 6.891902454275442, + "step": 27000 + }, + { + "epoch": 271.27, + "learning_rate": 3.286075949367089e-06, + "loss": 0.0, + "step": 27025 + }, + { + "epoch": 271.52, + "learning_rate": 3.2797468354430383e-06, + "loss": 0.0, + "step": 27050 + }, + { + "epoch": 271.77, + "learning_rate": 3.2734177215189878e-06, + "loss": 0.0, + "step": 27075 + }, + { + "epoch": 272.02, + "learning_rate": 3.267088607594937e-06, + "loss": 0.0, + "step": 27100 + }, + { + "epoch": 272.27, + "learning_rate": 3.260759493670886e-06, + "loss": 0.0, + "step": 27125 + }, + { + "epoch": 272.52, + "learning_rate": 3.2544303797468356e-06, + "loss": 0.0, + "step": 27150 + }, + { + "epoch": 272.77, + "learning_rate": 3.248101265822785e-06, + "loss": 0.0, + "step": 27175 + }, + { + "epoch": 273.02, + "learning_rate": 3.2417721518987345e-06, + "loss": 0.0, + "step": 27200 + }, + { + "epoch": 273.27, + "learning_rate": 3.235443037974684e-06, + "loss": 0.0, + "step": 27225 + }, + { + "epoch": 273.53, + "learning_rate": 3.229113924050633e-06, + "loss": 0.0, + "step": 27250 + }, + { + "epoch": 273.78, + "learning_rate": 3.2227848101265823e-06, + "loss": 0.0, + "step": 27275 + }, + { + "epoch": 274.03, + "learning_rate": 3.2164556962025318e-06, + "loss": 0.0, + "step": 27300 + }, + { + "epoch": 274.28, + "learning_rate": 3.210126582278481e-06, + "loss": 0.0, + "step": 27325 + }, + { + "epoch": 274.53, + "learning_rate": 3.20379746835443e-06, + "loss": 0.0, + "step": 27350 + }, + { + "epoch": 274.78, + "learning_rate": 3.1974683544303805e-06, + "loss": 0.0, + "step": 27375 + }, + { + "epoch": 275.03, + "learning_rate": 3.1911392405063295e-06, + "loss": 0.0, + "step": 27400 + }, + { + "epoch": 275.28, + "learning_rate": 3.184810126582279e-06, + "loss": 0.0, + "step": 27425 + }, + { + "epoch": 275.53, + "learning_rate": 3.1784810126582283e-06, + "loss": 0.0, + "step": 27450 + }, + { + "epoch": 275.78, + "learning_rate": 3.1721518987341778e-06, + "loss": 0.0, + "step": 27475 + }, + { + "epoch": 276.04, + "learning_rate": 3.1658227848101268e-06, + "loss": 0.0, + "step": 27500 + }, + { + "epoch": 276.29, + "learning_rate": 3.159493670886076e-06, + "loss": 0.0, + "step": 27525 + }, + { + "epoch": 276.54, + "learning_rate": 3.1531645569620256e-06, + "loss": 0.0, + "step": 27550 + }, + { + "epoch": 276.79, + "learning_rate": 3.146835443037975e-06, + "loss": 0.0, + "step": 27575 + }, + { + "epoch": 277.04, + "learning_rate": 3.1405063291139245e-06, + "loss": 0.0, + "step": 27600 + }, + { + "epoch": 277.29, + "learning_rate": 3.1341772151898735e-06, + "loss": 0.0, + "step": 27625 + }, + { + "epoch": 277.54, + "learning_rate": 3.127848101265823e-06, + "loss": 0.0, + "step": 27650 + }, + { + "epoch": 277.79, + "learning_rate": 3.1215189873417723e-06, + "loss": 0.0, + "step": 27675 + }, + { + "epoch": 278.04, + "learning_rate": 3.1151898734177218e-06, + "loss": 0.0, + "step": 27700 + }, + { + "epoch": 278.29, + "learning_rate": 3.1088607594936708e-06, + "loss": 0.0, + "step": 27725 + }, + { + "epoch": 278.54, + "learning_rate": 3.10253164556962e-06, + "loss": 0.0, + "step": 27750 + }, + { + "epoch": 278.8, + "learning_rate": 3.0962025316455696e-06, + "loss": 0.0, + "step": 27775 + }, + { + "epoch": 279.05, + "learning_rate": 3.0898734177215195e-06, + "loss": 0.0, + "step": 27800 + }, + { + "epoch": 279.3, + "learning_rate": 3.083544303797469e-06, + "loss": 0.0, + "step": 27825 + }, + { + "epoch": 279.55, + "learning_rate": 3.0772151898734183e-06, + "loss": 0.0, + "step": 27850 + }, + { + "epoch": 279.8, + "learning_rate": 3.0708860759493673e-06, + "loss": 0.0, + "step": 27875 + }, + { + "epoch": 280.05, + "learning_rate": 3.0645569620253168e-06, + "loss": 0.0, + "step": 27900 + }, + { + "epoch": 280.3, + "learning_rate": 3.058227848101266e-06, + "loss": 0.0, + "step": 27925 + }, + { + "epoch": 280.55, + "learning_rate": 3.0518987341772156e-06, + "loss": 0.0, + "step": 27950 + }, + { + "epoch": 280.8, + "learning_rate": 3.0455696202531646e-06, + "loss": 0.0, + "step": 27975 + }, + { + "epoch": 281.05, + "learning_rate": 3.039240506329114e-06, + "loss": 0.0, + "step": 28000 + }, + { + "epoch": 281.05, + "eval_loss": 0.32482120394706726, + "eval_runtime": 2800.9161, + "eval_samples_per_second": 4.549, + "eval_steps_per_second": 0.285, + "eval_wer": 6.891902454275442, + "step": 28000 + }, + { + "epoch": 281.3, + "learning_rate": 3.0329113924050635e-06, + "loss": 0.0, + "step": 28025 + }, + { + "epoch": 281.56, + "learning_rate": 3.026835443037975e-06, + "loss": 0.0, + "step": 28050 + }, + { + "epoch": 281.81, + "learning_rate": 3.0205063291139244e-06, + "loss": 0.0, + "step": 28075 + }, + { + "epoch": 282.06, + "learning_rate": 3.0141772151898734e-06, + "loss": 0.0, + "step": 28100 + }, + { + "epoch": 282.31, + "learning_rate": 3.0078481012658228e-06, + "loss": 0.0, + "step": 28125 + }, + { + "epoch": 282.56, + "learning_rate": 3.0015189873417722e-06, + "loss": 0.0, + "step": 28150 + }, + { + "epoch": 282.81, + "learning_rate": 2.9951898734177216e-06, + "loss": 0.0, + "step": 28175 + }, + { + "epoch": 283.06, + "learning_rate": 2.9888607594936715e-06, + "loss": 0.0, + "step": 28200 + }, + { + "epoch": 283.31, + "learning_rate": 2.982531645569621e-06, + "loss": 0.0, + "step": 28225 + }, + { + "epoch": 283.56, + "learning_rate": 2.97620253164557e-06, + "loss": 0.0, + "step": 28250 + }, + { + "epoch": 283.81, + "learning_rate": 2.9698734177215194e-06, + "loss": 0.0, + "step": 28275 + }, + { + "epoch": 284.07, + "learning_rate": 2.9635443037974688e-06, + "loss": 0.0, + "step": 28300 + }, + { + "epoch": 284.32, + "learning_rate": 2.957215189873418e-06, + "loss": 0.0, + "step": 28325 + }, + { + "epoch": 284.57, + "learning_rate": 2.950886075949367e-06, + "loss": 0.0, + "step": 28350 + }, + { + "epoch": 284.82, + "learning_rate": 2.9445569620253166e-06, + "loss": 0.0, + "step": 28375 + }, + { + "epoch": 285.07, + "learning_rate": 2.938227848101266e-06, + "loss": 0.0, + "step": 28400 + }, + { + "epoch": 285.32, + "learning_rate": 2.9318987341772155e-06, + "loss": 0.0, + "step": 28425 + }, + { + "epoch": 285.57, + "learning_rate": 2.925569620253165e-06, + "loss": 0.0, + "step": 28450 + }, + { + "epoch": 285.82, + "learning_rate": 2.919240506329114e-06, + "loss": 0.0, + "step": 28475 + }, + { + "epoch": 286.07, + "learning_rate": 2.9129113924050634e-06, + "loss": 0.0, + "step": 28500 + }, + { + "epoch": 286.32, + "learning_rate": 2.9065822784810128e-06, + "loss": 0.0, + "step": 28525 + }, + { + "epoch": 286.57, + "learning_rate": 2.900253164556962e-06, + "loss": 0.0, + "step": 28550 + }, + { + "epoch": 286.83, + "learning_rate": 2.8939240506329112e-06, + "loss": 0.0, + "step": 28575 + }, + { + "epoch": 287.08, + "learning_rate": 2.887594936708861e-06, + "loss": 0.0, + "step": 28600 + }, + { + "epoch": 287.33, + "learning_rate": 2.8812658227848105e-06, + "loss": 0.0, + "step": 28625 + }, + { + "epoch": 287.58, + "learning_rate": 2.87493670886076e-06, + "loss": 0.0, + "step": 28650 + }, + { + "epoch": 287.83, + "learning_rate": 2.8686075949367093e-06, + "loss": 0.0, + "step": 28675 + }, + { + "epoch": 288.08, + "learning_rate": 2.8622784810126588e-06, + "loss": 0.0, + "step": 28700 + }, + { + "epoch": 288.33, + "learning_rate": 2.8559493670886078e-06, + "loss": 0.0, + "step": 28725 + }, + { + "epoch": 288.58, + "learning_rate": 2.849620253164557e-06, + "loss": 0.0, + "step": 28750 + }, + { + "epoch": 288.83, + "learning_rate": 2.8432911392405066e-06, + "loss": 0.0, + "step": 28775 + }, + { + "epoch": 289.08, + "learning_rate": 2.836962025316456e-06, + "loss": 0.0, + "step": 28800 + }, + { + "epoch": 289.34, + "learning_rate": 2.830632911392405e-06, + "loss": 0.0, + "step": 28825 + }, + { + "epoch": 289.59, + "learning_rate": 2.8243037974683545e-06, + "loss": 0.0, + "step": 28850 + }, + { + "epoch": 289.84, + "learning_rate": 2.817974683544304e-06, + "loss": 0.0, + "step": 28875 + }, + { + "epoch": 290.09, + "learning_rate": 2.8116455696202533e-06, + "loss": 0.0, + "step": 28900 + }, + { + "epoch": 290.34, + "learning_rate": 2.8053164556962028e-06, + "loss": 0.0, + "step": 28925 + }, + { + "epoch": 290.59, + "learning_rate": 2.7989873417721518e-06, + "loss": 0.0, + "step": 28950 + }, + { + "epoch": 290.84, + "learning_rate": 2.792658227848101e-06, + "loss": 0.0, + "step": 28975 + }, + { + "epoch": 291.09, + "learning_rate": 2.7863291139240506e-06, + "loss": 0.0, + "step": 29000 + }, + { + "epoch": 291.09, + "eval_loss": 0.33633747696876526, + "eval_runtime": 2783.0499, + "eval_samples_per_second": 4.578, + "eval_steps_per_second": 0.286, + "eval_wer": 6.902649679537283, + "step": 29000 + }, + { + "epoch": 291.34, + "learning_rate": 2.7800000000000005e-06, + "loss": 0.0, + "step": 29025 + }, + { + "epoch": 291.59, + "learning_rate": 2.77367088607595e-06, + "loss": 0.0, + "step": 29050 + }, + { + "epoch": 291.84, + "learning_rate": 2.7673417721518993e-06, + "loss": 0.0, + "step": 29075 + }, + { + "epoch": 292.1, + "learning_rate": 2.7610126582278483e-06, + "loss": 0.0, + "step": 29100 + }, + { + "epoch": 292.35, + "learning_rate": 2.7546835443037978e-06, + "loss": 0.0, + "step": 29125 + }, + { + "epoch": 292.6, + "learning_rate": 2.748354430379747e-06, + "loss": 0.0, + "step": 29150 + }, + { + "epoch": 292.85, + "learning_rate": 2.7420253164556966e-06, + "loss": 0.0, + "step": 29175 + }, + { + "epoch": 293.1, + "learning_rate": 2.7356962025316456e-06, + "loss": 0.0, + "step": 29200 + }, + { + "epoch": 293.35, + "learning_rate": 2.729367088607595e-06, + "loss": 0.0, + "step": 29225 + }, + { + "epoch": 293.6, + "learning_rate": 2.7230379746835445e-06, + "loss": 0.0, + "step": 29250 + }, + { + "epoch": 293.85, + "learning_rate": 2.716708860759494e-06, + "loss": 0.0, + "step": 29275 + }, + { + "epoch": 294.1, + "learning_rate": 2.7103797468354433e-06, + "loss": 0.0, + "step": 29300 + }, + { + "epoch": 294.35, + "learning_rate": 2.7040506329113923e-06, + "loss": 0.0, + "step": 29325 + }, + { + "epoch": 294.6, + "learning_rate": 2.6977215189873418e-06, + "loss": 0.0, + "step": 29350 + }, + { + "epoch": 294.86, + "learning_rate": 2.691392405063291e-06, + "loss": 0.0, + "step": 29375 + }, + { + "epoch": 295.11, + "learning_rate": 2.6850632911392406e-06, + "loss": 0.0, + "step": 29400 + }, + { + "epoch": 295.36, + "learning_rate": 2.6787341772151905e-06, + "loss": 0.0, + "step": 29425 + }, + { + "epoch": 295.61, + "learning_rate": 2.6724050632911395e-06, + "loss": 0.0, + "step": 29450 + }, + { + "epoch": 295.86, + "learning_rate": 2.666075949367089e-06, + "loss": 0.0, + "step": 29475 + }, + { + "epoch": 296.11, + "learning_rate": 2.6597468354430383e-06, + "loss": 0.0, + "step": 29500 + }, + { + "epoch": 296.36, + "learning_rate": 2.6534177215189878e-06, + "loss": 0.0, + "step": 29525 + }, + { + "epoch": 296.61, + "learning_rate": 2.647088607594937e-06, + "loss": 0.0, + "step": 29550 + }, + { + "epoch": 296.86, + "learning_rate": 2.640759493670886e-06, + "loss": 0.0, + "step": 29575 + }, + { + "epoch": 297.11, + "learning_rate": 2.6344303797468356e-06, + "loss": 0.0, + "step": 29600 + }, + { + "epoch": 297.37, + "learning_rate": 2.628101265822785e-06, + "loss": 0.0, + "step": 29625 + }, + { + "epoch": 297.62, + "learning_rate": 2.6217721518987345e-06, + "loss": 0.0, + "step": 29650 + }, + { + "epoch": 297.87, + "learning_rate": 2.6154430379746835e-06, + "loss": 0.0, + "step": 29675 + }, + { + "epoch": 298.12, + "learning_rate": 2.609113924050633e-06, + "loss": 0.0, + "step": 29700 + }, + { + "epoch": 298.37, + "learning_rate": 2.6027848101265823e-06, + "loss": 0.0, + "step": 29725 + }, + { + "epoch": 298.62, + "learning_rate": 2.5964556962025318e-06, + "loss": 0.0, + "step": 29750 + }, + { + "epoch": 298.87, + "learning_rate": 2.590126582278481e-06, + "loss": 0.0, + "step": 29775 + }, + { + "epoch": 299.12, + "learning_rate": 2.58379746835443e-06, + "loss": 0.0, + "step": 29800 + }, + { + "epoch": 299.37, + "learning_rate": 2.5774683544303796e-06, + "loss": 0.0, + "step": 29825 + }, + { + "epoch": 299.62, + "learning_rate": 2.5711392405063295e-06, + "loss": 0.0, + "step": 29850 + }, + { + "epoch": 299.87, + "learning_rate": 2.564810126582279e-06, + "loss": 0.0, + "step": 29875 + }, + { + "epoch": 300.13, + "learning_rate": 2.5584810126582283e-06, + "loss": 0.0, + "step": 29900 + }, + { + "epoch": 300.38, + "learning_rate": 2.5521518987341778e-06, + "loss": 0.0, + "step": 29925 + }, + { + "epoch": 300.63, + "learning_rate": 2.5458227848101268e-06, + "loss": 0.0, + "step": 29950 + }, + { + "epoch": 300.88, + "learning_rate": 2.539493670886076e-06, + "loss": 0.0, + "step": 29975 + }, + { + "epoch": 301.13, + "learning_rate": 2.5331645569620256e-06, + "loss": 0.0, + "step": 30000 + }, + { + "epoch": 301.13, + "eval_loss": 0.34187453985214233, + "eval_runtime": 2782.5975, + "eval_samples_per_second": 4.579, + "eval_steps_per_second": 0.286, + "eval_wer": 6.908511802407379, + "step": 30000 + }, + { + "epoch": 301.38, + "learning_rate": 2.526835443037975e-06, + "loss": 0.0, + "step": 30025 + }, + { + "epoch": 301.63, + "learning_rate": 2.520506329113924e-06, + "loss": 0.0, + "step": 30050 + }, + { + "epoch": 301.88, + "learning_rate": 2.5144303797468355e-06, + "loss": 0.0, + "step": 30075 + }, + { + "epoch": 302.13, + "learning_rate": 2.508101265822785e-06, + "loss": 0.0, + "step": 30100 + }, + { + "epoch": 302.38, + "learning_rate": 2.5017721518987344e-06, + "loss": 0.0, + "step": 30125 + }, + { + "epoch": 302.63, + "learning_rate": 2.495443037974684e-06, + "loss": 0.0, + "step": 30150 + }, + { + "epoch": 302.89, + "learning_rate": 2.4891139240506332e-06, + "loss": 0.0, + "step": 30175 + }, + { + "epoch": 303.14, + "learning_rate": 2.4827848101265826e-06, + "loss": 0.0, + "step": 30200 + }, + { + "epoch": 303.39, + "learning_rate": 2.4764556962025317e-06, + "loss": 0.0, + "step": 30225 + }, + { + "epoch": 303.64, + "learning_rate": 2.470126582278481e-06, + "loss": 0.0, + "step": 30250 + }, + { + "epoch": 303.89, + "learning_rate": 2.4637974683544305e-06, + "loss": 0.0, + "step": 30275 + }, + { + "epoch": 304.14, + "learning_rate": 2.45746835443038e-06, + "loss": 0.0, + "step": 30300 + }, + { + "epoch": 304.39, + "learning_rate": 2.4511392405063294e-06, + "loss": 0.0, + "step": 30325 + }, + { + "epoch": 304.64, + "learning_rate": 2.444810126582279e-06, + "loss": 0.0, + "step": 30350 + }, + { + "epoch": 304.89, + "learning_rate": 2.4384810126582282e-06, + "loss": 0.0, + "step": 30375 + }, + { + "epoch": 305.14, + "learning_rate": 2.4321518987341776e-06, + "loss": 0.0, + "step": 30400 + }, + { + "epoch": 305.4, + "learning_rate": 2.4258227848101266e-06, + "loss": 0.0, + "step": 30425 + }, + { + "epoch": 305.65, + "learning_rate": 2.419493670886076e-06, + "loss": 0.0, + "step": 30450 + }, + { + "epoch": 305.9, + "learning_rate": 2.4131645569620255e-06, + "loss": 0.0, + "step": 30475 + }, + { + "epoch": 306.15, + "learning_rate": 2.406835443037975e-06, + "loss": 0.0, + "step": 30500 + }, + { + "epoch": 306.4, + "learning_rate": 2.400506329113924e-06, + "loss": 0.0, + "step": 30525 + }, + { + "epoch": 306.65, + "learning_rate": 2.394177215189874e-06, + "loss": 0.0, + "step": 30550 + }, + { + "epoch": 306.9, + "learning_rate": 2.3878481012658232e-06, + "loss": 0.0, + "step": 30575 + }, + { + "epoch": 307.15, + "learning_rate": 2.3815189873417722e-06, + "loss": 0.0, + "step": 30600 + }, + { + "epoch": 307.4, + "learning_rate": 2.3751898734177216e-06, + "loss": 0.0, + "step": 30625 + }, + { + "epoch": 307.65, + "learning_rate": 2.368860759493671e-06, + "loss": 0.0, + "step": 30650 + }, + { + "epoch": 307.9, + "learning_rate": 2.3625316455696205e-06, + "loss": 0.0, + "step": 30675 + }, + { + "epoch": 308.16, + "learning_rate": 2.35620253164557e-06, + "loss": 0.0, + "step": 30700 + }, + { + "epoch": 308.41, + "learning_rate": 2.349873417721519e-06, + "loss": 0.0, + "step": 30725 + }, + { + "epoch": 308.66, + "learning_rate": 2.3435443037974688e-06, + "loss": 0.0, + "step": 30750 + }, + { + "epoch": 308.91, + "learning_rate": 2.337215189873418e-06, + "loss": 0.0, + "step": 30775 + }, + { + "epoch": 309.16, + "learning_rate": 2.3308860759493672e-06, + "loss": 0.0, + "step": 30800 + }, + { + "epoch": 309.41, + "learning_rate": 2.3245569620253166e-06, + "loss": 0.0, + "step": 30825 + }, + { + "epoch": 309.66, + "learning_rate": 2.318227848101266e-06, + "loss": 0.0, + "step": 30850 + }, + { + "epoch": 309.91, + "learning_rate": 2.3118987341772155e-06, + "loss": 0.0, + "step": 30875 + }, + { + "epoch": 310.16, + "learning_rate": 2.3055696202531645e-06, + "loss": 0.0, + "step": 30900 + }, + { + "epoch": 310.41, + "learning_rate": 2.299240506329114e-06, + "loss": 0.0, + "step": 30925 + }, + { + "epoch": 310.66, + "learning_rate": 2.2929113924050638e-06, + "loss": 0.0, + "step": 30950 + }, + { + "epoch": 310.92, + "learning_rate": 2.286582278481013e-06, + "loss": 0.0, + "step": 30975 + }, + { + "epoch": 311.17, + "learning_rate": 2.2802531645569622e-06, + "loss": 0.0, + "step": 31000 + }, + { + "epoch": 311.17, + "eval_loss": 0.34709784388542175, + "eval_runtime": 2784.8814, + "eval_samples_per_second": 4.575, + "eval_steps_per_second": 0.286, + "eval_wer": 6.885063310926998, + "step": 31000 + }, + { + "epoch": 311.42, + "learning_rate": 2.2739240506329116e-06, + "loss": 0.0, + "step": 31025 + }, + { + "epoch": 311.67, + "learning_rate": 2.267594936708861e-06, + "loss": 0.0, + "step": 31050 + }, + { + "epoch": 311.92, + "learning_rate": 2.26126582278481e-06, + "loss": 0.0, + "step": 31075 + }, + { + "epoch": 312.17, + "learning_rate": 2.2549367088607595e-06, + "loss": 0.0, + "step": 31100 + }, + { + "epoch": 312.42, + "learning_rate": 2.248607594936709e-06, + "loss": 0.0, + "step": 31125 + }, + { + "epoch": 312.67, + "learning_rate": 2.2422784810126584e-06, + "loss": 0.0, + "step": 31150 + }, + { + "epoch": 312.92, + "learning_rate": 2.2359493670886078e-06, + "loss": 0.0, + "step": 31175 + }, + { + "epoch": 313.17, + "learning_rate": 2.2296202531645572e-06, + "loss": 0.0, + "step": 31200 + }, + { + "epoch": 313.43, + "learning_rate": 2.2232911392405066e-06, + "loss": 0.0, + "step": 31225 + }, + { + "epoch": 313.68, + "learning_rate": 2.216962025316456e-06, + "loss": 0.0, + "step": 31250 + }, + { + "epoch": 313.93, + "learning_rate": 2.210632911392405e-06, + "loss": 0.0, + "step": 31275 + }, + { + "epoch": 314.18, + "learning_rate": 2.2043037974683545e-06, + "loss": 0.0, + "step": 31300 + }, + { + "epoch": 314.43, + "learning_rate": 2.197974683544304e-06, + "loss": 0.0, + "step": 31325 + }, + { + "epoch": 314.68, + "learning_rate": 2.1916455696202534e-06, + "loss": 0.0, + "step": 31350 + }, + { + "epoch": 314.93, + "learning_rate": 2.1853164556962028e-06, + "loss": 0.0, + "step": 31375 + }, + { + "epoch": 315.18, + "learning_rate": 2.1789873417721522e-06, + "loss": 0.0, + "step": 31400 + }, + { + "epoch": 315.43, + "learning_rate": 2.1726582278481016e-06, + "loss": 0.0, + "step": 31425 + }, + { + "epoch": 315.68, + "learning_rate": 2.1663291139240506e-06, + "loss": 0.0, + "step": 31450 + }, + { + "epoch": 315.93, + "learning_rate": 2.16e-06, + "loss": 0.0, + "step": 31475 + }, + { + "epoch": 316.19, + "learning_rate": 2.1536708860759495e-06, + "loss": 0.0, + "step": 31500 + }, + { + "epoch": 316.44, + "learning_rate": 2.147341772151899e-06, + "loss": 0.0, + "step": 31525 + }, + { + "epoch": 316.69, + "learning_rate": 2.1410126582278484e-06, + "loss": 0.0, + "step": 31550 + }, + { + "epoch": 316.94, + "learning_rate": 2.1346835443037978e-06, + "loss": 0.0, + "step": 31575 + }, + { + "epoch": 317.19, + "learning_rate": 2.128354430379747e-06, + "loss": 0.0, + "step": 31600 + }, + { + "epoch": 317.44, + "learning_rate": 2.1220253164556966e-06, + "loss": 0.0, + "step": 31625 + }, + { + "epoch": 317.69, + "learning_rate": 2.1156962025316456e-06, + "loss": 0.0, + "step": 31650 + }, + { + "epoch": 317.94, + "learning_rate": 2.109367088607595e-06, + "loss": 0.0, + "step": 31675 + }, + { + "epoch": 318.19, + "learning_rate": 2.1030379746835445e-06, + "loss": 0.0, + "step": 31700 + }, + { + "epoch": 318.44, + "learning_rate": 2.096708860759494e-06, + "loss": 0.0, + "step": 31725 + }, + { + "epoch": 318.7, + "learning_rate": 2.090379746835443e-06, + "loss": 0.0, + "step": 31750 + }, + { + "epoch": 318.95, + "learning_rate": 2.0840506329113928e-06, + "loss": 0.0, + "step": 31775 + }, + { + "epoch": 319.2, + "learning_rate": 2.077721518987342e-06, + "loss": 0.0, + "step": 31800 + }, + { + "epoch": 319.45, + "learning_rate": 2.0713924050632912e-06, + "loss": 0.0, + "step": 31825 + }, + { + "epoch": 319.7, + "learning_rate": 2.0650632911392406e-06, + "loss": 0.0, + "step": 31850 + }, + { + "epoch": 319.95, + "learning_rate": 2.05873417721519e-06, + "loss": 0.0, + "step": 31875 + }, + { + "epoch": 320.2, + "learning_rate": 2.0524050632911395e-06, + "loss": 0.0, + "step": 31900 + }, + { + "epoch": 320.45, + "learning_rate": 2.0460759493670885e-06, + "loss": 0.0, + "step": 31925 + }, + { + "epoch": 320.7, + "learning_rate": 2.039746835443038e-06, + "loss": 0.0, + "step": 31950 + }, + { + "epoch": 320.95, + "learning_rate": 2.0334177215189878e-06, + "loss": 0.0, + "step": 31975 + }, + { + "epoch": 321.2, + "learning_rate": 2.0270886075949368e-06, + "loss": 0.0, + "step": 32000 + }, + { + "epoch": 321.2, + "eval_loss": 0.3526245951652527, + "eval_runtime": 2793.8043, + "eval_samples_per_second": 4.561, + "eval_steps_per_second": 0.285, + "eval_wer": 6.870408003751758, + "step": 32000 + }, + { + "epoch": 321.46, + "learning_rate": 2.020759493670886e-06, + "loss": 0.0, + "step": 32025 + }, + { + "epoch": 321.71, + "learning_rate": 2.0144303797468356e-06, + "loss": 0.0, + "step": 32050 + }, + { + "epoch": 321.96, + "learning_rate": 2.008101265822785e-06, + "loss": 0.0, + "step": 32075 + }, + { + "epoch": 322.21, + "learning_rate": 2.0017721518987345e-06, + "loss": 0.0, + "step": 32100 + }, + { + "epoch": 322.46, + "learning_rate": 1.9954430379746835e-06, + "loss": 0.0, + "step": 32125 + }, + { + "epoch": 322.71, + "learning_rate": 1.989367088607595e-06, + "loss": 0.0, + "step": 32150 + }, + { + "epoch": 322.96, + "learning_rate": 1.9830379746835444e-06, + "loss": 0.0, + "step": 32175 + }, + { + "epoch": 323.21, + "learning_rate": 1.976708860759494e-06, + "loss": 0.0, + "step": 32200 + }, + { + "epoch": 323.46, + "learning_rate": 1.9703797468354432e-06, + "loss": 0.0, + "step": 32225 + }, + { + "epoch": 323.71, + "learning_rate": 1.9640506329113927e-06, + "loss": 0.0, + "step": 32250 + }, + { + "epoch": 323.96, + "learning_rate": 1.957721518987342e-06, + "loss": 0.0, + "step": 32275 + }, + { + "epoch": 324.22, + "learning_rate": 1.951392405063291e-06, + "loss": 0.0, + "step": 32300 + }, + { + "epoch": 324.47, + "learning_rate": 1.9450632911392405e-06, + "loss": 0.0, + "step": 32325 + }, + { + "epoch": 324.72, + "learning_rate": 1.93873417721519e-06, + "loss": 0.0, + "step": 32350 + }, + { + "epoch": 324.97, + "learning_rate": 1.9324050632911394e-06, + "loss": 0.0, + "step": 32375 + }, + { + "epoch": 325.22, + "learning_rate": 1.926075949367089e-06, + "loss": 0.0, + "step": 32400 + }, + { + "epoch": 325.47, + "learning_rate": 1.9197468354430382e-06, + "loss": 0.0, + "step": 32425 + }, + { + "epoch": 325.72, + "learning_rate": 1.9134177215189877e-06, + "loss": 0.0, + "step": 32450 + }, + { + "epoch": 325.97, + "learning_rate": 1.9070886075949369e-06, + "loss": 0.0, + "step": 32475 + }, + { + "epoch": 326.22, + "learning_rate": 1.900759493670886e-06, + "loss": 0.0, + "step": 32500 + }, + { + "epoch": 326.47, + "learning_rate": 1.8944303797468355e-06, + "loss": 0.0, + "step": 32525 + }, + { + "epoch": 326.73, + "learning_rate": 1.888101265822785e-06, + "loss": 0.0, + "step": 32550 + }, + { + "epoch": 326.98, + "learning_rate": 1.8817721518987344e-06, + "loss": 0.0, + "step": 32575 + }, + { + "epoch": 327.23, + "learning_rate": 1.8754430379746838e-06, + "loss": 0.0, + "step": 32600 + }, + { + "epoch": 327.48, + "learning_rate": 1.8691139240506332e-06, + "loss": 0.0, + "step": 32625 + }, + { + "epoch": 327.73, + "learning_rate": 1.8627848101265824e-06, + "loss": 0.0, + "step": 32650 + }, + { + "epoch": 327.98, + "learning_rate": 1.8564556962025319e-06, + "loss": 0.0, + "step": 32675 + }, + { + "epoch": 328.23, + "learning_rate": 1.850126582278481e-06, + "loss": 0.0, + "step": 32700 + }, + { + "epoch": 328.48, + "learning_rate": 1.8437974683544305e-06, + "loss": 0.0, + "step": 32725 + }, + { + "epoch": 328.73, + "learning_rate": 1.8374683544303797e-06, + "loss": 0.0, + "step": 32750 + }, + { + "epoch": 328.98, + "learning_rate": 1.8311392405063292e-06, + "loss": 0.0, + "step": 32775 + }, + { + "epoch": 329.23, + "learning_rate": 1.8248101265822788e-06, + "loss": 0.0, + "step": 32800 + }, + { + "epoch": 329.49, + "learning_rate": 1.818481012658228e-06, + "loss": 0.0, + "step": 32825 + }, + { + "epoch": 329.74, + "learning_rate": 1.8121518987341774e-06, + "loss": 0.0, + "step": 32850 + }, + { + "epoch": 329.99, + "learning_rate": 1.8058227848101267e-06, + "loss": 0.0, + "step": 32875 + }, + { + "epoch": 330.24, + "learning_rate": 1.799493670886076e-06, + "loss": 0.0, + "step": 32900 + }, + { + "epoch": 330.49, + "learning_rate": 1.7931645569620253e-06, + "loss": 0.0, + "step": 32925 + }, + { + "epoch": 330.74, + "learning_rate": 1.7868354430379747e-06, + "loss": 0.0, + "step": 32950 + }, + { + "epoch": 330.99, + "learning_rate": 1.7805063291139242e-06, + "loss": 0.0, + "step": 32975 + }, + { + "epoch": 331.24, + "learning_rate": 1.7741772151898736e-06, + "loss": 0.0, + "step": 33000 + }, + { + "epoch": 331.24, + "eval_loss": 0.3569923937320709, + "eval_runtime": 2780.874, + "eval_samples_per_second": 4.582, + "eval_steps_per_second": 0.287, + "eval_wer": 6.883109269970299, + "step": 33000 + }, + { + "epoch": 331.49, + "learning_rate": 1.767848101265823e-06, + "loss": 0.0, + "step": 33025 + }, + { + "epoch": 331.74, + "learning_rate": 1.7615189873417724e-06, + "loss": 0.0, + "step": 33050 + }, + { + "epoch": 331.99, + "learning_rate": 1.7551898734177217e-06, + "loss": 0.0, + "step": 33075 + }, + { + "epoch": 332.25, + "learning_rate": 1.748860759493671e-06, + "loss": 0.0, + "step": 33100 + }, + { + "epoch": 332.5, + "learning_rate": 1.7425316455696203e-06, + "loss": 0.0, + "step": 33125 + }, + { + "epoch": 332.75, + "learning_rate": 1.7362025316455697e-06, + "loss": 0.0, + "step": 33150 + }, + { + "epoch": 333.0, + "learning_rate": 1.729873417721519e-06, + "loss": 0.0, + "step": 33175 + }, + { + "epoch": 333.25, + "learning_rate": 1.7235443037974686e-06, + "loss": 0.0, + "step": 33200 + }, + { + "epoch": 333.5, + "learning_rate": 1.717215189873418e-06, + "loss": 0.0, + "step": 33225 + }, + { + "epoch": 333.75, + "learning_rate": 1.7108860759493672e-06, + "loss": 0.0, + "step": 33250 + }, + { + "epoch": 334.0, + "learning_rate": 1.7045569620253167e-06, + "loss": 0.0, + "step": 33275 + }, + { + "epoch": 334.25, + "learning_rate": 1.6982278481012659e-06, + "loss": 0.0, + "step": 33300 + }, + { + "epoch": 334.5, + "learning_rate": 1.6918987341772153e-06, + "loss": 0.0, + "step": 33325 + }, + { + "epoch": 334.76, + "learning_rate": 1.6855696202531645e-06, + "loss": 0.0, + "step": 33350 + }, + { + "epoch": 335.01, + "learning_rate": 1.679493670886076e-06, + "loss": 0.0, + "step": 33375 + }, + { + "epoch": 335.26, + "learning_rate": 1.6731645569620256e-06, + "loss": 0.0, + "step": 33400 + }, + { + "epoch": 335.51, + "learning_rate": 1.6668354430379748e-06, + "loss": 0.0, + "step": 33425 + }, + { + "epoch": 335.76, + "learning_rate": 1.6605063291139242e-06, + "loss": 0.0, + "step": 33450 + }, + { + "epoch": 336.01, + "learning_rate": 1.6541772151898735e-06, + "loss": 0.0, + "step": 33475 + }, + { + "epoch": 336.26, + "learning_rate": 1.6478481012658229e-06, + "loss": 0.0, + "step": 33500 + }, + { + "epoch": 336.51, + "learning_rate": 1.6415189873417723e-06, + "loss": 0.0, + "step": 33525 + }, + { + "epoch": 336.76, + "learning_rate": 1.6351898734177215e-06, + "loss": 0.0, + "step": 33550 + }, + { + "epoch": 337.01, + "learning_rate": 1.628860759493671e-06, + "loss": 0.0, + "step": 33575 + }, + { + "epoch": 337.26, + "learning_rate": 1.6225316455696206e-06, + "loss": 0.0, + "step": 33600 + }, + { + "epoch": 337.52, + "learning_rate": 1.6162025316455698e-06, + "loss": 0.0, + "step": 33625 + }, + { + "epoch": 337.77, + "learning_rate": 1.6098734177215192e-06, + "loss": 0.0, + "step": 33650 + }, + { + "epoch": 338.02, + "learning_rate": 1.6035443037974685e-06, + "loss": 0.0, + "step": 33675 + }, + { + "epoch": 338.27, + "learning_rate": 1.5972151898734179e-06, + "loss": 0.0, + "step": 33700 + }, + { + "epoch": 338.52, + "learning_rate": 1.590886075949367e-06, + "loss": 0.0, + "step": 33725 + }, + { + "epoch": 338.77, + "learning_rate": 1.5845569620253165e-06, + "loss": 0.0, + "step": 33750 + }, + { + "epoch": 339.02, + "learning_rate": 1.5782278481012657e-06, + "loss": 0.0, + "step": 33775 + }, + { + "epoch": 339.27, + "learning_rate": 1.5718987341772154e-06, + "loss": 0.0, + "step": 33800 + }, + { + "epoch": 339.52, + "learning_rate": 1.5655696202531648e-06, + "loss": 0.0, + "step": 33825 + }, + { + "epoch": 339.77, + "learning_rate": 1.559240506329114e-06, + "loss": 0.0, + "step": 33850 + }, + { + "epoch": 340.03, + "learning_rate": 1.5529113924050635e-06, + "loss": 0.0, + "step": 33875 + }, + { + "epoch": 340.28, + "learning_rate": 1.5465822784810127e-06, + "loss": 0.0, + "step": 33900 + }, + { + "epoch": 340.53, + "learning_rate": 1.540253164556962e-06, + "loss": 0.0, + "step": 33925 + }, + { + "epoch": 340.78, + "learning_rate": 1.5339240506329115e-06, + "loss": 0.0, + "step": 33950 + }, + { + "epoch": 341.03, + "learning_rate": 1.5275949367088607e-06, + "loss": 0.0, + "step": 33975 + }, + { + "epoch": 341.28, + "learning_rate": 1.5212658227848104e-06, + "loss": 0.0, + "step": 34000 + }, + { + "epoch": 341.28, + "eval_loss": 0.36138084530830383, + "eval_runtime": 2780.6897, + "eval_samples_per_second": 4.582, + "eval_steps_per_second": 0.287, + "eval_wer": 6.885063310926998, + "step": 34000 + }, + { + "epoch": 341.53, + "learning_rate": 1.5149367088607598e-06, + "loss": 0.0, + "step": 34025 + }, + { + "epoch": 341.78, + "learning_rate": 1.508607594936709e-06, + "loss": 0.0, + "step": 34050 + }, + { + "epoch": 342.03, + "learning_rate": 1.5022784810126585e-06, + "loss": 0.0, + "step": 34075 + }, + { + "epoch": 342.28, + "learning_rate": 1.4959493670886077e-06, + "loss": 0.0, + "step": 34100 + }, + { + "epoch": 342.53, + "learning_rate": 1.489620253164557e-06, + "loss": 0.0, + "step": 34125 + }, + { + "epoch": 342.79, + "learning_rate": 1.4832911392405063e-06, + "loss": 0.0, + "step": 34150 + }, + { + "epoch": 343.04, + "learning_rate": 1.4769620253164557e-06, + "loss": 0.0, + "step": 34175 + }, + { + "epoch": 343.29, + "learning_rate": 1.470632911392405e-06, + "loss": 0.0, + "step": 34200 + }, + { + "epoch": 343.54, + "learning_rate": 1.4643037974683546e-06, + "loss": 0.0, + "step": 34225 + }, + { + "epoch": 343.79, + "learning_rate": 1.457974683544304e-06, + "loss": 0.0, + "step": 34250 + }, + { + "epoch": 344.04, + "learning_rate": 1.4516455696202532e-06, + "loss": 0.0, + "step": 34275 + }, + { + "epoch": 344.29, + "learning_rate": 1.4453164556962027e-06, + "loss": 0.0, + "step": 34300 + }, + { + "epoch": 344.54, + "learning_rate": 1.4389873417721519e-06, + "loss": 0.0, + "step": 34325 + }, + { + "epoch": 344.79, + "learning_rate": 1.4326582278481013e-06, + "loss": 0.0, + "step": 34350 + }, + { + "epoch": 345.04, + "learning_rate": 1.4263291139240507e-06, + "loss": 0.0, + "step": 34375 + }, + { + "epoch": 345.29, + "learning_rate": 1.42e-06, + "loss": 0.0, + "step": 34400 + }, + { + "epoch": 345.55, + "learning_rate": 1.4136708860759496e-06, + "loss": 0.0, + "step": 34425 + }, + { + "epoch": 345.8, + "learning_rate": 1.407341772151899e-06, + "loss": 0.0, + "step": 34450 + }, + { + "epoch": 346.05, + "learning_rate": 1.4010126582278482e-06, + "loss": 0.0, + "step": 34475 + }, + { + "epoch": 346.3, + "learning_rate": 1.3946835443037977e-06, + "loss": 0.0, + "step": 34500 + }, + { + "epoch": 346.55, + "learning_rate": 1.3883544303797469e-06, + "loss": 0.0, + "step": 34525 + }, + { + "epoch": 346.8, + "learning_rate": 1.3820253164556963e-06, + "loss": 0.0, + "step": 34550 + }, + { + "epoch": 347.05, + "learning_rate": 1.3756962025316455e-06, + "loss": 0.0, + "step": 34575 + }, + { + "epoch": 347.3, + "learning_rate": 1.369367088607595e-06, + "loss": 0.0, + "step": 34600 + }, + { + "epoch": 347.55, + "learning_rate": 1.3630379746835446e-06, + "loss": 0.0, + "step": 34625 + }, + { + "epoch": 347.8, + "learning_rate": 1.3567088607594938e-06, + "loss": 0.0, + "step": 34650 + }, + { + "epoch": 348.06, + "learning_rate": 1.3503797468354432e-06, + "loss": 0.0, + "step": 34675 + }, + { + "epoch": 348.31, + "learning_rate": 1.3440506329113925e-06, + "loss": 0.0, + "step": 34700 + }, + { + "epoch": 348.56, + "learning_rate": 1.3377215189873419e-06, + "loss": 0.0, + "step": 34725 + }, + { + "epoch": 348.81, + "learning_rate": 1.3313924050632913e-06, + "loss": 0.0, + "step": 34750 + }, + { + "epoch": 349.06, + "learning_rate": 1.3250632911392405e-06, + "loss": 0.0, + "step": 34775 + }, + { + "epoch": 349.31, + "learning_rate": 1.31873417721519e-06, + "loss": 0.0, + "step": 34800 + }, + { + "epoch": 349.56, + "learning_rate": 1.3124050632911394e-06, + "loss": 0.0, + "step": 34825 + }, + { + "epoch": 349.81, + "learning_rate": 1.3060759493670888e-06, + "loss": 0.0, + "step": 34850 + }, + { + "epoch": 350.06, + "learning_rate": 1.2997468354430382e-06, + "loss": 0.0, + "step": 34875 + }, + { + "epoch": 350.31, + "learning_rate": 1.2934177215189875e-06, + "loss": 0.0, + "step": 34900 + }, + { + "epoch": 350.56, + "learning_rate": 1.2870886075949369e-06, + "loss": 0.0, + "step": 34925 + }, + { + "epoch": 350.82, + "learning_rate": 1.280759493670886e-06, + "loss": 0.0, + "step": 34950 + }, + { + "epoch": 351.07, + "learning_rate": 1.2744303797468355e-06, + "loss": 0.0, + "step": 34975 + }, + { + "epoch": 351.32, + "learning_rate": 1.2681012658227847e-06, + "loss": 0.0, + "step": 35000 + }, + { + "epoch": 351.32, + "eval_loss": 0.36445754766464233, + "eval_runtime": 2782.2502, + "eval_samples_per_second": 4.58, + "eval_steps_per_second": 0.286, + "eval_wer": 6.878224167578552, + "step": 35000 + }, + { + "epoch": 351.57, + "learning_rate": 1.2617721518987342e-06, + "loss": 0.0, + "step": 35025 + }, + { + "epoch": 351.82, + "learning_rate": 1.2554430379746838e-06, + "loss": 0.0, + "step": 35050 + }, + { + "epoch": 352.07, + "learning_rate": 1.249113924050633e-06, + "loss": 0.0, + "step": 35075 + }, + { + "epoch": 352.32, + "learning_rate": 1.2427848101265824e-06, + "loss": 0.0, + "step": 35100 + }, + { + "epoch": 352.57, + "learning_rate": 1.2364556962025317e-06, + "loss": 0.0, + "step": 35125 + }, + { + "epoch": 352.82, + "learning_rate": 1.230126582278481e-06, + "loss": 0.0, + "step": 35150 + }, + { + "epoch": 353.07, + "learning_rate": 1.2237974683544305e-06, + "loss": 0.0, + "step": 35175 + }, + { + "epoch": 353.32, + "learning_rate": 1.21746835443038e-06, + "loss": 0.0, + "step": 35200 + }, + { + "epoch": 353.58, + "learning_rate": 1.2111392405063292e-06, + "loss": 0.0, + "step": 35225 + }, + { + "epoch": 353.83, + "learning_rate": 1.2048101265822786e-06, + "loss": 0.0, + "step": 35250 + }, + { + "epoch": 354.08, + "learning_rate": 1.1984810126582278e-06, + "loss": 0.0, + "step": 35275 + }, + { + "epoch": 354.33, + "learning_rate": 1.1921518987341774e-06, + "loss": 0.0, + "step": 35300 + }, + { + "epoch": 354.58, + "learning_rate": 1.1858227848101267e-06, + "loss": 0.0, + "step": 35325 + }, + { + "epoch": 354.83, + "learning_rate": 1.179493670886076e-06, + "loss": 0.0, + "step": 35350 + }, + { + "epoch": 355.08, + "learning_rate": 1.1731645569620253e-06, + "loss": 0.0, + "step": 35375 + }, + { + "epoch": 355.33, + "learning_rate": 1.1668354430379747e-06, + "loss": 0.0, + "step": 35400 + }, + { + "epoch": 355.58, + "learning_rate": 1.1605063291139242e-06, + "loss": 0.0, + "step": 35425 + }, + { + "epoch": 355.83, + "learning_rate": 1.1541772151898736e-06, + "loss": 0.0, + "step": 35450 + }, + { + "epoch": 356.09, + "learning_rate": 1.1478481012658228e-06, + "loss": 0.0, + "step": 35475 + }, + { + "epoch": 356.34, + "learning_rate": 1.1415189873417722e-06, + "loss": 0.0, + "step": 35500 + }, + { + "epoch": 356.59, + "learning_rate": 1.1351898734177217e-06, + "loss": 0.0, + "step": 35525 + }, + { + "epoch": 356.84, + "learning_rate": 1.1288607594936709e-06, + "loss": 0.0, + "step": 35550 + }, + { + "epoch": 357.09, + "learning_rate": 1.1225316455696203e-06, + "loss": 0.0, + "step": 35575 + }, + { + "epoch": 357.34, + "learning_rate": 1.1162025316455697e-06, + "loss": 0.0, + "step": 35600 + }, + { + "epoch": 357.59, + "learning_rate": 1.1098734177215192e-06, + "loss": 0.0, + "step": 35625 + }, + { + "epoch": 357.84, + "learning_rate": 1.1035443037974684e-06, + "loss": 0.0, + "step": 35650 + }, + { + "epoch": 358.09, + "learning_rate": 1.0972151898734178e-06, + "loss": 0.0, + "step": 35675 + }, + { + "epoch": 358.34, + "learning_rate": 1.0908860759493672e-06, + "loss": 0.0, + "step": 35700 + }, + { + "epoch": 358.59, + "learning_rate": 1.0845569620253167e-06, + "loss": 0.0, + "step": 35725 + }, + { + "epoch": 358.85, + "learning_rate": 1.0782278481012659e-06, + "loss": 0.0, + "step": 35750 + }, + { + "epoch": 359.1, + "learning_rate": 1.0718987341772153e-06, + "loss": 0.0, + "step": 35775 + }, + { + "epoch": 359.35, + "learning_rate": 1.0655696202531647e-06, + "loss": 0.0, + "step": 35800 + }, + { + "epoch": 359.6, + "learning_rate": 1.059240506329114e-06, + "loss": 0.0, + "step": 35825 + }, + { + "epoch": 359.85, + "learning_rate": 1.0529113924050634e-06, + "loss": 0.0, + "step": 35850 + }, + { + "epoch": 360.1, + "learning_rate": 1.0465822784810128e-06, + "loss": 0.0, + "step": 35875 + }, + { + "epoch": 360.35, + "learning_rate": 1.040253164556962e-06, + "loss": 0.0, + "step": 35900 + }, + { + "epoch": 360.6, + "learning_rate": 1.0339240506329114e-06, + "loss": 0.0, + "step": 35925 + }, + { + "epoch": 360.85, + "learning_rate": 1.0275949367088609e-06, + "loss": 0.0, + "step": 35950 + }, + { + "epoch": 361.1, + "learning_rate": 1.02126582278481e-06, + "loss": 0.0, + "step": 35975 + }, + { + "epoch": 361.36, + "learning_rate": 1.0149367088607595e-06, + "loss": 0.0, + "step": 36000 + }, + { + "epoch": 361.36, + "eval_loss": 0.3663193881511688, + "eval_runtime": 2812.4519, + "eval_samples_per_second": 4.531, + "eval_steps_per_second": 0.283, + "eval_wer": 6.871385024230108, + "step": 36000 + }, + { + "epoch": 361.61, + "learning_rate": 1.008607594936709e-06, + "loss": 0.0, + "step": 36025 + }, + { + "epoch": 361.86, + "learning_rate": 1.0022784810126584e-06, + "loss": 0.0, + "step": 36050 + }, + { + "epoch": 362.11, + "learning_rate": 9.959493670886076e-07, + "loss": 0.0, + "step": 36075 + }, + { + "epoch": 362.36, + "learning_rate": 9.89620253164557e-07, + "loss": 0.0, + "step": 36100 + }, + { + "epoch": 362.61, + "learning_rate": 9.832911392405064e-07, + "loss": 0.0, + "step": 36125 + }, + { + "epoch": 362.86, + "learning_rate": 9.769620253164559e-07, + "loss": 0.0, + "step": 36150 + }, + { + "epoch": 363.11, + "learning_rate": 9.70632911392405e-07, + "loss": 0.0, + "step": 36175 + }, + { + "epoch": 363.36, + "learning_rate": 9.643037974683545e-07, + "loss": 0.0, + "step": 36200 + }, + { + "epoch": 363.61, + "learning_rate": 9.57974683544304e-07, + "loss": 0.0, + "step": 36225 + }, + { + "epoch": 363.86, + "learning_rate": 9.516455696202533e-07, + "loss": 0.0, + "step": 36250 + }, + { + "epoch": 364.12, + "learning_rate": 9.453164556962026e-07, + "loss": 0.0, + "step": 36275 + }, + { + "epoch": 364.37, + "learning_rate": 9.389873417721519e-07, + "loss": 0.0, + "step": 36300 + }, + { + "epoch": 364.62, + "learning_rate": 9.326582278481014e-07, + "loss": 0.0, + "step": 36325 + }, + { + "epoch": 364.87, + "learning_rate": 9.263291139240508e-07, + "loss": 0.0, + "step": 36350 + }, + { + "epoch": 365.12, + "learning_rate": 9.200000000000001e-07, + "loss": 0.0, + "step": 36375 + }, + { + "epoch": 365.37, + "learning_rate": 9.136708860759494e-07, + "loss": 0.0, + "step": 36400 + }, + { + "epoch": 365.62, + "learning_rate": 9.073417721518988e-07, + "loss": 0.0, + "step": 36425 + }, + { + "epoch": 365.87, + "learning_rate": 9.010126582278482e-07, + "loss": 0.0, + "step": 36450 + }, + { + "epoch": 366.12, + "learning_rate": 8.946835443037975e-07, + "loss": 0.0, + "step": 36475 + }, + { + "epoch": 366.37, + "learning_rate": 8.883544303797469e-07, + "loss": 0.0, + "step": 36500 + }, + { + "epoch": 366.62, + "learning_rate": 8.820253164556963e-07, + "loss": 0.0, + "step": 36525 + }, + { + "epoch": 366.88, + "learning_rate": 8.756962025316457e-07, + "loss": 0.0, + "step": 36550 + }, + { + "epoch": 367.13, + "learning_rate": 8.69367088607595e-07, + "loss": 0.0, + "step": 36575 + }, + { + "epoch": 367.38, + "learning_rate": 8.630379746835443e-07, + "loss": 0.0, + "step": 36600 + }, + { + "epoch": 367.63, + "learning_rate": 8.567088607594938e-07, + "loss": 0.0, + "step": 36625 + }, + { + "epoch": 367.88, + "learning_rate": 8.503797468354432e-07, + "loss": 0.0, + "step": 36650 + }, + { + "epoch": 368.13, + "learning_rate": 8.440506329113925e-07, + "loss": 0.0, + "step": 36675 + }, + { + "epoch": 368.38, + "learning_rate": 8.377215189873418e-07, + "loss": 0.0, + "step": 36700 + }, + { + "epoch": 368.63, + "learning_rate": 8.313924050632912e-07, + "loss": 0.0, + "step": 36725 + }, + { + "epoch": 368.88, + "learning_rate": 8.250632911392407e-07, + "loss": 0.0, + "step": 36750 + }, + { + "epoch": 369.13, + "learning_rate": 8.1873417721519e-07, + "loss": 0.0, + "step": 36775 + }, + { + "epoch": 369.39, + "learning_rate": 8.124050632911393e-07, + "loss": 0.0, + "step": 36800 + }, + { + "epoch": 369.64, + "learning_rate": 8.060759493670886e-07, + "loss": 0.0, + "step": 36825 + }, + { + "epoch": 369.89, + "learning_rate": 7.99746835443038e-07, + "loss": 0.0, + "step": 36850 + }, + { + "epoch": 370.14, + "learning_rate": 7.934177215189874e-07, + "loss": 0.0, + "step": 36875 + }, + { + "epoch": 370.39, + "learning_rate": 7.870886075949367e-07, + "loss": 0.0, + "step": 36900 + }, + { + "epoch": 370.64, + "learning_rate": 7.807594936708861e-07, + "loss": 0.0, + "step": 36925 + }, + { + "epoch": 370.89, + "learning_rate": 7.744303797468355e-07, + "loss": 0.0, + "step": 36950 + }, + { + "epoch": 371.14, + "learning_rate": 7.681012658227849e-07, + "loss": 0.0, + "step": 36975 + }, + { + "epoch": 371.39, + "learning_rate": 7.617721518987342e-07, + "loss": 0.0, + "step": 37000 + }, + { + "epoch": 371.39, + "eval_loss": 0.3676894009113312, + "eval_runtime": 2780.5773, + "eval_samples_per_second": 4.583, + "eval_steps_per_second": 0.287, + "eval_wer": 6.867476942316711, + "step": 37000 + }, + { + "epoch": 371.64, + "learning_rate": 7.554430379746835e-07, + "loss": 0.0, + "step": 37025 + }, + { + "epoch": 371.89, + "learning_rate": 7.49113924050633e-07, + "loss": 0.0, + "step": 37050 + }, + { + "epoch": 372.15, + "learning_rate": 7.427848101265824e-07, + "loss": 0.0, + "step": 37075 + }, + { + "epoch": 372.4, + "learning_rate": 7.364556962025317e-07, + "loss": 0.0, + "step": 37100 + }, + { + "epoch": 372.65, + "learning_rate": 7.30126582278481e-07, + "loss": 0.0, + "step": 37125 + }, + { + "epoch": 372.9, + "learning_rate": 7.237974683544304e-07, + "loss": 0.0, + "step": 37150 + }, + { + "epoch": 373.15, + "learning_rate": 7.174683544303799e-07, + "loss": 0.0, + "step": 37175 + }, + { + "epoch": 373.4, + "learning_rate": 7.111392405063292e-07, + "loss": 0.0, + "step": 37200 + }, + { + "epoch": 373.65, + "learning_rate": 7.048101265822785e-07, + "loss": 0.0, + "step": 37225 + }, + { + "epoch": 373.9, + "learning_rate": 6.984810126582279e-07, + "loss": 0.0, + "step": 37250 + }, + { + "epoch": 374.15, + "learning_rate": 6.921518987341773e-07, + "loss": 0.0, + "step": 37275 + }, + { + "epoch": 374.4, + "learning_rate": 6.858227848101266e-07, + "loss": 0.0, + "step": 37300 + }, + { + "epoch": 374.65, + "learning_rate": 6.79493670886076e-07, + "loss": 0.0, + "step": 37325 + }, + { + "epoch": 374.91, + "learning_rate": 6.731645569620254e-07, + "loss": 0.0, + "step": 37350 + }, + { + "epoch": 375.16, + "learning_rate": 6.668354430379748e-07, + "loss": 0.0, + "step": 37375 + }, + { + "epoch": 375.41, + "learning_rate": 6.605063291139241e-07, + "loss": 0.0, + "step": 37400 + }, + { + "epoch": 375.66, + "learning_rate": 6.541772151898734e-07, + "loss": 0.0, + "step": 37425 + }, + { + "epoch": 375.91, + "learning_rate": 6.478481012658229e-07, + "loss": 0.0, + "step": 37450 + }, + { + "epoch": 376.16, + "learning_rate": 6.415189873417723e-07, + "loss": 0.0, + "step": 37475 + }, + { + "epoch": 376.41, + "learning_rate": 6.351898734177216e-07, + "loss": 0.0, + "step": 37500 + }, + { + "epoch": 376.66, + "learning_rate": 6.288607594936709e-07, + "loss": 0.0, + "step": 37525 + }, + { + "epoch": 376.91, + "learning_rate": 6.225316455696203e-07, + "loss": 0.0, + "step": 37550 + }, + { + "epoch": 377.16, + "learning_rate": 6.162025316455696e-07, + "loss": 0.0, + "step": 37575 + }, + { + "epoch": 377.42, + "learning_rate": 6.098734177215191e-07, + "loss": 0.0, + "step": 37600 + }, + { + "epoch": 377.67, + "learning_rate": 6.035443037974684e-07, + "loss": 0.0, + "step": 37625 + }, + { + "epoch": 377.92, + "learning_rate": 5.972151898734177e-07, + "loss": 0.0, + "step": 37650 + }, + { + "epoch": 378.17, + "learning_rate": 5.908860759493671e-07, + "loss": 0.0, + "step": 37675 + }, + { + "epoch": 378.42, + "learning_rate": 5.845569620253165e-07, + "loss": 0.0, + "step": 37700 + }, + { + "epoch": 378.67, + "learning_rate": 5.782278481012658e-07, + "loss": 0.0, + "step": 37725 + }, + { + "epoch": 378.92, + "learning_rate": 5.718987341772152e-07, + "loss": 0.0, + "step": 37750 + }, + { + "epoch": 379.17, + "learning_rate": 5.655696202531645e-07, + "loss": 0.0, + "step": 37775 + }, + { + "epoch": 379.42, + "learning_rate": 5.59240506329114e-07, + "loss": 0.0, + "step": 37800 + }, + { + "epoch": 379.67, + "learning_rate": 5.529113924050633e-07, + "loss": 0.0, + "step": 37825 + }, + { + "epoch": 379.92, + "learning_rate": 5.465822784810127e-07, + "loss": 0.0, + "step": 37850 + }, + { + "epoch": 380.18, + "learning_rate": 5.40253164556962e-07, + "loss": 0.0, + "step": 37875 + }, + { + "epoch": 380.43, + "learning_rate": 5.339240506329115e-07, + "loss": 0.0, + "step": 37900 + }, + { + "epoch": 380.68, + "learning_rate": 5.275949367088608e-07, + "loss": 0.0, + "step": 37925 + }, + { + "epoch": 380.93, + "learning_rate": 5.212658227848102e-07, + "loss": 0.0, + "step": 37950 + }, + { + "epoch": 381.18, + "learning_rate": 5.149367088607595e-07, + "loss": 0.0, + "step": 37975 + }, + { + "epoch": 381.43, + "learning_rate": 5.08607594936709e-07, + "loss": 0.0, + "step": 38000 + }, + { + "epoch": 381.43, + "eval_loss": 0.3681415617465973, + "eval_runtime": 2779.0085, + "eval_samples_per_second": 4.585, + "eval_steps_per_second": 0.287, + "eval_wer": 6.880178208535251, + "step": 38000 + }, + { + "epoch": 381.68, + "learning_rate": 5.022784810126583e-07, + "loss": 0.0, + "step": 38025 + }, + { + "epoch": 381.93, + "learning_rate": 4.959493670886076e-07, + "loss": 0.0, + "step": 38050 + }, + { + "epoch": 382.18, + "learning_rate": 4.896202531645569e-07, + "loss": 0.0, + "step": 38075 + }, + { + "epoch": 382.43, + "learning_rate": 4.832911392405064e-07, + "loss": 0.0, + "step": 38100 + }, + { + "epoch": 382.69, + "learning_rate": 4.769620253164557e-07, + "loss": 0.0, + "step": 38125 + }, + { + "epoch": 382.94, + "learning_rate": 4.706329113924051e-07, + "loss": 0.0, + "step": 38150 + }, + { + "epoch": 383.19, + "learning_rate": 4.6430379746835443e-07, + "loss": 0.0, + "step": 38175 + }, + { + "epoch": 383.44, + "learning_rate": 4.5797468354430386e-07, + "loss": 0.0, + "step": 38200 + }, + { + "epoch": 383.69, + "learning_rate": 4.516455696202532e-07, + "loss": 0.0, + "step": 38225 + }, + { + "epoch": 383.94, + "learning_rate": 4.453164556962026e-07, + "loss": 0.0, + "step": 38250 + }, + { + "epoch": 384.19, + "learning_rate": 4.3898734177215193e-07, + "loss": 0.0, + "step": 38275 + }, + { + "epoch": 384.44, + "learning_rate": 4.326582278481013e-07, + "loss": 0.0, + "step": 38300 + }, + { + "epoch": 384.69, + "learning_rate": 4.263291139240507e-07, + "loss": 0.0, + "step": 38325 + }, + { + "epoch": 384.94, + "learning_rate": 4.2000000000000006e-07, + "loss": 0.0, + "step": 38350 + }, + { + "epoch": 385.19, + "learning_rate": 4.136708860759494e-07, + "loss": 0.0, + "step": 38375 + }, + { + "epoch": 385.45, + "learning_rate": 4.073417721518988e-07, + "loss": 0.0, + "step": 38400 + }, + { + "epoch": 385.7, + "learning_rate": 4.010126582278481e-07, + "loss": 0.0, + "step": 38425 + }, + { + "epoch": 385.95, + "learning_rate": 3.9468354430379755e-07, + "loss": 0.0, + "step": 38450 + }, + { + "epoch": 386.2, + "learning_rate": 3.883544303797469e-07, + "loss": 0.0, + "step": 38475 + }, + { + "epoch": 386.45, + "learning_rate": 3.8202531645569625e-07, + "loss": 0.0, + "step": 38500 + }, + { + "epoch": 386.7, + "learning_rate": 3.7569620253164557e-07, + "loss": 0.0, + "step": 38525 + }, + { + "epoch": 386.95, + "learning_rate": 3.69367088607595e-07, + "loss": 0.0, + "step": 38550 + }, + { + "epoch": 387.2, + "learning_rate": 3.630379746835443e-07, + "loss": 0.0, + "step": 38575 + }, + { + "epoch": 387.45, + "learning_rate": 3.5670886075949364e-07, + "loss": 0.0, + "step": 38600 + }, + { + "epoch": 387.7, + "learning_rate": 3.5037974683544307e-07, + "loss": 0.0, + "step": 38625 + }, + { + "epoch": 387.95, + "learning_rate": 3.440506329113924e-07, + "loss": 0.0, + "step": 38650 + }, + { + "epoch": 388.21, + "learning_rate": 3.377215189873418e-07, + "loss": 0.0, + "step": 38675 + }, + { + "epoch": 388.46, + "learning_rate": 3.3139240506329114e-07, + "loss": 0.0, + "step": 38700 + }, + { + "epoch": 388.71, + "learning_rate": 3.250632911392405e-07, + "loss": 0.0, + "step": 38725 + }, + { + "epoch": 388.96, + "learning_rate": 3.187341772151899e-07, + "loss": 0.0, + "step": 38750 + }, + { + "epoch": 389.21, + "learning_rate": 3.1240506329113927e-07, + "loss": 0.0, + "step": 38775 + }, + { + "epoch": 389.46, + "learning_rate": 3.0607594936708864e-07, + "loss": 0.0, + "step": 38800 + }, + { + "epoch": 389.71, + "learning_rate": 2.99746835443038e-07, + "loss": 0.0, + "step": 38825 + }, + { + "epoch": 389.96, + "learning_rate": 2.934177215189874e-07, + "loss": 0.0, + "step": 38850 + }, + { + "epoch": 390.21, + "learning_rate": 2.8708860759493677e-07, + "loss": 0.0, + "step": 38875 + }, + { + "epoch": 390.46, + "learning_rate": 2.807594936708861e-07, + "loss": 0.0, + "step": 38900 + }, + { + "epoch": 390.72, + "learning_rate": 2.7443037974683546e-07, + "loss": 0.0, + "step": 38925 + }, + { + "epoch": 390.97, + "learning_rate": 2.6810126582278484e-07, + "loss": 0.0, + "step": 38950 + }, + { + "epoch": 391.22, + "learning_rate": 2.617721518987342e-07, + "loss": 0.0, + "step": 38975 + }, + { + "epoch": 391.47, + "learning_rate": 2.554430379746836e-07, + "loss": 0.0, + "step": 39000 + }, + { + "epoch": 391.47, + "eval_loss": 0.36862120032310486, + "eval_runtime": 2786.3432, + "eval_samples_per_second": 4.573, + "eval_steps_per_second": 0.286, + "eval_wer": 6.887994372362044, + "step": 39000 + }, + { + "epoch": 391.72, + "learning_rate": 2.491139240506329e-07, + "loss": 0.0, + "step": 39025 + }, + { + "epoch": 391.97, + "learning_rate": 2.427848101265823e-07, + "loss": 0.0, + "step": 39050 + }, + { + "epoch": 392.22, + "learning_rate": 2.3645569620253166e-07, + "loss": 0.0, + "step": 39075 + }, + { + "epoch": 392.47, + "learning_rate": 2.30126582278481e-07, + "loss": 0.0, + "step": 39100 + }, + { + "epoch": 392.72, + "learning_rate": 2.2379746835443038e-07, + "loss": 0.0, + "step": 39125 + }, + { + "epoch": 392.97, + "learning_rate": 2.1746835443037976e-07, + "loss": 0.0, + "step": 39150 + }, + { + "epoch": 393.22, + "learning_rate": 2.1113924050632913e-07, + "loss": 0.0, + "step": 39175 + }, + { + "epoch": 393.48, + "learning_rate": 2.0481012658227848e-07, + "loss": 0.0, + "step": 39200 + }, + { + "epoch": 393.73, + "learning_rate": 1.9848101265822785e-07, + "loss": 0.0, + "step": 39225 + }, + { + "epoch": 393.98, + "learning_rate": 1.9215189873417723e-07, + "loss": 0.0, + "step": 39250 + }, + { + "epoch": 394.23, + "learning_rate": 1.858227848101266e-07, + "loss": 0.0, + "step": 39275 + }, + { + "epoch": 394.48, + "learning_rate": 1.7949367088607595e-07, + "loss": 0.0, + "step": 39300 + }, + { + "epoch": 394.73, + "learning_rate": 1.7316455696202533e-07, + "loss": 0.0, + "step": 39325 + }, + { + "epoch": 394.98, + "learning_rate": 1.668354430379747e-07, + "loss": 0.0, + "step": 39350 + }, + { + "epoch": 395.23, + "learning_rate": 1.6050632911392405e-07, + "loss": 0.0, + "step": 39375 + }, + { + "epoch": 395.48, + "learning_rate": 1.5417721518987342e-07, + "loss": 0.0, + "step": 39400 + }, + { + "epoch": 395.73, + "learning_rate": 1.4810126582278482e-07, + "loss": 0.0, + "step": 39425 + }, + { + "epoch": 395.98, + "learning_rate": 1.417721518987342e-07, + "loss": 0.0, + "step": 39450 + }, + { + "epoch": 396.24, + "learning_rate": 1.3544303797468354e-07, + "loss": 0.0, + "step": 39475 + }, + { + "epoch": 396.49, + "learning_rate": 1.2911392405063292e-07, + "loss": 0.0, + "step": 39500 + }, + { + "epoch": 396.74, + "learning_rate": 1.227848101265823e-07, + "loss": 0.0, + "step": 39525 + }, + { + "epoch": 396.99, + "learning_rate": 1.1645569620253166e-07, + "loss": 0.0, + "step": 39550 + }, + { + "epoch": 397.24, + "learning_rate": 1.1012658227848102e-07, + "loss": 0.0, + "step": 39575 + }, + { + "epoch": 397.49, + "learning_rate": 1.0379746835443039e-07, + "loss": 0.0, + "step": 39600 + }, + { + "epoch": 397.74, + "learning_rate": 9.746835443037975e-08, + "loss": 0.0, + "step": 39625 + }, + { + "epoch": 397.99, + "learning_rate": 9.113924050632913e-08, + "loss": 0.0, + "step": 39650 + }, + { + "epoch": 398.24, + "learning_rate": 8.481012658227849e-08, + "loss": 0.0, + "step": 39675 + }, + { + "epoch": 398.49, + "learning_rate": 7.848101265822786e-08, + "loss": 0.0, + "step": 39700 + }, + { + "epoch": 398.75, + "learning_rate": 7.215189873417721e-08, + "loss": 0.0, + "step": 39725 + }, + { + "epoch": 399.0, + "learning_rate": 6.582278481012659e-08, + "loss": 0.0, + "step": 39750 + }, + { + "epoch": 399.25, + "learning_rate": 5.9493670886075955e-08, + "loss": 0.0, + "step": 39775 + }, + { + "epoch": 399.5, + "learning_rate": 5.3164556962025324e-08, + "loss": 0.0, + "step": 39800 + }, + { + "epoch": 399.75, + "learning_rate": 4.683544303797469e-08, + "loss": 0.0, + "step": 39825 + }, + { + "epoch": 400.0, + "learning_rate": 4.050632911392405e-08, + "loss": 0.0, + "step": 39850 + }, + { + "epoch": 400.25, + "learning_rate": 3.417721518987342e-08, + "loss": 0.0, + "step": 39875 + }, + { + "epoch": 400.5, + "learning_rate": 2.7848101265822786e-08, + "loss": 0.0, + "step": 39900 + }, + { + "epoch": 400.75, + "learning_rate": 2.1518987341772154e-08, + "loss": 0.0, + "step": 39925 + }, + { + "epoch": 401.0, + "learning_rate": 1.518987341772152e-08, + "loss": 0.0, + "step": 39950 + }, + { + "epoch": 401.25, + "learning_rate": 8.860759493670887e-09, + "loss": 0.0, + "step": 39975 + }, + { + "epoch": 401.51, + "learning_rate": 2.5316455696202533e-09, + "loss": 0.0, + "step": 40000 + }, + { + "epoch": 401.51, + "eval_loss": 0.36875849962234497, + "eval_runtime": 2798.7548, + "eval_samples_per_second": 4.553, + "eval_steps_per_second": 0.285, + "eval_wer": 6.887994372362044, + "step": 40000 + }, + { + "epoch": 401.51, + "step": 40000, + "total_flos": 3.476313472275579e+22, + "train_loss": 0.003312818900368211, + "train_runtime": 987758.8877, + "train_samples_per_second": 10.367, + "train_steps_per_second": 0.04 + } + ], + "logging_steps": 25, + "max_steps": 40000, + "num_input_tokens_seen": 0, + "num_train_epochs": 405, + "save_steps": 1000, + "total_flos": 3.476313472275579e+22, + "train_batch_size": 32, + "trial_name": null, + "trial_params": null +}