diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,12210 @@ +{ + "best_metric": 27.969339566672204, + "best_model_checkpoint": "./hamsa-tiny-pretrained/checkpoint-42500", + "epoch": 2.004972331381827, + "eval_steps": 2500, + "global_step": 50000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 3.8e-07, + "loss": 12.4564, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 8.8e-07, + "loss": 10.7741, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 1.3800000000000001e-06, + "loss": 6.9302, + "step": 75 + }, + { + "epoch": 0.0, + "learning_rate": 1.8800000000000002e-06, + "loss": 4.7429, + "step": 100 + }, + { + "epoch": 0.01, + "learning_rate": 2.38e-06, + "loss": 4.1009, + "step": 125 + }, + { + "epoch": 0.01, + "learning_rate": 2.88e-06, + "loss": 3.7125, + "step": 150 + }, + { + "epoch": 0.01, + "learning_rate": 3.3800000000000007e-06, + "loss": 3.5459, + "step": 175 + }, + { + "epoch": 0.01, + "learning_rate": 3.88e-06, + "loss": 3.4287, + "step": 200 + }, + { + "epoch": 0.01, + "learning_rate": 4.38e-06, + "loss": 3.3747, + "step": 225 + }, + { + "epoch": 0.01, + "learning_rate": 4.880000000000001e-06, + "loss": 3.3327, + "step": 250 + }, + { + "epoch": 0.01, + "learning_rate": 5.380000000000001e-06, + "loss": 3.2979, + "step": 275 + }, + { + "epoch": 0.01, + "learning_rate": 5.8800000000000005e-06, + "loss": 3.2587, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 6.380000000000001e-06, + "loss": 3.2244, + "step": 325 + }, + { + "epoch": 0.01, + "learning_rate": 6.88e-06, + "loss": 3.1921, + "step": 350 + }, + { + "epoch": 0.02, + "learning_rate": 7.3800000000000005e-06, + "loss": 3.174, + "step": 375 + }, + { + "epoch": 0.02, + "learning_rate": 7.88e-06, + "loss": 3.1549, + "step": 400 + }, + { + "epoch": 0.02, + "learning_rate": 8.380000000000001e-06, + "loss": 3.1301, + "step": 425 + }, + { + "epoch": 0.02, + "learning_rate": 8.880000000000001e-06, + "loss": 3.087, + "step": 450 + }, + { + "epoch": 0.02, + "learning_rate": 9.38e-06, + "loss": 3.0892, + "step": 475 + }, + { + "epoch": 0.02, + "learning_rate": 9.88e-06, + "loss": 3.0683, + "step": 500 + }, + { + "epoch": 0.02, + "learning_rate": 9.996161616161618e-06, + "loss": 3.0525, + "step": 525 + }, + { + "epoch": 0.02, + "learning_rate": 9.991111111111112e-06, + "loss": 3.0249, + "step": 550 + }, + { + "epoch": 0.02, + "learning_rate": 9.986060606060606e-06, + "loss": 3.0031, + "step": 575 + }, + { + "epoch": 0.02, + "learning_rate": 9.981010101010102e-06, + "loss": 2.9919, + "step": 600 + }, + { + "epoch": 0.03, + "learning_rate": 9.975959595959597e-06, + "loss": 2.9719, + "step": 625 + }, + { + "epoch": 0.03, + "learning_rate": 9.970909090909093e-06, + "loss": 2.9604, + "step": 650 + }, + { + "epoch": 0.03, + "learning_rate": 9.965858585858587e-06, + "loss": 2.9554, + "step": 675 + }, + { + "epoch": 0.03, + "learning_rate": 9.960808080808081e-06, + "loss": 2.92, + "step": 700 + }, + { + "epoch": 0.03, + "learning_rate": 9.955757575757576e-06, + "loss": 2.8839, + "step": 725 + }, + { + "epoch": 0.03, + "learning_rate": 9.950707070707072e-06, + "loss": 2.8838, + "step": 750 + }, + { + "epoch": 0.03, + "learning_rate": 9.945656565656566e-06, + "loss": 2.8339, + "step": 775 + }, + { + "epoch": 0.03, + "learning_rate": 9.940606060606062e-06, + "loss": 2.3913, + "step": 800 + }, + { + "epoch": 0.03, + "learning_rate": 9.935555555555556e-06, + "loss": 1.4371, + "step": 825 + }, + { + "epoch": 0.03, + "learning_rate": 9.930505050505052e-06, + "loss": 1.1851, + "step": 850 + }, + { + "epoch": 0.04, + "learning_rate": 9.925454545454547e-06, + "loss": 1.0894, + "step": 875 + }, + { + "epoch": 0.04, + "learning_rate": 9.92040404040404e-06, + "loss": 1.0265, + "step": 900 + }, + { + "epoch": 0.04, + "learning_rate": 9.915353535353535e-06, + "loss": 0.9688, + "step": 925 + }, + { + "epoch": 0.04, + "learning_rate": 9.910303030303031e-06, + "loss": 0.943, + "step": 950 + }, + { + "epoch": 0.04, + "learning_rate": 9.905252525252525e-06, + "loss": 0.9323, + "step": 975 + }, + { + "epoch": 0.04, + "learning_rate": 9.900202020202021e-06, + "loss": 0.9253, + "step": 1000 + }, + { + "epoch": 0.04, + "learning_rate": 9.895151515151516e-06, + "loss": 0.9364, + "step": 1025 + }, + { + "epoch": 0.04, + "learning_rate": 9.890101010101012e-06, + "loss": 0.877, + "step": 1050 + }, + { + "epoch": 0.04, + "learning_rate": 9.885050505050506e-06, + "loss": 0.8555, + "step": 1075 + }, + { + "epoch": 0.04, + "learning_rate": 9.88e-06, + "loss": 0.8677, + "step": 1100 + }, + { + "epoch": 0.05, + "learning_rate": 9.874949494949496e-06, + "loss": 0.8478, + "step": 1125 + }, + { + "epoch": 0.05, + "learning_rate": 9.86989898989899e-06, + "loss": 0.8226, + "step": 1150 + }, + { + "epoch": 0.05, + "learning_rate": 9.864848484848487e-06, + "loss": 0.8557, + "step": 1175 + }, + { + "epoch": 0.05, + "learning_rate": 9.85979797979798e-06, + "loss": 0.8147, + "step": 1200 + }, + { + "epoch": 0.05, + "learning_rate": 9.854747474747475e-06, + "loss": 0.8105, + "step": 1225 + }, + { + "epoch": 0.05, + "learning_rate": 9.84969696969697e-06, + "loss": 0.8112, + "step": 1250 + }, + { + "epoch": 0.05, + "learning_rate": 9.844646464646465e-06, + "loss": 0.8025, + "step": 1275 + }, + { + "epoch": 0.05, + "learning_rate": 9.83959595959596e-06, + "loss": 0.7667, + "step": 1300 + }, + { + "epoch": 0.05, + "learning_rate": 9.834545454545456e-06, + "loss": 0.7569, + "step": 1325 + }, + { + "epoch": 0.05, + "learning_rate": 9.82949494949495e-06, + "loss": 0.7895, + "step": 1350 + }, + { + "epoch": 0.06, + "learning_rate": 9.824444444444446e-06, + "loss": 0.7617, + "step": 1375 + }, + { + "epoch": 0.06, + "learning_rate": 9.81939393939394e-06, + "loss": 0.7461, + "step": 1400 + }, + { + "epoch": 0.06, + "learning_rate": 9.814343434343435e-06, + "loss": 0.7571, + "step": 1425 + }, + { + "epoch": 0.06, + "learning_rate": 9.80929292929293e-06, + "loss": 0.7505, + "step": 1450 + }, + { + "epoch": 0.06, + "learning_rate": 9.804242424242425e-06, + "loss": 0.7264, + "step": 1475 + }, + { + "epoch": 0.06, + "learning_rate": 9.799191919191921e-06, + "loss": 0.7555, + "step": 1500 + }, + { + "epoch": 0.06, + "learning_rate": 9.794141414141415e-06, + "loss": 0.7307, + "step": 1525 + }, + { + "epoch": 0.06, + "learning_rate": 9.78909090909091e-06, + "loss": 0.7414, + "step": 1550 + }, + { + "epoch": 0.06, + "learning_rate": 9.784040404040405e-06, + "loss": 0.7407, + "step": 1575 + }, + { + "epoch": 0.06, + "learning_rate": 9.7789898989899e-06, + "loss": 0.7128, + "step": 1600 + }, + { + "epoch": 0.07, + "learning_rate": 9.773939393939394e-06, + "loss": 0.7091, + "step": 1625 + }, + { + "epoch": 0.07, + "learning_rate": 9.76888888888889e-06, + "loss": 0.7166, + "step": 1650 + }, + { + "epoch": 0.07, + "learning_rate": 9.763838383838384e-06, + "loss": 0.7312, + "step": 1675 + }, + { + "epoch": 0.07, + "learning_rate": 9.75878787878788e-06, + "loss": 0.702, + "step": 1700 + }, + { + "epoch": 0.07, + "learning_rate": 9.753737373737375e-06, + "loss": 0.6995, + "step": 1725 + }, + { + "epoch": 0.07, + "learning_rate": 9.748686868686869e-06, + "loss": 0.7129, + "step": 1750 + }, + { + "epoch": 0.07, + "learning_rate": 9.743636363636363e-06, + "loss": 0.7034, + "step": 1775 + }, + { + "epoch": 0.07, + "learning_rate": 9.73858585858586e-06, + "loss": 0.7077, + "step": 1800 + }, + { + "epoch": 0.07, + "learning_rate": 9.733535353535353e-06, + "loss": 0.7103, + "step": 1825 + }, + { + "epoch": 0.07, + "learning_rate": 9.72848484848485e-06, + "loss": 0.6812, + "step": 1850 + }, + { + "epoch": 0.08, + "learning_rate": 9.723434343434345e-06, + "loss": 0.6833, + "step": 1875 + }, + { + "epoch": 0.08, + "learning_rate": 9.71838383838384e-06, + "loss": 0.7074, + "step": 1900 + }, + { + "epoch": 0.08, + "learning_rate": 9.713333333333334e-06, + "loss": 0.6759, + "step": 1925 + }, + { + "epoch": 0.08, + "learning_rate": 9.708282828282828e-06, + "loss": 0.6769, + "step": 1950 + }, + { + "epoch": 0.08, + "learning_rate": 9.703232323232324e-06, + "loss": 0.6499, + "step": 1975 + }, + { + "epoch": 0.08, + "learning_rate": 9.698181818181819e-06, + "loss": 0.671, + "step": 2000 + }, + { + "epoch": 0.08, + "learning_rate": 9.693131313131315e-06, + "loss": 0.6632, + "step": 2025 + }, + { + "epoch": 0.08, + "learning_rate": 9.688080808080809e-06, + "loss": 0.6818, + "step": 2050 + }, + { + "epoch": 0.08, + "learning_rate": 9.683030303030305e-06, + "loss": 0.655, + "step": 2075 + }, + { + "epoch": 0.08, + "learning_rate": 9.6779797979798e-06, + "loss": 0.6762, + "step": 2100 + }, + { + "epoch": 0.09, + "learning_rate": 9.672929292929294e-06, + "loss": 0.6799, + "step": 2125 + }, + { + "epoch": 0.09, + "learning_rate": 9.667878787878788e-06, + "loss": 0.6555, + "step": 2150 + }, + { + "epoch": 0.09, + "learning_rate": 9.662828282828284e-06, + "loss": 0.6549, + "step": 2175 + }, + { + "epoch": 0.09, + "learning_rate": 9.657777777777778e-06, + "loss": 0.665, + "step": 2200 + }, + { + "epoch": 0.09, + "learning_rate": 9.652727272727274e-06, + "loss": 0.6663, + "step": 2225 + }, + { + "epoch": 0.09, + "learning_rate": 9.647676767676768e-06, + "loss": 0.6383, + "step": 2250 + }, + { + "epoch": 0.09, + "learning_rate": 9.642626262626263e-06, + "loss": 0.6426, + "step": 2275 + }, + { + "epoch": 0.09, + "learning_rate": 9.637575757575759e-06, + "loss": 0.6448, + "step": 2300 + }, + { + "epoch": 0.09, + "learning_rate": 9.632525252525253e-06, + "loss": 0.6444, + "step": 2325 + }, + { + "epoch": 0.09, + "learning_rate": 9.627474747474749e-06, + "loss": 0.6468, + "step": 2350 + }, + { + "epoch": 0.1, + "learning_rate": 9.622424242424243e-06, + "loss": 0.659, + "step": 2375 + }, + { + "epoch": 0.1, + "learning_rate": 9.61737373737374e-06, + "loss": 0.6481, + "step": 2400 + }, + { + "epoch": 0.1, + "learning_rate": 9.612323232323234e-06, + "loss": 0.6516, + "step": 2425 + }, + { + "epoch": 0.1, + "learning_rate": 9.607272727272728e-06, + "loss": 0.6222, + "step": 2450 + }, + { + "epoch": 0.1, + "learning_rate": 9.602222222222222e-06, + "loss": 0.672, + "step": 2475 + }, + { + "epoch": 0.1, + "learning_rate": 9.597171717171718e-06, + "loss": 0.6597, + "step": 2500 + }, + { + "epoch": 0.1, + "eval_loss": 0.6394317150115967, + "eval_runtime": 334.7136, + "eval_samples_per_second": 14.953, + "eval_steps_per_second": 1.87, + "eval_wer": 48.83836825743373, + "step": 2500 + }, + { + "epoch": 0.1, + "learning_rate": 9.592121212121212e-06, + "loss": 0.633, + "step": 2525 + }, + { + "epoch": 0.1, + "learning_rate": 9.587070707070708e-06, + "loss": 0.6082, + "step": 2550 + }, + { + "epoch": 0.1, + "learning_rate": 9.582020202020203e-06, + "loss": 0.6322, + "step": 2575 + }, + { + "epoch": 0.1, + "learning_rate": 9.576969696969699e-06, + "loss": 0.6516, + "step": 2600 + }, + { + "epoch": 0.11, + "learning_rate": 9.571919191919193e-06, + "loss": 0.637, + "step": 2625 + }, + { + "epoch": 0.11, + "learning_rate": 9.566868686868687e-06, + "loss": 0.6358, + "step": 2650 + }, + { + "epoch": 0.11, + "learning_rate": 9.561818181818182e-06, + "loss": 0.6416, + "step": 2675 + }, + { + "epoch": 0.11, + "learning_rate": 9.556767676767678e-06, + "loss": 0.6102, + "step": 2700 + }, + { + "epoch": 0.11, + "learning_rate": 9.551717171717174e-06, + "loss": 0.6196, + "step": 2725 + }, + { + "epoch": 0.11, + "learning_rate": 9.546666666666668e-06, + "loss": 0.6398, + "step": 2750 + }, + { + "epoch": 0.11, + "learning_rate": 9.541616161616162e-06, + "loss": 0.6186, + "step": 2775 + }, + { + "epoch": 0.11, + "learning_rate": 9.536565656565656e-06, + "loss": 0.618, + "step": 2800 + }, + { + "epoch": 0.11, + "learning_rate": 9.531515151515152e-06, + "loss": 0.622, + "step": 2825 + }, + { + "epoch": 0.11, + "learning_rate": 9.526464646464647e-06, + "loss": 0.6157, + "step": 2850 + }, + { + "epoch": 0.12, + "learning_rate": 9.521414141414143e-06, + "loss": 0.6351, + "step": 2875 + }, + { + "epoch": 0.12, + "learning_rate": 9.516363636363637e-06, + "loss": 0.6265, + "step": 2900 + }, + { + "epoch": 0.12, + "learning_rate": 9.511313131313133e-06, + "loss": 0.6202, + "step": 2925 + }, + { + "epoch": 0.12, + "learning_rate": 9.506262626262627e-06, + "loss": 0.5981, + "step": 2950 + }, + { + "epoch": 0.12, + "learning_rate": 9.501212121212122e-06, + "loss": 0.5991, + "step": 2975 + }, + { + "epoch": 0.12, + "learning_rate": 9.496161616161616e-06, + "loss": 0.5855, + "step": 3000 + }, + { + "epoch": 0.12, + "learning_rate": 9.491111111111112e-06, + "loss": 0.6107, + "step": 3025 + }, + { + "epoch": 0.12, + "learning_rate": 9.486060606060606e-06, + "loss": 0.5846, + "step": 3050 + }, + { + "epoch": 0.12, + "learning_rate": 9.481010101010102e-06, + "loss": 0.5985, + "step": 3075 + }, + { + "epoch": 0.12, + "learning_rate": 9.475959595959596e-06, + "loss": 0.6231, + "step": 3100 + }, + { + "epoch": 0.13, + "learning_rate": 9.470909090909092e-06, + "loss": 0.5999, + "step": 3125 + }, + { + "epoch": 0.13, + "learning_rate": 9.465858585858587e-06, + "loss": 0.5851, + "step": 3150 + }, + { + "epoch": 0.13, + "learning_rate": 9.460808080808081e-06, + "loss": 0.6101, + "step": 3175 + }, + { + "epoch": 0.13, + "learning_rate": 9.455757575757577e-06, + "loss": 0.6155, + "step": 3200 + }, + { + "epoch": 0.13, + "learning_rate": 9.450707070707071e-06, + "loss": 0.617, + "step": 3225 + }, + { + "epoch": 0.13, + "learning_rate": 9.445656565656567e-06, + "loss": 0.5908, + "step": 3250 + }, + { + "epoch": 0.13, + "learning_rate": 9.440606060606062e-06, + "loss": 0.5898, + "step": 3275 + }, + { + "epoch": 0.13, + "learning_rate": 9.435555555555556e-06, + "loss": 0.5761, + "step": 3300 + }, + { + "epoch": 0.13, + "learning_rate": 9.43050505050505e-06, + "loss": 0.6068, + "step": 3325 + }, + { + "epoch": 0.13, + "learning_rate": 9.425454545454546e-06, + "loss": 0.6193, + "step": 3350 + }, + { + "epoch": 0.14, + "learning_rate": 9.42040404040404e-06, + "loss": 0.5659, + "step": 3375 + }, + { + "epoch": 0.14, + "learning_rate": 9.415353535353537e-06, + "loss": 0.5706, + "step": 3400 + }, + { + "epoch": 0.14, + "learning_rate": 9.41030303030303e-06, + "loss": 0.5881, + "step": 3425 + }, + { + "epoch": 0.14, + "learning_rate": 9.405252525252527e-06, + "loss": 0.587, + "step": 3450 + }, + { + "epoch": 0.14, + "learning_rate": 9.400202020202021e-06, + "loss": 0.5999, + "step": 3475 + }, + { + "epoch": 0.14, + "learning_rate": 9.395151515151515e-06, + "loss": 0.5927, + "step": 3500 + }, + { + "epoch": 0.14, + "learning_rate": 9.39010101010101e-06, + "loss": 0.57, + "step": 3525 + }, + { + "epoch": 0.14, + "learning_rate": 9.385050505050506e-06, + "loss": 0.5748, + "step": 3550 + }, + { + "epoch": 0.14, + "learning_rate": 9.38e-06, + "loss": 0.5901, + "step": 3575 + }, + { + "epoch": 0.14, + "learning_rate": 9.374949494949496e-06, + "loss": 0.5614, + "step": 3600 + }, + { + "epoch": 0.15, + "learning_rate": 9.369898989898992e-06, + "loss": 0.5811, + "step": 3625 + }, + { + "epoch": 0.15, + "learning_rate": 9.364848484848486e-06, + "loss": 0.5777, + "step": 3650 + }, + { + "epoch": 0.15, + "learning_rate": 9.35979797979798e-06, + "loss": 0.595, + "step": 3675 + }, + { + "epoch": 0.15, + "learning_rate": 9.354747474747475e-06, + "loss": 0.5798, + "step": 3700 + }, + { + "epoch": 0.15, + "learning_rate": 9.34969696969697e-06, + "loss": 0.5856, + "step": 3725 + }, + { + "epoch": 0.15, + "learning_rate": 9.344646464646465e-06, + "loss": 0.5863, + "step": 3750 + }, + { + "epoch": 0.15, + "learning_rate": 9.339595959595961e-06, + "loss": 0.5817, + "step": 3775 + }, + { + "epoch": 0.15, + "learning_rate": 9.334545454545455e-06, + "loss": 0.5943, + "step": 3800 + }, + { + "epoch": 0.15, + "learning_rate": 9.32949494949495e-06, + "loss": 0.56, + "step": 3825 + }, + { + "epoch": 0.15, + "learning_rate": 9.324444444444444e-06, + "loss": 0.573, + "step": 3850 + }, + { + "epoch": 0.16, + "learning_rate": 9.31939393939394e-06, + "loss": 0.5525, + "step": 3875 + }, + { + "epoch": 0.16, + "learning_rate": 9.314343434343434e-06, + "loss": 0.6028, + "step": 3900 + }, + { + "epoch": 0.16, + "learning_rate": 9.30929292929293e-06, + "loss": 0.5804, + "step": 3925 + }, + { + "epoch": 0.16, + "learning_rate": 9.304242424242425e-06, + "loss": 0.5647, + "step": 3950 + }, + { + "epoch": 0.16, + "learning_rate": 9.29919191919192e-06, + "loss": 0.5758, + "step": 3975 + }, + { + "epoch": 0.16, + "learning_rate": 9.294141414141415e-06, + "loss": 0.5667, + "step": 4000 + }, + { + "epoch": 0.16, + "learning_rate": 9.28909090909091e-06, + "loss": 0.558, + "step": 4025 + }, + { + "epoch": 0.16, + "learning_rate": 9.284040404040405e-06, + "loss": 0.5671, + "step": 4050 + }, + { + "epoch": 0.16, + "learning_rate": 9.2789898989899e-06, + "loss": 0.5421, + "step": 4075 + }, + { + "epoch": 0.16, + "learning_rate": 9.273939393939395e-06, + "loss": 0.551, + "step": 4100 + }, + { + "epoch": 0.17, + "learning_rate": 9.26888888888889e-06, + "loss": 0.5646, + "step": 4125 + }, + { + "epoch": 0.17, + "learning_rate": 9.263838383838386e-06, + "loss": 0.5756, + "step": 4150 + }, + { + "epoch": 0.17, + "learning_rate": 9.25878787878788e-06, + "loss": 0.5527, + "step": 4175 + }, + { + "epoch": 0.17, + "learning_rate": 9.253737373737374e-06, + "loss": 0.5491, + "step": 4200 + }, + { + "epoch": 0.17, + "learning_rate": 9.248686868686869e-06, + "loss": 0.5713, + "step": 4225 + }, + { + "epoch": 0.17, + "learning_rate": 9.243636363636365e-06, + "loss": 0.5914, + "step": 4250 + }, + { + "epoch": 0.17, + "learning_rate": 9.238585858585859e-06, + "loss": 0.5546, + "step": 4275 + }, + { + "epoch": 0.17, + "learning_rate": 9.233535353535355e-06, + "loss": 0.5616, + "step": 4300 + }, + { + "epoch": 0.17, + "learning_rate": 9.22848484848485e-06, + "loss": 0.5532, + "step": 4325 + }, + { + "epoch": 0.17, + "learning_rate": 9.223434343434343e-06, + "loss": 0.5596, + "step": 4350 + }, + { + "epoch": 0.18, + "learning_rate": 9.21838383838384e-06, + "loss": 0.5584, + "step": 4375 + }, + { + "epoch": 0.18, + "learning_rate": 9.213333333333334e-06, + "loss": 0.5418, + "step": 4400 + }, + { + "epoch": 0.18, + "learning_rate": 9.208282828282828e-06, + "loss": 0.5438, + "step": 4425 + }, + { + "epoch": 0.18, + "learning_rate": 9.203232323232324e-06, + "loss": 0.5684, + "step": 4450 + }, + { + "epoch": 0.18, + "learning_rate": 9.19818181818182e-06, + "loss": 0.5224, + "step": 4475 + }, + { + "epoch": 0.18, + "learning_rate": 9.193131313131314e-06, + "loss": 0.5501, + "step": 4500 + }, + { + "epoch": 0.18, + "learning_rate": 9.188080808080809e-06, + "loss": 0.5429, + "step": 4525 + }, + { + "epoch": 0.18, + "learning_rate": 9.183030303030303e-06, + "loss": 0.5529, + "step": 4550 + }, + { + "epoch": 0.18, + "learning_rate": 9.177979797979799e-06, + "loss": 0.5694, + "step": 4575 + }, + { + "epoch": 0.18, + "learning_rate": 9.172929292929293e-06, + "loss": 0.5494, + "step": 4600 + }, + { + "epoch": 0.19, + "learning_rate": 9.16787878787879e-06, + "loss": 0.5686, + "step": 4625 + }, + { + "epoch": 0.19, + "learning_rate": 9.162828282828284e-06, + "loss": 0.5311, + "step": 4650 + }, + { + "epoch": 0.19, + "learning_rate": 9.15777777777778e-06, + "loss": 0.5439, + "step": 4675 + }, + { + "epoch": 0.19, + "learning_rate": 9.152727272727274e-06, + "loss": 0.5351, + "step": 4700 + }, + { + "epoch": 0.19, + "learning_rate": 9.147676767676768e-06, + "loss": 0.5438, + "step": 4725 + }, + { + "epoch": 0.19, + "learning_rate": 9.142626262626262e-06, + "loss": 0.5627, + "step": 4750 + }, + { + "epoch": 0.19, + "learning_rate": 9.137575757575758e-06, + "loss": 0.5443, + "step": 4775 + }, + { + "epoch": 0.19, + "learning_rate": 9.132525252525253e-06, + "loss": 0.5367, + "step": 4800 + }, + { + "epoch": 0.19, + "learning_rate": 9.127474747474749e-06, + "loss": 0.5256, + "step": 4825 + }, + { + "epoch": 0.19, + "learning_rate": 9.122424242424243e-06, + "loss": 0.5447, + "step": 4850 + }, + { + "epoch": 0.2, + "learning_rate": 9.117373737373737e-06, + "loss": 0.5295, + "step": 4875 + }, + { + "epoch": 0.2, + "learning_rate": 9.112323232323233e-06, + "loss": 0.5365, + "step": 4900 + }, + { + "epoch": 0.2, + "learning_rate": 9.107272727272728e-06, + "loss": 0.5309, + "step": 4925 + }, + { + "epoch": 0.2, + "learning_rate": 9.102222222222224e-06, + "loss": 0.5223, + "step": 4950 + }, + { + "epoch": 0.2, + "learning_rate": 9.097171717171718e-06, + "loss": 0.536, + "step": 4975 + }, + { + "epoch": 0.2, + "learning_rate": 9.092121212121214e-06, + "loss": 0.5442, + "step": 5000 + }, + { + "epoch": 0.2, + "eval_loss": 0.5454992055892944, + "eval_runtime": 329.8023, + "eval_samples_per_second": 15.176, + "eval_steps_per_second": 1.898, + "eval_wer": 41.85433921070742, + "step": 5000 + }, + { + "epoch": 0.2, + "learning_rate": 9.087070707070708e-06, + "loss": 0.5432, + "step": 5025 + }, + { + "epoch": 0.2, + "learning_rate": 9.082020202020202e-06, + "loss": 0.5454, + "step": 5050 + }, + { + "epoch": 0.2, + "learning_rate": 9.076969696969697e-06, + "loss": 0.5455, + "step": 5075 + }, + { + "epoch": 0.2, + "learning_rate": 9.071919191919193e-06, + "loss": 0.5462, + "step": 5100 + }, + { + "epoch": 0.21, + "learning_rate": 9.066868686868687e-06, + "loss": 0.5283, + "step": 5125 + }, + { + "epoch": 0.21, + "learning_rate": 9.061818181818183e-06, + "loss": 0.5418, + "step": 5150 + }, + { + "epoch": 0.21, + "learning_rate": 9.056767676767677e-06, + "loss": 0.5293, + "step": 5175 + }, + { + "epoch": 0.21, + "learning_rate": 9.051717171717173e-06, + "loss": 0.5228, + "step": 5200 + }, + { + "epoch": 0.21, + "learning_rate": 9.046666666666668e-06, + "loss": 0.5381, + "step": 5225 + }, + { + "epoch": 0.21, + "learning_rate": 9.041616161616162e-06, + "loss": 0.5572, + "step": 5250 + }, + { + "epoch": 0.21, + "learning_rate": 9.036565656565656e-06, + "loss": 0.5243, + "step": 5275 + }, + { + "epoch": 0.21, + "learning_rate": 9.031515151515152e-06, + "loss": 0.5353, + "step": 5300 + }, + { + "epoch": 0.21, + "learning_rate": 9.026464646464648e-06, + "loss": 0.5348, + "step": 5325 + }, + { + "epoch": 0.21, + "learning_rate": 9.021414141414142e-06, + "loss": 0.5445, + "step": 5350 + }, + { + "epoch": 0.22, + "learning_rate": 9.016363636363637e-06, + "loss": 0.516, + "step": 5375 + }, + { + "epoch": 0.22, + "learning_rate": 9.011313131313133e-06, + "loss": 0.5268, + "step": 5400 + }, + { + "epoch": 0.22, + "learning_rate": 9.006262626262627e-06, + "loss": 0.5416, + "step": 5425 + }, + { + "epoch": 0.22, + "learning_rate": 9.001212121212121e-06, + "loss": 0.5564, + "step": 5450 + }, + { + "epoch": 0.22, + "learning_rate": 8.996161616161617e-06, + "loss": 0.5475, + "step": 5475 + }, + { + "epoch": 0.22, + "learning_rate": 8.991111111111112e-06, + "loss": 0.5441, + "step": 5500 + }, + { + "epoch": 0.22, + "learning_rate": 8.986060606060608e-06, + "loss": 0.5281, + "step": 5525 + }, + { + "epoch": 0.22, + "learning_rate": 8.981010101010102e-06, + "loss": 0.5289, + "step": 5550 + }, + { + "epoch": 0.22, + "learning_rate": 8.975959595959596e-06, + "loss": 0.5466, + "step": 5575 + }, + { + "epoch": 0.22, + "learning_rate": 8.97090909090909e-06, + "loss": 0.5344, + "step": 5600 + }, + { + "epoch": 0.23, + "learning_rate": 8.965858585858586e-06, + "loss": 0.51, + "step": 5625 + }, + { + "epoch": 0.23, + "learning_rate": 8.96080808080808e-06, + "loss": 0.498, + "step": 5650 + }, + { + "epoch": 0.23, + "learning_rate": 8.955757575757577e-06, + "loss": 0.5346, + "step": 5675 + }, + { + "epoch": 0.23, + "learning_rate": 8.950707070707071e-06, + "loss": 0.5269, + "step": 5700 + }, + { + "epoch": 0.23, + "learning_rate": 8.945656565656567e-06, + "loss": 0.5345, + "step": 5725 + }, + { + "epoch": 0.23, + "learning_rate": 8.940606060606061e-06, + "loss": 0.5265, + "step": 5750 + }, + { + "epoch": 0.23, + "learning_rate": 8.935555555555556e-06, + "loss": 0.5264, + "step": 5775 + }, + { + "epoch": 0.23, + "learning_rate": 8.930505050505052e-06, + "loss": 0.5177, + "step": 5800 + }, + { + "epoch": 0.23, + "learning_rate": 8.925454545454546e-06, + "loss": 0.533, + "step": 5825 + }, + { + "epoch": 0.23, + "learning_rate": 8.920404040404042e-06, + "loss": 0.5188, + "step": 5850 + }, + { + "epoch": 0.24, + "learning_rate": 8.915353535353536e-06, + "loss": 0.5245, + "step": 5875 + }, + { + "epoch": 0.24, + "learning_rate": 8.91030303030303e-06, + "loss": 0.5166, + "step": 5900 + }, + { + "epoch": 0.24, + "learning_rate": 8.905252525252527e-06, + "loss": 0.5323, + "step": 5925 + }, + { + "epoch": 0.24, + "learning_rate": 8.90020202020202e-06, + "loss": 0.5216, + "step": 5950 + }, + { + "epoch": 0.24, + "learning_rate": 8.895151515151515e-06, + "loss": 0.5037, + "step": 5975 + }, + { + "epoch": 0.24, + "learning_rate": 8.890101010101011e-06, + "loss": 0.5348, + "step": 6000 + }, + { + "epoch": 0.24, + "learning_rate": 8.885050505050505e-06, + "loss": 0.5265, + "step": 6025 + }, + { + "epoch": 0.24, + "learning_rate": 8.880000000000001e-06, + "loss": 0.5232, + "step": 6050 + }, + { + "epoch": 0.24, + "learning_rate": 8.874949494949496e-06, + "loss": 0.5024, + "step": 6075 + }, + { + "epoch": 0.24, + "learning_rate": 8.86989898989899e-06, + "loss": 0.5103, + "step": 6100 + }, + { + "epoch": 0.25, + "learning_rate": 8.864848484848484e-06, + "loss": 0.4969, + "step": 6125 + }, + { + "epoch": 0.25, + "learning_rate": 8.85979797979798e-06, + "loss": 0.5156, + "step": 6150 + }, + { + "epoch": 0.25, + "learning_rate": 8.854747474747476e-06, + "loss": 0.5261, + "step": 6175 + }, + { + "epoch": 0.25, + "learning_rate": 8.84969696969697e-06, + "loss": 0.5004, + "step": 6200 + }, + { + "epoch": 0.25, + "learning_rate": 8.844646464646467e-06, + "loss": 0.4955, + "step": 6225 + }, + { + "epoch": 0.25, + "learning_rate": 8.83959595959596e-06, + "loss": 0.5173, + "step": 6250 + }, + { + "epoch": 0.25, + "learning_rate": 8.834545454545455e-06, + "loss": 0.5217, + "step": 6275 + }, + { + "epoch": 0.25, + "learning_rate": 8.82949494949495e-06, + "loss": 0.512, + "step": 6300 + }, + { + "epoch": 0.25, + "learning_rate": 8.824444444444445e-06, + "loss": 0.506, + "step": 6325 + }, + { + "epoch": 0.25, + "learning_rate": 8.81939393939394e-06, + "loss": 0.5232, + "step": 6350 + }, + { + "epoch": 0.26, + "learning_rate": 8.814343434343436e-06, + "loss": 0.5187, + "step": 6375 + }, + { + "epoch": 0.26, + "learning_rate": 8.80929292929293e-06, + "loss": 0.4965, + "step": 6400 + }, + { + "epoch": 0.26, + "learning_rate": 8.804242424242426e-06, + "loss": 0.5071, + "step": 6425 + }, + { + "epoch": 0.26, + "learning_rate": 8.79919191919192e-06, + "loss": 0.5165, + "step": 6450 + }, + { + "epoch": 0.26, + "learning_rate": 8.794141414141415e-06, + "loss": 0.5104, + "step": 6475 + }, + { + "epoch": 0.26, + "learning_rate": 8.789090909090909e-06, + "loss": 0.4947, + "step": 6500 + }, + { + "epoch": 0.26, + "learning_rate": 8.784040404040405e-06, + "loss": 0.4864, + "step": 6525 + }, + { + "epoch": 0.26, + "learning_rate": 8.7789898989899e-06, + "loss": 0.5373, + "step": 6550 + }, + { + "epoch": 0.26, + "learning_rate": 8.773939393939395e-06, + "loss": 0.5253, + "step": 6575 + }, + { + "epoch": 0.26, + "learning_rate": 8.76888888888889e-06, + "loss": 0.5056, + "step": 6600 + }, + { + "epoch": 0.27, + "learning_rate": 8.763838383838384e-06, + "loss": 0.5065, + "step": 6625 + }, + { + "epoch": 0.27, + "learning_rate": 8.75878787878788e-06, + "loss": 0.5022, + "step": 6650 + }, + { + "epoch": 0.27, + "learning_rate": 8.753737373737374e-06, + "loss": 0.4991, + "step": 6675 + }, + { + "epoch": 0.27, + "learning_rate": 8.74868686868687e-06, + "loss": 0.5224, + "step": 6700 + }, + { + "epoch": 0.27, + "learning_rate": 8.743636363636364e-06, + "loss": 0.5293, + "step": 6725 + }, + { + "epoch": 0.27, + "learning_rate": 8.73858585858586e-06, + "loss": 0.5131, + "step": 6750 + }, + { + "epoch": 0.27, + "learning_rate": 8.733535353535355e-06, + "loss": 0.4972, + "step": 6775 + }, + { + "epoch": 0.27, + "learning_rate": 8.728484848484849e-06, + "loss": 0.4901, + "step": 6800 + }, + { + "epoch": 0.27, + "learning_rate": 8.723434343434343e-06, + "loss": 0.4907, + "step": 6825 + }, + { + "epoch": 0.27, + "learning_rate": 8.71838383838384e-06, + "loss": 0.4896, + "step": 6850 + }, + { + "epoch": 0.28, + "learning_rate": 8.713333333333333e-06, + "loss": 0.5052, + "step": 6875 + }, + { + "epoch": 0.28, + "learning_rate": 8.70828282828283e-06, + "loss": 0.5105, + "step": 6900 + }, + { + "epoch": 0.28, + "learning_rate": 8.703232323232324e-06, + "loss": 0.5036, + "step": 6925 + }, + { + "epoch": 0.28, + "learning_rate": 8.69818181818182e-06, + "loss": 0.4917, + "step": 6950 + }, + { + "epoch": 0.28, + "learning_rate": 8.693131313131314e-06, + "loss": 0.4844, + "step": 6975 + }, + { + "epoch": 0.28, + "learning_rate": 8.688080808080808e-06, + "loss": 0.5248, + "step": 7000 + }, + { + "epoch": 0.28, + "learning_rate": 8.683030303030304e-06, + "loss": 0.497, + "step": 7025 + }, + { + "epoch": 0.28, + "learning_rate": 8.677979797979799e-06, + "loss": 0.4918, + "step": 7050 + }, + { + "epoch": 0.28, + "learning_rate": 8.672929292929295e-06, + "loss": 0.5221, + "step": 7075 + }, + { + "epoch": 0.28, + "learning_rate": 8.667878787878789e-06, + "loss": 0.5155, + "step": 7100 + }, + { + "epoch": 0.29, + "learning_rate": 8.662828282828283e-06, + "loss": 0.5031, + "step": 7125 + }, + { + "epoch": 0.29, + "learning_rate": 8.657777777777778e-06, + "loss": 0.4829, + "step": 7150 + }, + { + "epoch": 0.29, + "learning_rate": 8.652727272727274e-06, + "loss": 0.4863, + "step": 7175 + }, + { + "epoch": 0.29, + "learning_rate": 8.647676767676768e-06, + "loss": 0.4697, + "step": 7200 + }, + { + "epoch": 0.29, + "learning_rate": 8.642626262626264e-06, + "loss": 0.4705, + "step": 7225 + }, + { + "epoch": 0.29, + "learning_rate": 8.637575757575758e-06, + "loss": 0.5049, + "step": 7250 + }, + { + "epoch": 0.29, + "learning_rate": 8.632525252525254e-06, + "loss": 0.5023, + "step": 7275 + }, + { + "epoch": 0.29, + "learning_rate": 8.627474747474748e-06, + "loss": 0.5118, + "step": 7300 + }, + { + "epoch": 0.29, + "learning_rate": 8.622424242424243e-06, + "loss": 0.5219, + "step": 7325 + }, + { + "epoch": 0.29, + "learning_rate": 8.617373737373737e-06, + "loss": 0.4733, + "step": 7350 + }, + { + "epoch": 0.3, + "learning_rate": 8.612323232323233e-06, + "loss": 0.4903, + "step": 7375 + }, + { + "epoch": 0.3, + "learning_rate": 8.607272727272727e-06, + "loss": 0.4855, + "step": 7400 + }, + { + "epoch": 0.3, + "learning_rate": 8.602222222222223e-06, + "loss": 0.4954, + "step": 7425 + }, + { + "epoch": 0.3, + "learning_rate": 8.597171717171718e-06, + "loss": 0.4778, + "step": 7450 + }, + { + "epoch": 0.3, + "learning_rate": 8.592121212121214e-06, + "loss": 0.5003, + "step": 7475 + }, + { + "epoch": 0.3, + "learning_rate": 8.587070707070708e-06, + "loss": 0.4954, + "step": 7500 + }, + { + "epoch": 0.3, + "eval_loss": 0.5018385052680969, + "eval_runtime": 326.6554, + "eval_samples_per_second": 15.322, + "eval_steps_per_second": 1.916, + "eval_wer": 39.86093642468972, + "step": 7500 + }, + { + "epoch": 0.3, + "learning_rate": 8.582020202020202e-06, + "loss": 0.5221, + "step": 7525 + }, + { + "epoch": 0.3, + "learning_rate": 8.576969696969698e-06, + "loss": 0.4649, + "step": 7550 + }, + { + "epoch": 0.3, + "learning_rate": 8.571919191919192e-06, + "loss": 0.5203, + "step": 7575 + }, + { + "epoch": 0.3, + "learning_rate": 8.566868686868688e-06, + "loss": 0.4946, + "step": 7600 + }, + { + "epoch": 0.31, + "learning_rate": 8.561818181818183e-06, + "loss": 0.4797, + "step": 7625 + }, + { + "epoch": 0.31, + "learning_rate": 8.556767676767677e-06, + "loss": 0.5038, + "step": 7650 + }, + { + "epoch": 0.31, + "learning_rate": 8.551717171717171e-06, + "loss": 0.4835, + "step": 7675 + }, + { + "epoch": 0.31, + "learning_rate": 8.546666666666667e-06, + "loss": 0.5149, + "step": 7700 + }, + { + "epoch": 0.31, + "learning_rate": 8.541616161616162e-06, + "loss": 0.4866, + "step": 7725 + }, + { + "epoch": 0.31, + "learning_rate": 8.536565656565658e-06, + "loss": 0.4996, + "step": 7750 + }, + { + "epoch": 0.31, + "learning_rate": 8.531515151515152e-06, + "loss": 0.4758, + "step": 7775 + }, + { + "epoch": 0.31, + "learning_rate": 8.526464646464648e-06, + "loss": 0.5027, + "step": 7800 + }, + { + "epoch": 0.31, + "learning_rate": 8.521414141414142e-06, + "loss": 0.4976, + "step": 7825 + }, + { + "epoch": 0.31, + "learning_rate": 8.516363636363636e-06, + "loss": 0.4817, + "step": 7850 + }, + { + "epoch": 0.32, + "learning_rate": 8.511313131313132e-06, + "loss": 0.5112, + "step": 7875 + }, + { + "epoch": 0.32, + "learning_rate": 8.506262626262627e-06, + "loss": 0.476, + "step": 7900 + }, + { + "epoch": 0.32, + "learning_rate": 8.501212121212123e-06, + "loss": 0.4719, + "step": 7925 + }, + { + "epoch": 0.32, + "learning_rate": 8.496161616161617e-06, + "loss": 0.4911, + "step": 7950 + }, + { + "epoch": 0.32, + "learning_rate": 8.491111111111113e-06, + "loss": 0.503, + "step": 7975 + }, + { + "epoch": 0.32, + "learning_rate": 8.486060606060607e-06, + "loss": 0.4636, + "step": 8000 + }, + { + "epoch": 0.32, + "learning_rate": 8.481010101010102e-06, + "loss": 0.4923, + "step": 8025 + }, + { + "epoch": 0.32, + "learning_rate": 8.475959595959596e-06, + "loss": 0.4896, + "step": 8050 + }, + { + "epoch": 0.32, + "learning_rate": 8.470909090909092e-06, + "loss": 0.4901, + "step": 8075 + }, + { + "epoch": 0.32, + "learning_rate": 8.465858585858586e-06, + "loss": 0.4871, + "step": 8100 + }, + { + "epoch": 0.33, + "learning_rate": 8.460808080808082e-06, + "loss": 0.4808, + "step": 8125 + }, + { + "epoch": 0.33, + "learning_rate": 8.455757575757576e-06, + "loss": 0.4749, + "step": 8150 + }, + { + "epoch": 0.33, + "learning_rate": 8.45070707070707e-06, + "loss": 0.4905, + "step": 8175 + }, + { + "epoch": 0.33, + "learning_rate": 8.445656565656565e-06, + "loss": 0.4963, + "step": 8200 + }, + { + "epoch": 0.33, + "learning_rate": 8.440606060606061e-06, + "loss": 0.4755, + "step": 8225 + }, + { + "epoch": 0.33, + "learning_rate": 8.435555555555555e-06, + "loss": 0.5149, + "step": 8250 + }, + { + "epoch": 0.33, + "learning_rate": 8.430505050505051e-06, + "loss": 0.4944, + "step": 8275 + }, + { + "epoch": 0.33, + "learning_rate": 8.425454545454547e-06, + "loss": 0.4671, + "step": 8300 + }, + { + "epoch": 0.33, + "learning_rate": 8.420404040404042e-06, + "loss": 0.4706, + "step": 8325 + }, + { + "epoch": 0.33, + "learning_rate": 8.415353535353536e-06, + "loss": 0.4601, + "step": 8350 + }, + { + "epoch": 0.34, + "learning_rate": 8.41030303030303e-06, + "loss": 0.4612, + "step": 8375 + }, + { + "epoch": 0.34, + "learning_rate": 8.405252525252526e-06, + "loss": 0.4672, + "step": 8400 + }, + { + "epoch": 0.34, + "learning_rate": 8.40020202020202e-06, + "loss": 0.4875, + "step": 8425 + }, + { + "epoch": 0.34, + "learning_rate": 8.395151515151516e-06, + "loss": 0.5222, + "step": 8450 + }, + { + "epoch": 0.34, + "learning_rate": 8.39010101010101e-06, + "loss": 0.477, + "step": 8475 + }, + { + "epoch": 0.34, + "learning_rate": 8.385050505050507e-06, + "loss": 0.477, + "step": 8500 + }, + { + "epoch": 0.34, + "learning_rate": 8.380000000000001e-06, + "loss": 0.4654, + "step": 8525 + }, + { + "epoch": 0.34, + "learning_rate": 8.374949494949495e-06, + "loss": 0.4953, + "step": 8550 + }, + { + "epoch": 0.34, + "learning_rate": 8.36989898989899e-06, + "loss": 0.4741, + "step": 8575 + }, + { + "epoch": 0.34, + "learning_rate": 8.364848484848486e-06, + "loss": 0.5095, + "step": 8600 + }, + { + "epoch": 0.35, + "learning_rate": 8.35979797979798e-06, + "loss": 0.4731, + "step": 8625 + }, + { + "epoch": 0.35, + "learning_rate": 8.354747474747476e-06, + "loss": 0.4665, + "step": 8650 + }, + { + "epoch": 0.35, + "learning_rate": 8.34969696969697e-06, + "loss": 0.483, + "step": 8675 + }, + { + "epoch": 0.35, + "learning_rate": 8.344646464646465e-06, + "loss": 0.4905, + "step": 8700 + }, + { + "epoch": 0.35, + "learning_rate": 8.33959595959596e-06, + "loss": 0.4658, + "step": 8725 + }, + { + "epoch": 0.35, + "learning_rate": 8.334545454545455e-06, + "loss": 0.4826, + "step": 8750 + }, + { + "epoch": 0.35, + "learning_rate": 8.32949494949495e-06, + "loss": 0.478, + "step": 8775 + }, + { + "epoch": 0.35, + "learning_rate": 8.324444444444445e-06, + "loss": 0.4846, + "step": 8800 + }, + { + "epoch": 0.35, + "learning_rate": 8.319393939393941e-06, + "loss": 0.4757, + "step": 8825 + }, + { + "epoch": 0.35, + "learning_rate": 8.314343434343435e-06, + "loss": 0.4847, + "step": 8850 + }, + { + "epoch": 0.36, + "learning_rate": 8.30929292929293e-06, + "loss": 0.4886, + "step": 8875 + }, + { + "epoch": 0.36, + "learning_rate": 8.304242424242424e-06, + "loss": 0.4724, + "step": 8900 + }, + { + "epoch": 0.36, + "learning_rate": 8.29919191919192e-06, + "loss": 0.4785, + "step": 8925 + }, + { + "epoch": 0.36, + "learning_rate": 8.294141414141414e-06, + "loss": 0.4844, + "step": 8950 + }, + { + "epoch": 0.36, + "learning_rate": 8.28909090909091e-06, + "loss": 0.4694, + "step": 8975 + }, + { + "epoch": 0.36, + "learning_rate": 8.284040404040405e-06, + "loss": 0.4852, + "step": 9000 + }, + { + "epoch": 0.36, + "learning_rate": 8.2789898989899e-06, + "loss": 0.4963, + "step": 9025 + }, + { + "epoch": 0.36, + "learning_rate": 8.273939393939395e-06, + "loss": 0.4735, + "step": 9050 + }, + { + "epoch": 0.36, + "learning_rate": 8.268888888888889e-06, + "loss": 0.4733, + "step": 9075 + }, + { + "epoch": 0.36, + "learning_rate": 8.263838383838383e-06, + "loss": 0.4537, + "step": 9100 + }, + { + "epoch": 0.37, + "learning_rate": 8.25878787878788e-06, + "loss": 0.4843, + "step": 9125 + }, + { + "epoch": 0.37, + "learning_rate": 8.253737373737375e-06, + "loss": 0.4789, + "step": 9150 + }, + { + "epoch": 0.37, + "learning_rate": 8.24868686868687e-06, + "loss": 0.4908, + "step": 9175 + }, + { + "epoch": 0.37, + "learning_rate": 8.243636363636364e-06, + "loss": 0.4735, + "step": 9200 + }, + { + "epoch": 0.37, + "learning_rate": 8.238585858585858e-06, + "loss": 0.476, + "step": 9225 + }, + { + "epoch": 0.37, + "learning_rate": 8.233535353535354e-06, + "loss": 0.4844, + "step": 9250 + }, + { + "epoch": 0.37, + "learning_rate": 8.228484848484849e-06, + "loss": 0.4828, + "step": 9275 + }, + { + "epoch": 0.37, + "learning_rate": 8.223434343434345e-06, + "loss": 0.5066, + "step": 9300 + }, + { + "epoch": 0.37, + "learning_rate": 8.218383838383839e-06, + "loss": 0.4674, + "step": 9325 + }, + { + "epoch": 0.37, + "learning_rate": 8.213333333333335e-06, + "loss": 0.47, + "step": 9350 + }, + { + "epoch": 0.38, + "learning_rate": 8.20828282828283e-06, + "loss": 0.4821, + "step": 9375 + }, + { + "epoch": 0.38, + "learning_rate": 8.203232323232323e-06, + "loss": 0.4588, + "step": 9400 + }, + { + "epoch": 0.38, + "learning_rate": 8.198181818181818e-06, + "loss": 0.4674, + "step": 9425 + }, + { + "epoch": 0.38, + "learning_rate": 8.193131313131314e-06, + "loss": 0.4825, + "step": 9450 + }, + { + "epoch": 0.38, + "learning_rate": 8.188080808080808e-06, + "loss": 0.472, + "step": 9475 + }, + { + "epoch": 0.38, + "learning_rate": 8.183030303030304e-06, + "loss": 0.4723, + "step": 9500 + }, + { + "epoch": 0.38, + "learning_rate": 8.177979797979798e-06, + "loss": 0.4703, + "step": 9525 + }, + { + "epoch": 0.38, + "learning_rate": 8.172929292929294e-06, + "loss": 0.4945, + "step": 9550 + }, + { + "epoch": 0.38, + "learning_rate": 8.167878787878789e-06, + "loss": 0.4829, + "step": 9575 + }, + { + "epoch": 0.38, + "learning_rate": 8.162828282828283e-06, + "loss": 0.4595, + "step": 9600 + }, + { + "epoch": 0.39, + "learning_rate": 8.157777777777779e-06, + "loss": 0.4775, + "step": 9625 + }, + { + "epoch": 0.39, + "learning_rate": 8.152727272727273e-06, + "loss": 0.4583, + "step": 9650 + }, + { + "epoch": 0.39, + "learning_rate": 8.14767676767677e-06, + "loss": 0.4716, + "step": 9675 + }, + { + "epoch": 0.39, + "learning_rate": 8.142626262626263e-06, + "loss": 0.467, + "step": 9700 + }, + { + "epoch": 0.39, + "learning_rate": 8.137575757575758e-06, + "loss": 0.456, + "step": 9725 + }, + { + "epoch": 0.39, + "learning_rate": 8.132525252525252e-06, + "loss": 0.4694, + "step": 9750 + }, + { + "epoch": 0.39, + "learning_rate": 8.127474747474748e-06, + "loss": 0.4902, + "step": 9775 + }, + { + "epoch": 0.39, + "learning_rate": 8.122424242424242e-06, + "loss": 0.4852, + "step": 9800 + }, + { + "epoch": 0.39, + "learning_rate": 8.117373737373738e-06, + "loss": 0.4721, + "step": 9825 + }, + { + "epoch": 0.39, + "learning_rate": 8.112323232323233e-06, + "loss": 0.4712, + "step": 9850 + }, + { + "epoch": 0.4, + "learning_rate": 8.107272727272729e-06, + "loss": 0.4862, + "step": 9875 + }, + { + "epoch": 0.4, + "learning_rate": 8.102222222222223e-06, + "loss": 0.4626, + "step": 9900 + }, + { + "epoch": 0.4, + "learning_rate": 8.097171717171717e-06, + "loss": 0.4675, + "step": 9925 + }, + { + "epoch": 0.4, + "learning_rate": 8.092121212121212e-06, + "loss": 0.4686, + "step": 9950 + }, + { + "epoch": 0.4, + "learning_rate": 8.087070707070708e-06, + "loss": 0.455, + "step": 9975 + }, + { + "epoch": 0.4, + "learning_rate": 8.082020202020204e-06, + "loss": 0.474, + "step": 10000 + }, + { + "epoch": 0.4, + "eval_loss": 0.4769977331161499, + "eval_runtime": 328.2875, + "eval_samples_per_second": 15.246, + "eval_steps_per_second": 1.907, + "eval_wer": 38.55335912100429, + "step": 10000 + }, + { + "epoch": 0.4, + "learning_rate": 8.076969696969698e-06, + "loss": 0.4679, + "step": 10025 + }, + { + "epoch": 0.4, + "learning_rate": 8.071919191919194e-06, + "loss": 0.4848, + "step": 10050 + }, + { + "epoch": 0.4, + "learning_rate": 8.066868686868688e-06, + "loss": 0.4654, + "step": 10075 + }, + { + "epoch": 0.41, + "learning_rate": 8.061818181818182e-06, + "loss": 0.4622, + "step": 10100 + }, + { + "epoch": 0.41, + "learning_rate": 8.056767676767677e-06, + "loss": 0.4658, + "step": 10125 + }, + { + "epoch": 0.41, + "learning_rate": 8.051717171717173e-06, + "loss": 0.4618, + "step": 10150 + }, + { + "epoch": 0.41, + "learning_rate": 8.046666666666667e-06, + "loss": 0.4523, + "step": 10175 + }, + { + "epoch": 0.41, + "learning_rate": 8.041616161616163e-06, + "loss": 0.4575, + "step": 10200 + }, + { + "epoch": 0.41, + "learning_rate": 8.036565656565657e-06, + "loss": 0.4779, + "step": 10225 + }, + { + "epoch": 0.41, + "learning_rate": 8.031515151515152e-06, + "loss": 0.4713, + "step": 10250 + }, + { + "epoch": 0.41, + "learning_rate": 8.026464646464648e-06, + "loss": 0.4525, + "step": 10275 + }, + { + "epoch": 0.41, + "learning_rate": 8.021414141414142e-06, + "loss": 0.459, + "step": 10300 + }, + { + "epoch": 0.41, + "learning_rate": 8.016363636363636e-06, + "loss": 0.4714, + "step": 10325 + }, + { + "epoch": 0.42, + "learning_rate": 8.011313131313132e-06, + "loss": 0.4553, + "step": 10350 + }, + { + "epoch": 0.42, + "learning_rate": 8.006262626262626e-06, + "loss": 0.4742, + "step": 10375 + }, + { + "epoch": 0.42, + "learning_rate": 8.001212121212122e-06, + "loss": 0.4661, + "step": 10400 + }, + { + "epoch": 0.42, + "learning_rate": 7.996161616161617e-06, + "loss": 0.4629, + "step": 10425 + }, + { + "epoch": 0.42, + "learning_rate": 7.991111111111111e-06, + "loss": 0.4588, + "step": 10450 + }, + { + "epoch": 0.42, + "learning_rate": 7.986060606060607e-06, + "loss": 0.4659, + "step": 10475 + }, + { + "epoch": 0.42, + "learning_rate": 7.981010101010101e-06, + "loss": 0.48, + "step": 10500 + }, + { + "epoch": 0.42, + "learning_rate": 7.975959595959597e-06, + "loss": 0.4733, + "step": 10525 + }, + { + "epoch": 0.42, + "learning_rate": 7.970909090909092e-06, + "loss": 0.453, + "step": 10550 + }, + { + "epoch": 0.42, + "learning_rate": 7.965858585858588e-06, + "loss": 0.4801, + "step": 10575 + }, + { + "epoch": 0.43, + "learning_rate": 7.960808080808082e-06, + "loss": 0.469, + "step": 10600 + }, + { + "epoch": 0.43, + "learning_rate": 7.955959595959597e-06, + "loss": 0.4507, + "step": 10625 + }, + { + "epoch": 0.43, + "learning_rate": 7.950909090909092e-06, + "loss": 0.4579, + "step": 10650 + }, + { + "epoch": 0.43, + "learning_rate": 7.945858585858586e-06, + "loss": 0.4767, + "step": 10675 + }, + { + "epoch": 0.43, + "learning_rate": 7.94080808080808e-06, + "loss": 0.4625, + "step": 10700 + }, + { + "epoch": 0.43, + "learning_rate": 7.935757575757576e-06, + "loss": 0.4727, + "step": 10725 + }, + { + "epoch": 0.43, + "learning_rate": 7.93070707070707e-06, + "loss": 0.4751, + "step": 10750 + }, + { + "epoch": 0.43, + "learning_rate": 7.925656565656567e-06, + "loss": 0.4682, + "step": 10775 + }, + { + "epoch": 0.43, + "learning_rate": 7.920606060606061e-06, + "loss": 0.4623, + "step": 10800 + }, + { + "epoch": 0.43, + "learning_rate": 7.915555555555557e-06, + "loss": 0.4775, + "step": 10825 + }, + { + "epoch": 0.44, + "learning_rate": 7.910505050505051e-06, + "loss": 0.4522, + "step": 10850 + }, + { + "epoch": 0.44, + "learning_rate": 7.905454545454546e-06, + "loss": 0.4873, + "step": 10875 + }, + { + "epoch": 0.44, + "learning_rate": 7.90040404040404e-06, + "loss": 0.4528, + "step": 10900 + }, + { + "epoch": 0.44, + "learning_rate": 7.895353535353536e-06, + "loss": 0.4521, + "step": 10925 + }, + { + "epoch": 0.44, + "learning_rate": 7.890303030303032e-06, + "loss": 0.4691, + "step": 10950 + }, + { + "epoch": 0.44, + "learning_rate": 7.885252525252526e-06, + "loss": 0.4294, + "step": 10975 + }, + { + "epoch": 0.44, + "learning_rate": 7.880202020202022e-06, + "loss": 0.4611, + "step": 11000 + }, + { + "epoch": 0.44, + "learning_rate": 7.875151515151516e-06, + "loss": 0.4458, + "step": 11025 + }, + { + "epoch": 0.44, + "learning_rate": 7.87010101010101e-06, + "loss": 0.4761, + "step": 11050 + }, + { + "epoch": 0.44, + "learning_rate": 7.865050505050505e-06, + "loss": 0.4584, + "step": 11075 + }, + { + "epoch": 0.45, + "learning_rate": 7.860000000000001e-06, + "loss": 0.4644, + "step": 11100 + }, + { + "epoch": 0.45, + "learning_rate": 7.854949494949495e-06, + "loss": 0.4633, + "step": 11125 + }, + { + "epoch": 0.45, + "learning_rate": 7.849898989898991e-06, + "loss": 0.4631, + "step": 11150 + }, + { + "epoch": 0.45, + "learning_rate": 7.844848484848486e-06, + "loss": 0.4461, + "step": 11175 + }, + { + "epoch": 0.45, + "learning_rate": 7.83979797979798e-06, + "loss": 0.4874, + "step": 11200 + }, + { + "epoch": 0.45, + "learning_rate": 7.834747474747474e-06, + "loss": 0.469, + "step": 11225 + }, + { + "epoch": 0.45, + "learning_rate": 7.82969696969697e-06, + "loss": 0.4195, + "step": 11250 + }, + { + "epoch": 0.45, + "learning_rate": 7.824646464646464e-06, + "loss": 0.4769, + "step": 11275 + }, + { + "epoch": 0.45, + "learning_rate": 7.81959595959596e-06, + "loss": 0.465, + "step": 11300 + }, + { + "epoch": 0.45, + "learning_rate": 7.814545454545455e-06, + "loss": 0.464, + "step": 11325 + }, + { + "epoch": 0.46, + "learning_rate": 7.80949494949495e-06, + "loss": 0.4559, + "step": 11350 + }, + { + "epoch": 0.46, + "learning_rate": 7.804444444444445e-06, + "loss": 0.466, + "step": 11375 + }, + { + "epoch": 0.46, + "learning_rate": 7.79939393939394e-06, + "loss": 0.4683, + "step": 11400 + }, + { + "epoch": 0.46, + "learning_rate": 7.794343434343435e-06, + "loss": 0.4619, + "step": 11425 + }, + { + "epoch": 0.46, + "learning_rate": 7.78929292929293e-06, + "loss": 0.457, + "step": 11450 + }, + { + "epoch": 0.46, + "learning_rate": 7.784242424242426e-06, + "loss": 0.4535, + "step": 11475 + }, + { + "epoch": 0.46, + "learning_rate": 7.77919191919192e-06, + "loss": 0.4749, + "step": 11500 + }, + { + "epoch": 0.46, + "learning_rate": 7.774141414141416e-06, + "loss": 0.4634, + "step": 11525 + }, + { + "epoch": 0.46, + "learning_rate": 7.76909090909091e-06, + "loss": 0.4517, + "step": 11550 + }, + { + "epoch": 0.46, + "learning_rate": 7.764040404040404e-06, + "loss": 0.457, + "step": 11575 + }, + { + "epoch": 0.47, + "learning_rate": 7.758989898989899e-06, + "loss": 0.464, + "step": 11600 + }, + { + "epoch": 0.47, + "learning_rate": 7.753939393939395e-06, + "loss": 0.4606, + "step": 11625 + }, + { + "epoch": 0.47, + "learning_rate": 7.748888888888889e-06, + "loss": 0.4593, + "step": 11650 + }, + { + "epoch": 0.47, + "learning_rate": 7.743838383838385e-06, + "loss": 0.4581, + "step": 11675 + }, + { + "epoch": 0.47, + "learning_rate": 7.73878787878788e-06, + "loss": 0.4554, + "step": 11700 + }, + { + "epoch": 0.47, + "learning_rate": 7.733737373737374e-06, + "loss": 0.4449, + "step": 11725 + }, + { + "epoch": 0.47, + "learning_rate": 7.72868686868687e-06, + "loss": 0.4626, + "step": 11750 + }, + { + "epoch": 0.47, + "learning_rate": 7.723636363636364e-06, + "loss": 0.4584, + "step": 11775 + }, + { + "epoch": 0.47, + "learning_rate": 7.71858585858586e-06, + "loss": 0.4659, + "step": 11800 + }, + { + "epoch": 0.47, + "learning_rate": 7.713535353535354e-06, + "loss": 0.459, + "step": 11825 + }, + { + "epoch": 0.48, + "learning_rate": 7.70848484848485e-06, + "loss": 0.463, + "step": 11850 + }, + { + "epoch": 0.48, + "learning_rate": 7.703434343434344e-06, + "loss": 0.4443, + "step": 11875 + }, + { + "epoch": 0.48, + "learning_rate": 7.698383838383839e-06, + "loss": 0.4517, + "step": 11900 + }, + { + "epoch": 0.48, + "learning_rate": 7.693333333333333e-06, + "loss": 0.4524, + "step": 11925 + }, + { + "epoch": 0.48, + "learning_rate": 7.688282828282829e-06, + "loss": 0.4523, + "step": 11950 + }, + { + "epoch": 0.48, + "learning_rate": 7.683232323232323e-06, + "loss": 0.4685, + "step": 11975 + }, + { + "epoch": 0.48, + "learning_rate": 7.67818181818182e-06, + "loss": 0.4485, + "step": 12000 + }, + { + "epoch": 0.48, + "learning_rate": 7.673131313131314e-06, + "loss": 0.4742, + "step": 12025 + }, + { + "epoch": 0.48, + "learning_rate": 7.66808080808081e-06, + "loss": 0.4501, + "step": 12050 + }, + { + "epoch": 0.48, + "learning_rate": 7.663030303030304e-06, + "loss": 0.4459, + "step": 12075 + }, + { + "epoch": 0.49, + "learning_rate": 7.657979797979798e-06, + "loss": 0.4643, + "step": 12100 + }, + { + "epoch": 0.49, + "learning_rate": 7.652929292929293e-06, + "loss": 0.4588, + "step": 12125 + }, + { + "epoch": 0.49, + "learning_rate": 7.647878787878789e-06, + "loss": 0.4591, + "step": 12150 + }, + { + "epoch": 0.49, + "learning_rate": 7.642828282828283e-06, + "loss": 0.4493, + "step": 12175 + }, + { + "epoch": 0.49, + "learning_rate": 7.637777777777779e-06, + "loss": 0.456, + "step": 12200 + }, + { + "epoch": 0.49, + "learning_rate": 7.632727272727273e-06, + "loss": 0.4726, + "step": 12225 + }, + { + "epoch": 0.49, + "learning_rate": 7.627676767676768e-06, + "loss": 0.4447, + "step": 12250 + }, + { + "epoch": 0.49, + "learning_rate": 7.622626262626263e-06, + "loss": 0.4495, + "step": 12275 + }, + { + "epoch": 0.49, + "learning_rate": 7.617575757575758e-06, + "loss": 0.4478, + "step": 12300 + }, + { + "epoch": 0.49, + "learning_rate": 7.612525252525254e-06, + "loss": 0.4667, + "step": 12325 + }, + { + "epoch": 0.5, + "learning_rate": 7.607474747474748e-06, + "loss": 0.4626, + "step": 12350 + }, + { + "epoch": 0.5, + "learning_rate": 7.602424242424243e-06, + "loss": 0.4549, + "step": 12375 + }, + { + "epoch": 0.5, + "learning_rate": 7.597373737373737e-06, + "loss": 0.4582, + "step": 12400 + }, + { + "epoch": 0.5, + "learning_rate": 7.592323232323233e-06, + "loss": 0.4496, + "step": 12425 + }, + { + "epoch": 0.5, + "learning_rate": 7.587272727272728e-06, + "loss": 0.4604, + "step": 12450 + }, + { + "epoch": 0.5, + "learning_rate": 7.582222222222223e-06, + "loss": 0.4592, + "step": 12475 + }, + { + "epoch": 0.5, + "learning_rate": 7.577171717171717e-06, + "loss": 0.4696, + "step": 12500 + }, + { + "epoch": 0.5, + "eval_loss": 0.4565899670124054, + "eval_runtime": 321.107, + "eval_samples_per_second": 15.587, + "eval_steps_per_second": 1.95, + "eval_wer": 36.25145352286481, + "step": 12500 + }, + { + "epoch": 0.5, + "learning_rate": 7.572121212121213e-06, + "loss": 0.4294, + "step": 12525 + }, + { + "epoch": 0.5, + "learning_rate": 7.5670707070707074e-06, + "loss": 0.4358, + "step": 12550 + }, + { + "epoch": 0.5, + "learning_rate": 7.5620202020202026e-06, + "loss": 0.4569, + "step": 12575 + }, + { + "epoch": 0.51, + "learning_rate": 7.556969696969697e-06, + "loss": 0.4464, + "step": 12600 + }, + { + "epoch": 0.51, + "learning_rate": 7.551919191919193e-06, + "loss": 0.4645, + "step": 12625 + }, + { + "epoch": 0.51, + "learning_rate": 7.547070707070708e-06, + "loss": 0.4547, + "step": 12650 + }, + { + "epoch": 0.51, + "learning_rate": 7.542020202020203e-06, + "loss": 0.4748, + "step": 12675 + }, + { + "epoch": 0.51, + "learning_rate": 7.536969696969697e-06, + "loss": 0.4344, + "step": 12700 + }, + { + "epoch": 0.51, + "learning_rate": 7.531919191919192e-06, + "loss": 0.4418, + "step": 12725 + }, + { + "epoch": 0.51, + "learning_rate": 7.526868686868688e-06, + "loss": 0.4521, + "step": 12750 + }, + { + "epoch": 0.51, + "learning_rate": 7.5218181818181825e-06, + "loss": 0.4655, + "step": 12775 + }, + { + "epoch": 0.51, + "learning_rate": 7.516767676767678e-06, + "loss": 0.4499, + "step": 12800 + }, + { + "epoch": 0.51, + "learning_rate": 7.511717171717172e-06, + "loss": 0.4473, + "step": 12825 + }, + { + "epoch": 0.52, + "learning_rate": 7.506666666666668e-06, + "loss": 0.436, + "step": 12850 + }, + { + "epoch": 0.52, + "learning_rate": 7.501616161616162e-06, + "loss": 0.4446, + "step": 12875 + }, + { + "epoch": 0.52, + "learning_rate": 7.496565656565657e-06, + "loss": 0.4504, + "step": 12900 + }, + { + "epoch": 0.52, + "learning_rate": 7.491515151515152e-06, + "loss": 0.4611, + "step": 12925 + }, + { + "epoch": 0.52, + "learning_rate": 7.486464646464648e-06, + "loss": 0.4572, + "step": 12950 + }, + { + "epoch": 0.52, + "learning_rate": 7.481414141414142e-06, + "loss": 0.4517, + "step": 12975 + }, + { + "epoch": 0.52, + "learning_rate": 7.476363636363637e-06, + "loss": 0.4624, + "step": 13000 + }, + { + "epoch": 0.52, + "learning_rate": 7.471313131313131e-06, + "loss": 0.4618, + "step": 13025 + }, + { + "epoch": 0.52, + "learning_rate": 7.466262626262627e-06, + "loss": 0.4608, + "step": 13050 + }, + { + "epoch": 0.52, + "learning_rate": 7.461212121212122e-06, + "loss": 0.4573, + "step": 13075 + }, + { + "epoch": 0.53, + "learning_rate": 7.456161616161617e-06, + "loss": 0.4477, + "step": 13100 + }, + { + "epoch": 0.53, + "learning_rate": 7.451111111111111e-06, + "loss": 0.453, + "step": 13125 + }, + { + "epoch": 0.53, + "learning_rate": 7.446060606060606e-06, + "loss": 0.4737, + "step": 13150 + }, + { + "epoch": 0.53, + "learning_rate": 7.441010101010102e-06, + "loss": 0.4351, + "step": 13175 + }, + { + "epoch": 0.53, + "learning_rate": 7.4359595959595965e-06, + "loss": 0.4378, + "step": 13200 + }, + { + "epoch": 0.53, + "learning_rate": 7.430909090909092e-06, + "loss": 0.4598, + "step": 13225 + }, + { + "epoch": 0.53, + "learning_rate": 7.425858585858586e-06, + "loss": 0.4454, + "step": 13250 + }, + { + "epoch": 0.53, + "learning_rate": 7.420808080808082e-06, + "loss": 0.4307, + "step": 13275 + }, + { + "epoch": 0.53, + "learning_rate": 7.415757575757576e-06, + "loss": 0.4513, + "step": 13300 + }, + { + "epoch": 0.53, + "learning_rate": 7.410707070707071e-06, + "loss": 0.4448, + "step": 13325 + }, + { + "epoch": 0.54, + "learning_rate": 7.405656565656566e-06, + "loss": 0.452, + "step": 13350 + }, + { + "epoch": 0.54, + "learning_rate": 7.400606060606062e-06, + "loss": 0.4399, + "step": 13375 + }, + { + "epoch": 0.54, + "learning_rate": 7.395555555555556e-06, + "loss": 0.432, + "step": 13400 + }, + { + "epoch": 0.54, + "learning_rate": 7.390505050505051e-06, + "loss": 0.4261, + "step": 13425 + }, + { + "epoch": 0.54, + "learning_rate": 7.3854545454545454e-06, + "loss": 0.4497, + "step": 13450 + }, + { + "epoch": 0.54, + "learning_rate": 7.380404040404041e-06, + "loss": 0.4483, + "step": 13475 + }, + { + "epoch": 0.54, + "learning_rate": 7.375353535353536e-06, + "loss": 0.4701, + "step": 13500 + }, + { + "epoch": 0.54, + "learning_rate": 7.370303030303031e-06, + "loss": 0.4214, + "step": 13525 + }, + { + "epoch": 0.54, + "learning_rate": 7.365252525252525e-06, + "loss": 0.4399, + "step": 13550 + }, + { + "epoch": 0.54, + "learning_rate": 7.360202020202021e-06, + "loss": 0.4282, + "step": 13575 + }, + { + "epoch": 0.55, + "learning_rate": 7.355151515151516e-06, + "loss": 0.4441, + "step": 13600 + }, + { + "epoch": 0.55, + "learning_rate": 7.350101010101011e-06, + "loss": 0.4249, + "step": 13625 + }, + { + "epoch": 0.55, + "learning_rate": 7.345050505050506e-06, + "loss": 0.4295, + "step": 13650 + }, + { + "epoch": 0.55, + "learning_rate": 7.340000000000001e-06, + "loss": 0.4408, + "step": 13675 + }, + { + "epoch": 0.55, + "learning_rate": 7.334949494949496e-06, + "loss": 0.4572, + "step": 13700 + }, + { + "epoch": 0.55, + "learning_rate": 7.32989898989899e-06, + "loss": 0.4507, + "step": 13725 + }, + { + "epoch": 0.55, + "learning_rate": 7.3248484848484855e-06, + "loss": 0.4469, + "step": 13750 + }, + { + "epoch": 0.55, + "learning_rate": 7.31979797979798e-06, + "loss": 0.4359, + "step": 13775 + }, + { + "epoch": 0.55, + "learning_rate": 7.314747474747476e-06, + "loss": 0.4609, + "step": 13800 + }, + { + "epoch": 0.55, + "learning_rate": 7.30969696969697e-06, + "loss": 0.4651, + "step": 13825 + }, + { + "epoch": 0.56, + "learning_rate": 7.304646464646465e-06, + "loss": 0.443, + "step": 13850 + }, + { + "epoch": 0.56, + "learning_rate": 7.2995959595959595e-06, + "loss": 0.4593, + "step": 13875 + }, + { + "epoch": 0.56, + "learning_rate": 7.2945454545454555e-06, + "loss": 0.4594, + "step": 13900 + }, + { + "epoch": 0.56, + "learning_rate": 7.28949494949495e-06, + "loss": 0.419, + "step": 13925 + }, + { + "epoch": 0.56, + "learning_rate": 7.284444444444445e-06, + "loss": 0.4348, + "step": 13950 + }, + { + "epoch": 0.56, + "learning_rate": 7.279393939393939e-06, + "loss": 0.4551, + "step": 13975 + }, + { + "epoch": 0.56, + "learning_rate": 7.274343434343435e-06, + "loss": 0.4223, + "step": 14000 + }, + { + "epoch": 0.56, + "learning_rate": 7.26929292929293e-06, + "loss": 0.4658, + "step": 14025 + }, + { + "epoch": 0.56, + "learning_rate": 7.264242424242425e-06, + "loss": 0.4239, + "step": 14050 + }, + { + "epoch": 0.56, + "learning_rate": 7.259191919191921e-06, + "loss": 0.4249, + "step": 14075 + }, + { + "epoch": 0.57, + "learning_rate": 7.254141414141415e-06, + "loss": 0.4387, + "step": 14100 + }, + { + "epoch": 0.57, + "learning_rate": 7.24909090909091e-06, + "loss": 0.4284, + "step": 14125 + }, + { + "epoch": 0.57, + "learning_rate": 7.244040404040404e-06, + "loss": 0.4468, + "step": 14150 + }, + { + "epoch": 0.57, + "learning_rate": 7.2389898989898995e-06, + "loss": 0.4401, + "step": 14175 + }, + { + "epoch": 0.57, + "learning_rate": 7.233939393939395e-06, + "loss": 0.4362, + "step": 14200 + }, + { + "epoch": 0.57, + "learning_rate": 7.22888888888889e-06, + "loss": 0.4445, + "step": 14225 + }, + { + "epoch": 0.57, + "learning_rate": 7.223838383838384e-06, + "loss": 0.4435, + "step": 14250 + }, + { + "epoch": 0.57, + "learning_rate": 7.218787878787879e-06, + "loss": 0.4479, + "step": 14275 + }, + { + "epoch": 0.57, + "learning_rate": 7.2137373737373735e-06, + "loss": 0.4286, + "step": 14300 + }, + { + "epoch": 0.57, + "learning_rate": 7.2086868686868695e-06, + "loss": 0.428, + "step": 14325 + }, + { + "epoch": 0.58, + "learning_rate": 7.203636363636364e-06, + "loss": 0.4405, + "step": 14350 + }, + { + "epoch": 0.58, + "learning_rate": 7.198585858585859e-06, + "loss": 0.4454, + "step": 14375 + }, + { + "epoch": 0.58, + "learning_rate": 7.193535353535353e-06, + "loss": 0.4483, + "step": 14400 + }, + { + "epoch": 0.58, + "learning_rate": 7.188484848484849e-06, + "loss": 0.4449, + "step": 14425 + }, + { + "epoch": 0.58, + "learning_rate": 7.183434343434344e-06, + "loss": 0.4274, + "step": 14450 + }, + { + "epoch": 0.58, + "learning_rate": 7.178383838383839e-06, + "loss": 0.4208, + "step": 14475 + }, + { + "epoch": 0.58, + "learning_rate": 7.173333333333335e-06, + "loss": 0.4435, + "step": 14500 + }, + { + "epoch": 0.58, + "learning_rate": 7.168282828282829e-06, + "loss": 0.4329, + "step": 14525 + }, + { + "epoch": 0.58, + "learning_rate": 7.163232323232324e-06, + "loss": 0.3995, + "step": 14550 + }, + { + "epoch": 0.58, + "learning_rate": 7.158181818181818e-06, + "loss": 0.4609, + "step": 14575 + }, + { + "epoch": 0.59, + "learning_rate": 7.153131313131314e-06, + "loss": 0.4638, + "step": 14600 + }, + { + "epoch": 0.59, + "learning_rate": 7.148080808080809e-06, + "loss": 0.4249, + "step": 14625 + }, + { + "epoch": 0.59, + "learning_rate": 7.143030303030304e-06, + "loss": 0.4154, + "step": 14650 + }, + { + "epoch": 0.59, + "learning_rate": 7.138181818181819e-06, + "loss": 0.4388, + "step": 14675 + }, + { + "epoch": 0.59, + "learning_rate": 7.133131313131314e-06, + "loss": 0.4264, + "step": 14700 + }, + { + "epoch": 0.59, + "learning_rate": 7.128080808080808e-06, + "loss": 0.4408, + "step": 14725 + }, + { + "epoch": 0.59, + "learning_rate": 7.123030303030304e-06, + "loss": 0.4335, + "step": 14750 + }, + { + "epoch": 0.59, + "learning_rate": 7.117979797979798e-06, + "loss": 0.4502, + "step": 14775 + }, + { + "epoch": 0.59, + "learning_rate": 7.1129292929292935e-06, + "loss": 0.454, + "step": 14800 + }, + { + "epoch": 0.59, + "learning_rate": 7.107878787878788e-06, + "loss": 0.4547, + "step": 14825 + }, + { + "epoch": 0.6, + "learning_rate": 7.102828282828284e-06, + "loss": 0.4403, + "step": 14850 + }, + { + "epoch": 0.6, + "learning_rate": 7.097777777777778e-06, + "loss": 0.4273, + "step": 14875 + }, + { + "epoch": 0.6, + "learning_rate": 7.092727272727273e-06, + "loss": 0.4314, + "step": 14900 + }, + { + "epoch": 0.6, + "learning_rate": 7.0876767676767675e-06, + "loss": 0.4355, + "step": 14925 + }, + { + "epoch": 0.6, + "learning_rate": 7.0826262626262635e-06, + "loss": 0.4381, + "step": 14950 + }, + { + "epoch": 0.6, + "learning_rate": 7.077575757575759e-06, + "loss": 0.4259, + "step": 14975 + }, + { + "epoch": 0.6, + "learning_rate": 7.072525252525253e-06, + "loss": 0.4312, + "step": 15000 + }, + { + "epoch": 0.6, + "eval_loss": 0.4432617723941803, + "eval_runtime": 329.2864, + "eval_samples_per_second": 15.2, + "eval_steps_per_second": 1.901, + "eval_wer": 36.87795154132751, + "step": 15000 + }, + { + "epoch": 0.6, + "learning_rate": 7.067474747474748e-06, + "loss": 0.4423, + "step": 15025 + }, + { + "epoch": 0.6, + "learning_rate": 7.062424242424243e-06, + "loss": 0.4302, + "step": 15050 + }, + { + "epoch": 0.6, + "learning_rate": 7.057373737373738e-06, + "loss": 0.441, + "step": 15075 + }, + { + "epoch": 0.61, + "learning_rate": 7.052323232323233e-06, + "loss": 0.4281, + "step": 15100 + }, + { + "epoch": 0.61, + "learning_rate": 7.047272727272728e-06, + "loss": 0.4295, + "step": 15125 + }, + { + "epoch": 0.61, + "learning_rate": 7.042222222222223e-06, + "loss": 0.4268, + "step": 15150 + }, + { + "epoch": 0.61, + "learning_rate": 7.037171717171718e-06, + "loss": 0.4347, + "step": 15175 + }, + { + "epoch": 0.61, + "learning_rate": 7.032121212121212e-06, + "loss": 0.4463, + "step": 15200 + }, + { + "epoch": 0.61, + "learning_rate": 7.0270707070707075e-06, + "loss": 0.425, + "step": 15225 + }, + { + "epoch": 0.61, + "learning_rate": 7.022020202020202e-06, + "loss": 0.4393, + "step": 15250 + }, + { + "epoch": 0.61, + "learning_rate": 7.016969696969698e-06, + "loss": 0.4356, + "step": 15275 + }, + { + "epoch": 0.61, + "learning_rate": 7.011919191919192e-06, + "loss": 0.4228, + "step": 15300 + }, + { + "epoch": 0.61, + "learning_rate": 7.006868686868687e-06, + "loss": 0.428, + "step": 15325 + }, + { + "epoch": 0.62, + "learning_rate": 7.0018181818181815e-06, + "loss": 0.4418, + "step": 15350 + }, + { + "epoch": 0.62, + "learning_rate": 6.9967676767676775e-06, + "loss": 0.4257, + "step": 15375 + }, + { + "epoch": 0.62, + "learning_rate": 6.991717171717173e-06, + "loss": 0.4362, + "step": 15400 + }, + { + "epoch": 0.62, + "learning_rate": 6.986666666666667e-06, + "loss": 0.4321, + "step": 15425 + }, + { + "epoch": 0.62, + "learning_rate": 6.981616161616163e-06, + "loss": 0.4244, + "step": 15450 + }, + { + "epoch": 0.62, + "learning_rate": 6.976565656565657e-06, + "loss": 0.4297, + "step": 15475 + }, + { + "epoch": 0.62, + "learning_rate": 6.971515151515152e-06, + "loss": 0.4245, + "step": 15500 + }, + { + "epoch": 0.62, + "learning_rate": 6.966464646464647e-06, + "loss": 0.426, + "step": 15525 + }, + { + "epoch": 0.62, + "learning_rate": 6.961414141414143e-06, + "loss": 0.4475, + "step": 15550 + }, + { + "epoch": 0.62, + "learning_rate": 6.956363636363637e-06, + "loss": 0.4407, + "step": 15575 + }, + { + "epoch": 0.63, + "learning_rate": 6.951313131313132e-06, + "loss": 0.4298, + "step": 15600 + }, + { + "epoch": 0.63, + "learning_rate": 6.9462626262626264e-06, + "loss": 0.4157, + "step": 15625 + }, + { + "epoch": 0.63, + "learning_rate": 6.9412121212121216e-06, + "loss": 0.4288, + "step": 15650 + }, + { + "epoch": 0.63, + "learning_rate": 6.936161616161617e-06, + "loss": 0.4294, + "step": 15675 + }, + { + "epoch": 0.63, + "learning_rate": 6.931111111111112e-06, + "loss": 0.4231, + "step": 15700 + }, + { + "epoch": 0.63, + "learning_rate": 6.926060606060606e-06, + "loss": 0.4392, + "step": 15725 + }, + { + "epoch": 0.63, + "learning_rate": 6.921010101010101e-06, + "loss": 0.4144, + "step": 15750 + }, + { + "epoch": 0.63, + "learning_rate": 6.915959595959596e-06, + "loss": 0.4438, + "step": 15775 + }, + { + "epoch": 0.63, + "learning_rate": 6.910909090909092e-06, + "loss": 0.4181, + "step": 15800 + }, + { + "epoch": 0.63, + "learning_rate": 6.905858585858587e-06, + "loss": 0.4177, + "step": 15825 + }, + { + "epoch": 0.64, + "learning_rate": 6.900808080808081e-06, + "loss": 0.4319, + "step": 15850 + }, + { + "epoch": 0.64, + "learning_rate": 6.895757575757577e-06, + "loss": 0.432, + "step": 15875 + }, + { + "epoch": 0.64, + "learning_rate": 6.890707070707071e-06, + "loss": 0.4332, + "step": 15900 + }, + { + "epoch": 0.64, + "learning_rate": 6.8856565656565664e-06, + "loss": 0.4174, + "step": 15925 + }, + { + "epoch": 0.64, + "learning_rate": 6.880606060606061e-06, + "loss": 0.4543, + "step": 15950 + }, + { + "epoch": 0.64, + "learning_rate": 6.875555555555557e-06, + "loss": 0.4187, + "step": 15975 + }, + { + "epoch": 0.64, + "learning_rate": 6.870505050505051e-06, + "loss": 0.4371, + "step": 16000 + }, + { + "epoch": 0.64, + "learning_rate": 6.865454545454546e-06, + "loss": 0.4377, + "step": 16025 + }, + { + "epoch": 0.64, + "learning_rate": 6.8604040404040405e-06, + "loss": 0.4432, + "step": 16050 + }, + { + "epoch": 0.64, + "learning_rate": 6.8553535353535365e-06, + "loss": 0.4261, + "step": 16075 + }, + { + "epoch": 0.65, + "learning_rate": 6.850303030303031e-06, + "loss": 0.436, + "step": 16100 + }, + { + "epoch": 0.65, + "learning_rate": 6.845252525252526e-06, + "loss": 0.4192, + "step": 16125 + }, + { + "epoch": 0.65, + "learning_rate": 6.84020202020202e-06, + "loss": 0.4363, + "step": 16150 + }, + { + "epoch": 0.65, + "learning_rate": 6.835151515151515e-06, + "loss": 0.4336, + "step": 16175 + }, + { + "epoch": 0.65, + "learning_rate": 6.8301010101010105e-06, + "loss": 0.4451, + "step": 16200 + }, + { + "epoch": 0.65, + "learning_rate": 6.825050505050506e-06, + "loss": 0.4131, + "step": 16225 + }, + { + "epoch": 0.65, + "learning_rate": 6.820000000000001e-06, + "loss": 0.4384, + "step": 16250 + }, + { + "epoch": 0.65, + "learning_rate": 6.814949494949495e-06, + "loss": 0.4177, + "step": 16275 + }, + { + "epoch": 0.65, + "learning_rate": 6.809898989898991e-06, + "loss": 0.4355, + "step": 16300 + }, + { + "epoch": 0.65, + "learning_rate": 6.804848484848485e-06, + "loss": 0.4168, + "step": 16325 + }, + { + "epoch": 0.66, + "learning_rate": 6.7997979797979805e-06, + "loss": 0.4193, + "step": 16350 + }, + { + "epoch": 0.66, + "learning_rate": 6.794747474747475e-06, + "loss": 0.417, + "step": 16375 + }, + { + "epoch": 0.66, + "learning_rate": 6.789696969696971e-06, + "loss": 0.4337, + "step": 16400 + }, + { + "epoch": 0.66, + "learning_rate": 6.784646464646465e-06, + "loss": 0.4253, + "step": 16425 + }, + { + "epoch": 0.66, + "learning_rate": 6.77959595959596e-06, + "loss": 0.421, + "step": 16450 + }, + { + "epoch": 0.66, + "learning_rate": 6.7745454545454545e-06, + "loss": 0.431, + "step": 16475 + }, + { + "epoch": 0.66, + "learning_rate": 6.7694949494949505e-06, + "loss": 0.4143, + "step": 16500 + }, + { + "epoch": 0.66, + "learning_rate": 6.764444444444445e-06, + "loss": 0.424, + "step": 16525 + }, + { + "epoch": 0.66, + "learning_rate": 6.75939393939394e-06, + "loss": 0.4172, + "step": 16550 + }, + { + "epoch": 0.66, + "learning_rate": 6.754343434343434e-06, + "loss": 0.434, + "step": 16575 + }, + { + "epoch": 0.67, + "learning_rate": 6.74929292929293e-06, + "loss": 0.4295, + "step": 16600 + }, + { + "epoch": 0.67, + "learning_rate": 6.7442424242424245e-06, + "loss": 0.4117, + "step": 16625 + }, + { + "epoch": 0.67, + "learning_rate": 6.73919191919192e-06, + "loss": 0.4188, + "step": 16650 + }, + { + "epoch": 0.67, + "learning_rate": 6.734141414141415e-06, + "loss": 0.4356, + "step": 16675 + }, + { + "epoch": 0.67, + "learning_rate": 6.72909090909091e-06, + "loss": 0.4422, + "step": 16700 + }, + { + "epoch": 0.67, + "learning_rate": 6.724040404040405e-06, + "loss": 0.4236, + "step": 16725 + }, + { + "epoch": 0.67, + "learning_rate": 6.718989898989899e-06, + "loss": 0.4122, + "step": 16750 + }, + { + "epoch": 0.67, + "learning_rate": 6.714141414141415e-06, + "loss": 0.4019, + "step": 16775 + }, + { + "epoch": 0.67, + "learning_rate": 6.709090909090909e-06, + "loss": 0.4294, + "step": 16800 + }, + { + "epoch": 0.67, + "learning_rate": 6.704040404040405e-06, + "loss": 0.425, + "step": 16825 + }, + { + "epoch": 0.68, + "learning_rate": 6.6989898989899e-06, + "loss": 0.4389, + "step": 16850 + }, + { + "epoch": 0.68, + "learning_rate": 6.693939393939395e-06, + "loss": 0.4441, + "step": 16875 + }, + { + "epoch": 0.68, + "learning_rate": 6.688888888888889e-06, + "loss": 0.4154, + "step": 16900 + }, + { + "epoch": 0.68, + "learning_rate": 6.683838383838385e-06, + "loss": 0.4263, + "step": 16925 + }, + { + "epoch": 0.68, + "learning_rate": 6.678787878787879e-06, + "loss": 0.4035, + "step": 16950 + }, + { + "epoch": 0.68, + "learning_rate": 6.6737373737373745e-06, + "loss": 0.4229, + "step": 16975 + }, + { + "epoch": 0.68, + "learning_rate": 6.668686868686869e-06, + "loss": 0.4078, + "step": 17000 + }, + { + "epoch": 0.68, + "learning_rate": 6.663636363636365e-06, + "loss": 0.4294, + "step": 17025 + }, + { + "epoch": 0.68, + "learning_rate": 6.658585858585859e-06, + "loss": 0.436, + "step": 17050 + }, + { + "epoch": 0.68, + "learning_rate": 6.653535353535354e-06, + "loss": 0.4341, + "step": 17075 + }, + { + "epoch": 0.69, + "learning_rate": 6.6484848484848485e-06, + "loss": 0.4185, + "step": 17100 + }, + { + "epoch": 0.69, + "learning_rate": 6.643434343434344e-06, + "loss": 0.427, + "step": 17125 + }, + { + "epoch": 0.69, + "learning_rate": 6.638383838383839e-06, + "loss": 0.4318, + "step": 17150 + }, + { + "epoch": 0.69, + "learning_rate": 6.633333333333334e-06, + "loss": 0.4168, + "step": 17175 + }, + { + "epoch": 0.69, + "learning_rate": 6.628282828282829e-06, + "loss": 0.424, + "step": 17200 + }, + { + "epoch": 0.69, + "learning_rate": 6.623232323232323e-06, + "loss": 0.4291, + "step": 17225 + }, + { + "epoch": 0.69, + "learning_rate": 6.618181818181819e-06, + "loss": 0.4211, + "step": 17250 + }, + { + "epoch": 0.69, + "learning_rate": 6.613131313131314e-06, + "loss": 0.4157, + "step": 17275 + }, + { + "epoch": 0.69, + "learning_rate": 6.608080808080809e-06, + "loss": 0.4334, + "step": 17300 + }, + { + "epoch": 0.69, + "learning_rate": 6.603030303030303e-06, + "loss": 0.4164, + "step": 17325 + }, + { + "epoch": 0.7, + "learning_rate": 6.597979797979799e-06, + "loss": 0.4346, + "step": 17350 + }, + { + "epoch": 0.7, + "learning_rate": 6.592929292929293e-06, + "loss": 0.4317, + "step": 17375 + }, + { + "epoch": 0.7, + "learning_rate": 6.5878787878787885e-06, + "loss": 0.439, + "step": 17400 + }, + { + "epoch": 0.7, + "learning_rate": 6.582828282828283e-06, + "loss": 0.4302, + "step": 17425 + }, + { + "epoch": 0.7, + "learning_rate": 6.577777777777779e-06, + "loss": 0.4337, + "step": 17450 + }, + { + "epoch": 0.7, + "learning_rate": 6.572727272727273e-06, + "loss": 0.4033, + "step": 17475 + }, + { + "epoch": 0.7, + "learning_rate": 6.567676767676768e-06, + "loss": 0.4208, + "step": 17500 + }, + { + "epoch": 0.7, + "eval_loss": 0.43082931637763977, + "eval_runtime": 307.9947, + "eval_samples_per_second": 16.25, + "eval_steps_per_second": 2.033, + "eval_wer": 32.371437385794636, + "step": 17500 + }, + { + "epoch": 0.7, + "learning_rate": 6.5626262626262625e-06, + "loss": 0.4161, + "step": 17525 + }, + { + "epoch": 0.7, + "learning_rate": 6.5575757575757585e-06, + "loss": 0.4151, + "step": 17550 + }, + { + "epoch": 0.7, + "learning_rate": 6.552525252525253e-06, + "loss": 0.4389, + "step": 17575 + }, + { + "epoch": 0.71, + "learning_rate": 6.547474747474748e-06, + "loss": 0.4413, + "step": 17600 + }, + { + "epoch": 0.71, + "learning_rate": 6.542424242424243e-06, + "loss": 0.4208, + "step": 17625 + }, + { + "epoch": 0.71, + "learning_rate": 6.537373737373737e-06, + "loss": 0.4272, + "step": 17650 + }, + { + "epoch": 0.71, + "learning_rate": 6.532323232323233e-06, + "loss": 0.4095, + "step": 17675 + }, + { + "epoch": 0.71, + "learning_rate": 6.527272727272728e-06, + "loss": 0.431, + "step": 17700 + }, + { + "epoch": 0.71, + "learning_rate": 6.522222222222223e-06, + "loss": 0.4285, + "step": 17725 + }, + { + "epoch": 0.71, + "learning_rate": 6.517171717171717e-06, + "loss": 0.4086, + "step": 17750 + }, + { + "epoch": 0.71, + "learning_rate": 6.512121212121213e-06, + "loss": 0.435, + "step": 17775 + }, + { + "epoch": 0.71, + "learning_rate": 6.507070707070707e-06, + "loss": 0.4134, + "step": 17800 + }, + { + "epoch": 0.71, + "learning_rate": 6.5020202020202026e-06, + "loss": 0.4181, + "step": 17825 + }, + { + "epoch": 0.72, + "learning_rate": 6.496969696969697e-06, + "loss": 0.3998, + "step": 17850 + }, + { + "epoch": 0.72, + "learning_rate": 6.491919191919193e-06, + "loss": 0.4095, + "step": 17875 + }, + { + "epoch": 0.72, + "learning_rate": 6.486868686868687e-06, + "loss": 0.4344, + "step": 17900 + }, + { + "epoch": 0.72, + "learning_rate": 6.481818181818182e-06, + "loss": 0.4049, + "step": 17925 + }, + { + "epoch": 0.72, + "learning_rate": 6.476767676767677e-06, + "loss": 0.4204, + "step": 17950 + }, + { + "epoch": 0.72, + "learning_rate": 6.4717171717171726e-06, + "loss": 0.4377, + "step": 17975 + }, + { + "epoch": 0.72, + "learning_rate": 6.466666666666667e-06, + "loss": 0.4247, + "step": 18000 + }, + { + "epoch": 0.72, + "learning_rate": 6.461616161616162e-06, + "loss": 0.4249, + "step": 18025 + }, + { + "epoch": 0.72, + "learning_rate": 6.456565656565658e-06, + "loss": 0.4067, + "step": 18050 + }, + { + "epoch": 0.72, + "learning_rate": 6.451515151515152e-06, + "loss": 0.4149, + "step": 18075 + }, + { + "epoch": 0.73, + "learning_rate": 6.4464646464646474e-06, + "loss": 0.4059, + "step": 18100 + }, + { + "epoch": 0.73, + "learning_rate": 6.441414141414142e-06, + "loss": 0.4207, + "step": 18125 + }, + { + "epoch": 0.73, + "learning_rate": 6.436363636363637e-06, + "loss": 0.4135, + "step": 18150 + }, + { + "epoch": 0.73, + "learning_rate": 6.431313131313132e-06, + "loss": 0.4335, + "step": 18175 + }, + { + "epoch": 0.73, + "learning_rate": 6.426262626262627e-06, + "loss": 0.423, + "step": 18200 + }, + { + "epoch": 0.73, + "learning_rate": 6.4212121212121215e-06, + "loss": 0.4142, + "step": 18225 + }, + { + "epoch": 0.73, + "learning_rate": 6.416161616161617e-06, + "loss": 0.4417, + "step": 18250 + }, + { + "epoch": 0.73, + "learning_rate": 6.411111111111111e-06, + "loss": 0.424, + "step": 18275 + }, + { + "epoch": 0.73, + "learning_rate": 6.406060606060607e-06, + "loss": 0.4286, + "step": 18300 + }, + { + "epoch": 0.73, + "learning_rate": 6.401010101010101e-06, + "loss": 0.4143, + "step": 18325 + }, + { + "epoch": 0.74, + "learning_rate": 6.395959595959596e-06, + "loss": 0.4154, + "step": 18350 + }, + { + "epoch": 0.74, + "learning_rate": 6.390909090909091e-06, + "loss": 0.4065, + "step": 18375 + }, + { + "epoch": 0.74, + "learning_rate": 6.385858585858587e-06, + "loss": 0.4251, + "step": 18400 + }, + { + "epoch": 0.74, + "learning_rate": 6.380808080808081e-06, + "loss": 0.4203, + "step": 18425 + }, + { + "epoch": 0.74, + "learning_rate": 6.375757575757576e-06, + "loss": 0.3992, + "step": 18450 + }, + { + "epoch": 0.74, + "learning_rate": 6.370707070707072e-06, + "loss": 0.4243, + "step": 18475 + }, + { + "epoch": 0.74, + "learning_rate": 6.365656565656566e-06, + "loss": 0.4465, + "step": 18500 + }, + { + "epoch": 0.74, + "learning_rate": 6.3606060606060615e-06, + "loss": 0.4089, + "step": 18525 + }, + { + "epoch": 0.74, + "learning_rate": 6.355555555555556e-06, + "loss": 0.4242, + "step": 18550 + }, + { + "epoch": 0.74, + "learning_rate": 6.350505050505052e-06, + "loss": 0.4295, + "step": 18575 + }, + { + "epoch": 0.75, + "learning_rate": 6.345454545454546e-06, + "loss": 0.4053, + "step": 18600 + }, + { + "epoch": 0.75, + "learning_rate": 6.340404040404041e-06, + "loss": 0.4106, + "step": 18625 + }, + { + "epoch": 0.75, + "learning_rate": 6.3353535353535355e-06, + "loss": 0.4287, + "step": 18650 + }, + { + "epoch": 0.75, + "learning_rate": 6.330303030303031e-06, + "loss": 0.4265, + "step": 18675 + }, + { + "epoch": 0.75, + "learning_rate": 6.325252525252526e-06, + "loss": 0.4328, + "step": 18700 + }, + { + "epoch": 0.75, + "learning_rate": 6.320202020202021e-06, + "loss": 0.4071, + "step": 18725 + }, + { + "epoch": 0.75, + "learning_rate": 6.315151515151515e-06, + "loss": 0.4214, + "step": 18750 + }, + { + "epoch": 0.75, + "learning_rate": 6.31010101010101e-06, + "loss": 0.4108, + "step": 18775 + }, + { + "epoch": 0.75, + "learning_rate": 6.305050505050505e-06, + "loss": 0.4262, + "step": 18800 + }, + { + "epoch": 0.75, + "learning_rate": 6.300000000000001e-06, + "loss": 0.3884, + "step": 18825 + }, + { + "epoch": 0.76, + "learning_rate": 6.294949494949495e-06, + "loss": 0.411, + "step": 18850 + }, + { + "epoch": 0.76, + "learning_rate": 6.28989898989899e-06, + "loss": 0.4229, + "step": 18875 + }, + { + "epoch": 0.76, + "learning_rate": 6.284848484848486e-06, + "loss": 0.4252, + "step": 18900 + }, + { + "epoch": 0.76, + "learning_rate": 6.27979797979798e-06, + "loss": 0.4134, + "step": 18925 + }, + { + "epoch": 0.76, + "learning_rate": 6.2747474747474755e-06, + "loss": 0.4265, + "step": 18950 + }, + { + "epoch": 0.76, + "learning_rate": 6.26969696969697e-06, + "loss": 0.395, + "step": 18975 + }, + { + "epoch": 0.76, + "learning_rate": 6.264646464646466e-06, + "loss": 0.417, + "step": 19000 + }, + { + "epoch": 0.76, + "learning_rate": 6.25959595959596e-06, + "loss": 0.4259, + "step": 19025 + }, + { + "epoch": 0.76, + "learning_rate": 6.254545454545455e-06, + "loss": 0.4009, + "step": 19050 + }, + { + "epoch": 0.76, + "learning_rate": 6.2494949494949496e-06, + "loss": 0.399, + "step": 19075 + }, + { + "epoch": 0.77, + "learning_rate": 6.2444444444444456e-06, + "loss": 0.4098, + "step": 19100 + }, + { + "epoch": 0.77, + "learning_rate": 6.23939393939394e-06, + "loss": 0.4192, + "step": 19125 + }, + { + "epoch": 0.77, + "learning_rate": 6.2345454545454555e-06, + "loss": 0.4068, + "step": 19150 + }, + { + "epoch": 0.77, + "learning_rate": 6.22949494949495e-06, + "loss": 0.426, + "step": 19175 + }, + { + "epoch": 0.77, + "learning_rate": 6.224444444444445e-06, + "loss": 0.4072, + "step": 19200 + }, + { + "epoch": 0.77, + "learning_rate": 6.219393939393939e-06, + "loss": 0.4181, + "step": 19225 + }, + { + "epoch": 0.77, + "learning_rate": 6.214343434343435e-06, + "loss": 0.4127, + "step": 19250 + }, + { + "epoch": 0.77, + "learning_rate": 6.2092929292929295e-06, + "loss": 0.4244, + "step": 19275 + }, + { + "epoch": 0.77, + "learning_rate": 6.204242424242425e-06, + "loss": 0.4168, + "step": 19300 + }, + { + "epoch": 0.77, + "learning_rate": 6.199191919191919e-06, + "loss": 0.4112, + "step": 19325 + }, + { + "epoch": 0.78, + "learning_rate": 6.194141414141415e-06, + "loss": 0.4162, + "step": 19350 + }, + { + "epoch": 0.78, + "learning_rate": 6.18909090909091e-06, + "loss": 0.3985, + "step": 19375 + }, + { + "epoch": 0.78, + "learning_rate": 6.184040404040404e-06, + "loss": 0.428, + "step": 19400 + }, + { + "epoch": 0.78, + "learning_rate": 6.1789898989899e-06, + "loss": 0.4175, + "step": 19425 + }, + { + "epoch": 0.78, + "learning_rate": 6.173939393939395e-06, + "loss": 0.4138, + "step": 19450 + }, + { + "epoch": 0.78, + "learning_rate": 6.16888888888889e-06, + "loss": 0.3978, + "step": 19475 + }, + { + "epoch": 0.78, + "learning_rate": 6.163838383838384e-06, + "loss": 0.4213, + "step": 19500 + }, + { + "epoch": 0.78, + "learning_rate": 6.15878787878788e-06, + "loss": 0.408, + "step": 19525 + }, + { + "epoch": 0.78, + "learning_rate": 6.153737373737374e-06, + "loss": 0.4107, + "step": 19550 + }, + { + "epoch": 0.78, + "learning_rate": 6.1486868686868695e-06, + "loss": 0.4061, + "step": 19575 + }, + { + "epoch": 0.79, + "learning_rate": 6.143636363636364e-06, + "loss": 0.4142, + "step": 19600 + }, + { + "epoch": 0.79, + "learning_rate": 6.138585858585859e-06, + "loss": 0.4182, + "step": 19625 + }, + { + "epoch": 0.79, + "learning_rate": 6.133535353535354e-06, + "loss": 0.4174, + "step": 19650 + }, + { + "epoch": 0.79, + "learning_rate": 6.128484848484849e-06, + "loss": 0.4284, + "step": 19675 + }, + { + "epoch": 0.79, + "learning_rate": 6.1234343434343435e-06, + "loss": 0.4023, + "step": 19700 + }, + { + "epoch": 0.79, + "learning_rate": 6.118383838383839e-06, + "loss": 0.4249, + "step": 19725 + }, + { + "epoch": 0.79, + "learning_rate": 6.113333333333333e-06, + "loss": 0.4049, + "step": 19750 + }, + { + "epoch": 0.79, + "learning_rate": 6.108282828282829e-06, + "loss": 0.4137, + "step": 19775 + }, + { + "epoch": 0.79, + "learning_rate": 6.103232323232324e-06, + "loss": 0.4084, + "step": 19800 + }, + { + "epoch": 0.79, + "learning_rate": 6.098181818181818e-06, + "loss": 0.4209, + "step": 19825 + }, + { + "epoch": 0.8, + "learning_rate": 6.093131313131314e-06, + "loss": 0.4114, + "step": 19850 + }, + { + "epoch": 0.8, + "learning_rate": 6.088080808080809e-06, + "loss": 0.4121, + "step": 19875 + }, + { + "epoch": 0.8, + "learning_rate": 6.083030303030304e-06, + "loss": 0.4279, + "step": 19900 + }, + { + "epoch": 0.8, + "learning_rate": 6.077979797979798e-06, + "loss": 0.4275, + "step": 19925 + }, + { + "epoch": 0.8, + "learning_rate": 6.072929292929294e-06, + "loss": 0.4075, + "step": 19950 + }, + { + "epoch": 0.8, + "learning_rate": 6.067878787878788e-06, + "loss": 0.4179, + "step": 19975 + }, + { + "epoch": 0.8, + "learning_rate": 6.0628282828282836e-06, + "loss": 0.4089, + "step": 20000 + }, + { + "epoch": 0.8, + "eval_loss": 0.4228692054748535, + "eval_runtime": 313.9546, + "eval_samples_per_second": 15.942, + "eval_steps_per_second": 1.994, + "eval_wer": 33.41085455278957, + "step": 20000 + }, + { + "epoch": 0.8, + "learning_rate": 6.057777777777778e-06, + "loss": 0.4367, + "step": 20025 + }, + { + "epoch": 0.8, + "learning_rate": 6.052727272727274e-06, + "loss": 0.4269, + "step": 20050 + }, + { + "epoch": 0.8, + "learning_rate": 6.047676767676768e-06, + "loss": 0.4196, + "step": 20075 + }, + { + "epoch": 0.81, + "learning_rate": 6.042626262626263e-06, + "loss": 0.4006, + "step": 20100 + }, + { + "epoch": 0.81, + "learning_rate": 6.0375757575757576e-06, + "loss": 0.4113, + "step": 20125 + }, + { + "epoch": 0.81, + "learning_rate": 6.032525252525253e-06, + "loss": 0.413, + "step": 20150 + }, + { + "epoch": 0.81, + "learning_rate": 6.027474747474748e-06, + "loss": 0.4234, + "step": 20175 + }, + { + "epoch": 0.81, + "learning_rate": 6.022424242424243e-06, + "loss": 0.424, + "step": 20200 + }, + { + "epoch": 0.81, + "learning_rate": 6.017373737373737e-06, + "loss": 0.4187, + "step": 20225 + }, + { + "epoch": 0.81, + "learning_rate": 6.0123232323232324e-06, + "loss": 0.4066, + "step": 20250 + }, + { + "epoch": 0.81, + "learning_rate": 6.0072727272727284e-06, + "loss": 0.4126, + "step": 20275 + }, + { + "epoch": 0.81, + "learning_rate": 6.002222222222223e-06, + "loss": 0.4026, + "step": 20300 + }, + { + "epoch": 0.82, + "learning_rate": 5.997171717171718e-06, + "loss": 0.3976, + "step": 20325 + }, + { + "epoch": 0.82, + "learning_rate": 5.992121212121212e-06, + "loss": 0.4272, + "step": 20350 + }, + { + "epoch": 0.82, + "learning_rate": 5.987070707070708e-06, + "loss": 0.4242, + "step": 20375 + }, + { + "epoch": 0.82, + "learning_rate": 5.9820202020202025e-06, + "loss": 0.4108, + "step": 20400 + }, + { + "epoch": 0.82, + "learning_rate": 5.976969696969698e-06, + "loss": 0.426, + "step": 20425 + }, + { + "epoch": 0.82, + "learning_rate": 5.971919191919192e-06, + "loss": 0.4276, + "step": 20450 + }, + { + "epoch": 0.82, + "learning_rate": 5.966868686868688e-06, + "loss": 0.4193, + "step": 20475 + }, + { + "epoch": 0.82, + "learning_rate": 5.961818181818182e-06, + "loss": 0.4073, + "step": 20500 + }, + { + "epoch": 0.82, + "learning_rate": 5.956767676767677e-06, + "loss": 0.4294, + "step": 20525 + }, + { + "epoch": 0.82, + "learning_rate": 5.951717171717172e-06, + "loss": 0.4127, + "step": 20550 + }, + { + "epoch": 0.83, + "learning_rate": 5.946666666666668e-06, + "loss": 0.4075, + "step": 20575 + }, + { + "epoch": 0.83, + "learning_rate": 5.941616161616162e-06, + "loss": 0.3962, + "step": 20600 + }, + { + "epoch": 0.83, + "learning_rate": 5.936565656565657e-06, + "loss": 0.414, + "step": 20625 + }, + { + "epoch": 0.83, + "learning_rate": 5.931515151515151e-06, + "loss": 0.4167, + "step": 20650 + }, + { + "epoch": 0.83, + "learning_rate": 5.926464646464647e-06, + "loss": 0.4155, + "step": 20675 + }, + { + "epoch": 0.83, + "learning_rate": 5.9214141414141425e-06, + "loss": 0.4072, + "step": 20700 + }, + { + "epoch": 0.83, + "learning_rate": 5.916363636363637e-06, + "loss": 0.4028, + "step": 20725 + }, + { + "epoch": 0.83, + "learning_rate": 5.911313131313132e-06, + "loss": 0.4195, + "step": 20750 + }, + { + "epoch": 0.83, + "learning_rate": 5.906262626262626e-06, + "loss": 0.4224, + "step": 20775 + }, + { + "epoch": 0.83, + "learning_rate": 5.901212121212122e-06, + "loss": 0.406, + "step": 20800 + }, + { + "epoch": 0.84, + "learning_rate": 5.8961616161616165e-06, + "loss": 0.4145, + "step": 20825 + }, + { + "epoch": 0.84, + "learning_rate": 5.891111111111112e-06, + "loss": 0.4041, + "step": 20850 + }, + { + "epoch": 0.84, + "learning_rate": 5.886060606060606e-06, + "loss": 0.4062, + "step": 20875 + }, + { + "epoch": 0.84, + "learning_rate": 5.881010101010102e-06, + "loss": 0.4046, + "step": 20900 + }, + { + "epoch": 0.84, + "learning_rate": 5.875959595959596e-06, + "loss": 0.4375, + "step": 20925 + }, + { + "epoch": 0.84, + "learning_rate": 5.870909090909091e-06, + "loss": 0.4266, + "step": 20950 + }, + { + "epoch": 0.84, + "learning_rate": 5.865858585858586e-06, + "loss": 0.4102, + "step": 20975 + }, + { + "epoch": 0.84, + "learning_rate": 5.860808080808082e-06, + "loss": 0.4138, + "step": 21000 + }, + { + "epoch": 0.84, + "learning_rate": 5.855757575757576e-06, + "loss": 0.4086, + "step": 21025 + }, + { + "epoch": 0.84, + "learning_rate": 5.850707070707071e-06, + "loss": 0.4002, + "step": 21050 + }, + { + "epoch": 0.85, + "learning_rate": 5.845656565656565e-06, + "loss": 0.3841, + "step": 21075 + }, + { + "epoch": 0.85, + "learning_rate": 5.840606060606061e-06, + "loss": 0.4017, + "step": 21100 + }, + { + "epoch": 0.85, + "learning_rate": 5.8355555555555565e-06, + "loss": 0.4092, + "step": 21125 + }, + { + "epoch": 0.85, + "learning_rate": 5.830505050505051e-06, + "loss": 0.4161, + "step": 21150 + }, + { + "epoch": 0.85, + "learning_rate": 5.825454545454546e-06, + "loss": 0.3923, + "step": 21175 + }, + { + "epoch": 0.85, + "learning_rate": 5.820404040404041e-06, + "loss": 0.4073, + "step": 21200 + }, + { + "epoch": 0.85, + "learning_rate": 5.815353535353536e-06, + "loss": 0.3931, + "step": 21225 + }, + { + "epoch": 0.85, + "learning_rate": 5.8103030303030306e-06, + "loss": 0.3999, + "step": 21250 + }, + { + "epoch": 0.85, + "learning_rate": 5.805252525252526e-06, + "loss": 0.3947, + "step": 21275 + }, + { + "epoch": 0.85, + "learning_rate": 5.80020202020202e-06, + "loss": 0.4091, + "step": 21300 + }, + { + "epoch": 0.86, + "learning_rate": 5.795151515151516e-06, + "loss": 0.3898, + "step": 21325 + }, + { + "epoch": 0.86, + "learning_rate": 5.79010101010101e-06, + "loss": 0.4089, + "step": 21350 + }, + { + "epoch": 0.86, + "learning_rate": 5.785050505050505e-06, + "loss": 0.4212, + "step": 21375 + }, + { + "epoch": 0.86, + "learning_rate": 5.78e-06, + "loss": 0.4273, + "step": 21400 + }, + { + "epoch": 0.86, + "learning_rate": 5.774949494949496e-06, + "loss": 0.422, + "step": 21425 + }, + { + "epoch": 0.86, + "learning_rate": 5.76989898989899e-06, + "loss": 0.4094, + "step": 21450 + }, + { + "epoch": 0.86, + "learning_rate": 5.764848484848485e-06, + "loss": 0.4442, + "step": 21475 + }, + { + "epoch": 0.86, + "learning_rate": 5.7597979797979794e-06, + "loss": 0.4052, + "step": 21500 + }, + { + "epoch": 0.86, + "learning_rate": 5.7547474747474754e-06, + "loss": 0.4111, + "step": 21525 + }, + { + "epoch": 0.86, + "learning_rate": 5.749696969696971e-06, + "loss": 0.417, + "step": 21550 + }, + { + "epoch": 0.87, + "learning_rate": 5.744646464646465e-06, + "loss": 0.3936, + "step": 21575 + }, + { + "epoch": 0.87, + "learning_rate": 5.739595959595961e-06, + "loss": 0.392, + "step": 21600 + }, + { + "epoch": 0.87, + "learning_rate": 5.734545454545455e-06, + "loss": 0.4233, + "step": 21625 + }, + { + "epoch": 0.87, + "learning_rate": 5.72949494949495e-06, + "loss": 0.3902, + "step": 21650 + }, + { + "epoch": 0.87, + "learning_rate": 5.724444444444445e-06, + "loss": 0.4107, + "step": 21675 + }, + { + "epoch": 0.87, + "learning_rate": 5.71939393939394e-06, + "loss": 0.4171, + "step": 21700 + }, + { + "epoch": 0.87, + "learning_rate": 5.714343434343435e-06, + "loss": 0.42, + "step": 21725 + }, + { + "epoch": 0.87, + "learning_rate": 5.70929292929293e-06, + "loss": 0.4245, + "step": 21750 + }, + { + "epoch": 0.87, + "learning_rate": 5.704242424242424e-06, + "loss": 0.417, + "step": 21775 + }, + { + "epoch": 0.87, + "learning_rate": 5.6991919191919195e-06, + "loss": 0.4052, + "step": 21800 + }, + { + "epoch": 0.88, + "learning_rate": 5.694141414141415e-06, + "loss": 0.4282, + "step": 21825 + }, + { + "epoch": 0.88, + "learning_rate": 5.68909090909091e-06, + "loss": 0.4263, + "step": 21850 + }, + { + "epoch": 0.88, + "learning_rate": 5.684040404040404e-06, + "loss": 0.4163, + "step": 21875 + }, + { + "epoch": 0.88, + "learning_rate": 5.678989898989899e-06, + "loss": 0.4095, + "step": 21900 + }, + { + "epoch": 0.88, + "learning_rate": 5.6739393939393935e-06, + "loss": 0.4134, + "step": 21925 + }, + { + "epoch": 0.88, + "learning_rate": 5.6688888888888895e-06, + "loss": 0.4124, + "step": 21950 + }, + { + "epoch": 0.88, + "learning_rate": 5.663838383838385e-06, + "loss": 0.3975, + "step": 21975 + }, + { + "epoch": 0.88, + "learning_rate": 5.658787878787879e-06, + "loss": 0.4044, + "step": 22000 + }, + { + "epoch": 0.88, + "learning_rate": 5.653737373737375e-06, + "loss": 0.3992, + "step": 22025 + }, + { + "epoch": 0.88, + "learning_rate": 5.648686868686869e-06, + "loss": 0.4173, + "step": 22050 + }, + { + "epoch": 0.89, + "learning_rate": 5.643636363636364e-06, + "loss": 0.4212, + "step": 22075 + }, + { + "epoch": 0.89, + "learning_rate": 5.638585858585859e-06, + "loss": 0.4066, + "step": 22100 + }, + { + "epoch": 0.89, + "learning_rate": 5.633535353535355e-06, + "loss": 0.4141, + "step": 22125 + }, + { + "epoch": 0.89, + "learning_rate": 5.628484848484849e-06, + "loss": 0.4004, + "step": 22150 + }, + { + "epoch": 0.89, + "learning_rate": 5.623434343434344e-06, + "loss": 0.4123, + "step": 22175 + }, + { + "epoch": 0.89, + "learning_rate": 5.618383838383838e-06, + "loss": 0.4064, + "step": 22200 + }, + { + "epoch": 0.89, + "learning_rate": 5.613333333333334e-06, + "loss": 0.4156, + "step": 22225 + }, + { + "epoch": 0.89, + "learning_rate": 5.608282828282829e-06, + "loss": 0.3922, + "step": 22250 + }, + { + "epoch": 0.89, + "learning_rate": 5.603232323232324e-06, + "loss": 0.4172, + "step": 22275 + }, + { + "epoch": 0.89, + "learning_rate": 5.598181818181818e-06, + "loss": 0.4073, + "step": 22300 + }, + { + "epoch": 0.9, + "learning_rate": 5.593131313131313e-06, + "loss": 0.3981, + "step": 22325 + }, + { + "epoch": 0.9, + "learning_rate": 5.588080808080808e-06, + "loss": 0.4175, + "step": 22350 + }, + { + "epoch": 0.9, + "learning_rate": 5.5830303030303035e-06, + "loss": 0.407, + "step": 22375 + }, + { + "epoch": 0.9, + "learning_rate": 5.577979797979799e-06, + "loss": 0.3995, + "step": 22400 + }, + { + "epoch": 0.9, + "learning_rate": 5.572929292929293e-06, + "loss": 0.4078, + "step": 22425 + }, + { + "epoch": 0.9, + "learning_rate": 5.567878787878789e-06, + "loss": 0.3822, + "step": 22450 + }, + { + "epoch": 0.9, + "learning_rate": 5.562828282828283e-06, + "loss": 0.4089, + "step": 22475 + }, + { + "epoch": 0.9, + "learning_rate": 5.557777777777778e-06, + "loss": 0.4163, + "step": 22500 + }, + { + "epoch": 0.9, + "eval_loss": 0.41425320506095886, + "eval_runtime": 313.671, + "eval_samples_per_second": 15.956, + "eval_steps_per_second": 1.996, + "eval_wer": 32.542300481739005, + "step": 22500 + }, + { + "epoch": 0.9, + "learning_rate": 5.552727272727273e-06, + "loss": 0.4018, + "step": 22525 + }, + { + "epoch": 0.9, + "learning_rate": 5.547676767676769e-06, + "loss": 0.4308, + "step": 22550 + }, + { + "epoch": 0.91, + "learning_rate": 5.542626262626263e-06, + "loss": 0.4127, + "step": 22575 + }, + { + "epoch": 0.91, + "learning_rate": 5.537575757575758e-06, + "loss": 0.4111, + "step": 22600 + }, + { + "epoch": 0.91, + "learning_rate": 5.532525252525252e-06, + "loss": 0.4069, + "step": 22625 + }, + { + "epoch": 0.91, + "learning_rate": 5.527474747474748e-06, + "loss": 0.4216, + "step": 22650 + }, + { + "epoch": 0.91, + "learning_rate": 5.522424242424243e-06, + "loss": 0.3984, + "step": 22675 + }, + { + "epoch": 0.91, + "learning_rate": 5.517373737373738e-06, + "loss": 0.3949, + "step": 22700 + }, + { + "epoch": 0.91, + "learning_rate": 5.512323232323232e-06, + "loss": 0.3936, + "step": 22725 + }, + { + "epoch": 0.91, + "learning_rate": 5.507272727272728e-06, + "loss": 0.4118, + "step": 22750 + }, + { + "epoch": 0.91, + "learning_rate": 5.5022222222222224e-06, + "loss": 0.3797, + "step": 22775 + }, + { + "epoch": 0.91, + "learning_rate": 5.497171717171718e-06, + "loss": 0.4043, + "step": 22800 + }, + { + "epoch": 0.92, + "learning_rate": 5.492323232323232e-06, + "loss": 0.405, + "step": 22825 + }, + { + "epoch": 0.92, + "learning_rate": 5.4872727272727275e-06, + "loss": 0.3987, + "step": 22850 + }, + { + "epoch": 0.92, + "learning_rate": 5.4822222222222235e-06, + "loss": 0.4005, + "step": 22875 + }, + { + "epoch": 0.92, + "learning_rate": 5.477171717171718e-06, + "loss": 0.4014, + "step": 22900 + }, + { + "epoch": 0.92, + "learning_rate": 5.472121212121213e-06, + "loss": 0.4098, + "step": 22925 + }, + { + "epoch": 0.92, + "learning_rate": 5.467070707070707e-06, + "loss": 0.4111, + "step": 22950 + }, + { + "epoch": 0.92, + "learning_rate": 5.462020202020203e-06, + "loss": 0.4014, + "step": 22975 + }, + { + "epoch": 0.92, + "learning_rate": 5.4569696969696975e-06, + "loss": 0.4246, + "step": 23000 + }, + { + "epoch": 0.92, + "learning_rate": 5.451919191919193e-06, + "loss": 0.4103, + "step": 23025 + }, + { + "epoch": 0.92, + "learning_rate": 5.446868686868687e-06, + "loss": 0.3985, + "step": 23050 + }, + { + "epoch": 0.93, + "learning_rate": 5.441818181818183e-06, + "loss": 0.4221, + "step": 23075 + }, + { + "epoch": 0.93, + "learning_rate": 5.436767676767677e-06, + "loss": 0.4059, + "step": 23100 + }, + { + "epoch": 0.93, + "learning_rate": 5.431717171717172e-06, + "loss": 0.4058, + "step": 23125 + }, + { + "epoch": 0.93, + "learning_rate": 5.426666666666667e-06, + "loss": 0.41, + "step": 23150 + }, + { + "epoch": 0.93, + "learning_rate": 5.421616161616162e-06, + "loss": 0.4012, + "step": 23175 + }, + { + "epoch": 0.93, + "learning_rate": 5.416565656565657e-06, + "loss": 0.4175, + "step": 23200 + }, + { + "epoch": 0.93, + "learning_rate": 5.411515151515152e-06, + "loss": 0.3962, + "step": 23225 + }, + { + "epoch": 0.93, + "learning_rate": 5.406464646464646e-06, + "loss": 0.3994, + "step": 23250 + }, + { + "epoch": 0.93, + "learning_rate": 5.4014141414141415e-06, + "loss": 0.4042, + "step": 23275 + }, + { + "epoch": 0.93, + "learning_rate": 5.3963636363636375e-06, + "loss": 0.4133, + "step": 23300 + }, + { + "epoch": 0.94, + "learning_rate": 5.391313131313132e-06, + "loss": 0.3976, + "step": 23325 + }, + { + "epoch": 0.94, + "learning_rate": 5.386262626262627e-06, + "loss": 0.4217, + "step": 23350 + }, + { + "epoch": 0.94, + "learning_rate": 5.381212121212121e-06, + "loss": 0.4119, + "step": 23375 + }, + { + "epoch": 0.94, + "learning_rate": 5.376161616161617e-06, + "loss": 0.3959, + "step": 23400 + }, + { + "epoch": 0.94, + "learning_rate": 5.3711111111111115e-06, + "loss": 0.4011, + "step": 23425 + }, + { + "epoch": 0.94, + "learning_rate": 5.366060606060607e-06, + "loss": 0.4159, + "step": 23450 + }, + { + "epoch": 0.94, + "learning_rate": 5.361010101010101e-06, + "loss": 0.3831, + "step": 23475 + }, + { + "epoch": 0.94, + "learning_rate": 5.355959595959597e-06, + "loss": 0.4047, + "step": 23500 + }, + { + "epoch": 0.94, + "learning_rate": 5.350909090909091e-06, + "loss": 0.4134, + "step": 23525 + }, + { + "epoch": 0.94, + "learning_rate": 5.345858585858586e-06, + "loss": 0.4057, + "step": 23550 + }, + { + "epoch": 0.95, + "learning_rate": 5.340808080808081e-06, + "loss": 0.3774, + "step": 23575 + }, + { + "epoch": 0.95, + "learning_rate": 5.335757575757577e-06, + "loss": 0.385, + "step": 23600 + }, + { + "epoch": 0.95, + "learning_rate": 5.330707070707071e-06, + "loss": 0.4194, + "step": 23625 + }, + { + "epoch": 0.95, + "learning_rate": 5.325656565656566e-06, + "loss": 0.3963, + "step": 23650 + }, + { + "epoch": 0.95, + "learning_rate": 5.3206060606060604e-06, + "loss": 0.3942, + "step": 23675 + }, + { + "epoch": 0.95, + "learning_rate": 5.3155555555555564e-06, + "loss": 0.3933, + "step": 23700 + }, + { + "epoch": 0.95, + "learning_rate": 5.310505050505051e-06, + "loss": 0.3855, + "step": 23725 + }, + { + "epoch": 0.95, + "learning_rate": 5.305454545454546e-06, + "loss": 0.398, + "step": 23750 + }, + { + "epoch": 0.95, + "learning_rate": 5.300404040404041e-06, + "loss": 0.3858, + "step": 23775 + }, + { + "epoch": 0.95, + "learning_rate": 5.295353535353535e-06, + "loss": 0.4117, + "step": 23800 + }, + { + "epoch": 0.96, + "learning_rate": 5.290303030303031e-06, + "loss": 0.3883, + "step": 23825 + }, + { + "epoch": 0.96, + "learning_rate": 5.285252525252526e-06, + "loss": 0.4188, + "step": 23850 + }, + { + "epoch": 0.96, + "learning_rate": 5.280202020202021e-06, + "loss": 0.4152, + "step": 23875 + }, + { + "epoch": 0.96, + "learning_rate": 5.275151515151515e-06, + "loss": 0.417, + "step": 23900 + }, + { + "epoch": 0.96, + "learning_rate": 5.270101010101011e-06, + "loss": 0.3981, + "step": 23925 + }, + { + "epoch": 0.96, + "learning_rate": 5.265050505050505e-06, + "loss": 0.3862, + "step": 23950 + }, + { + "epoch": 0.96, + "learning_rate": 5.2600000000000005e-06, + "loss": 0.4005, + "step": 23975 + }, + { + "epoch": 0.96, + "learning_rate": 5.254949494949495e-06, + "loss": 0.3917, + "step": 24000 + }, + { + "epoch": 0.96, + "learning_rate": 5.249898989898991e-06, + "loss": 0.4012, + "step": 24025 + }, + { + "epoch": 0.96, + "learning_rate": 5.244848484848485e-06, + "loss": 0.4039, + "step": 24050 + }, + { + "epoch": 0.97, + "learning_rate": 5.23979797979798e-06, + "loss": 0.4166, + "step": 24075 + }, + { + "epoch": 0.97, + "learning_rate": 5.2347474747474745e-06, + "loss": 0.3985, + "step": 24100 + }, + { + "epoch": 0.97, + "learning_rate": 5.2296969696969705e-06, + "loss": 0.3946, + "step": 24125 + }, + { + "epoch": 0.97, + "learning_rate": 5.224646464646465e-06, + "loss": 0.4177, + "step": 24150 + }, + { + "epoch": 0.97, + "learning_rate": 5.21959595959596e-06, + "loss": 0.4052, + "step": 24175 + }, + { + "epoch": 0.97, + "learning_rate": 5.214545454545455e-06, + "loss": 0.4122, + "step": 24200 + }, + { + "epoch": 0.97, + "learning_rate": 5.20949494949495e-06, + "loss": 0.3905, + "step": 24225 + }, + { + "epoch": 0.97, + "learning_rate": 5.204444444444445e-06, + "loss": 0.4207, + "step": 24250 + }, + { + "epoch": 0.97, + "learning_rate": 5.19939393939394e-06, + "loss": 0.4138, + "step": 24275 + }, + { + "epoch": 0.97, + "learning_rate": 5.194343434343435e-06, + "loss": 0.3948, + "step": 24300 + }, + { + "epoch": 0.98, + "learning_rate": 5.189292929292929e-06, + "loss": 0.4039, + "step": 24325 + }, + { + "epoch": 0.98, + "learning_rate": 5.184242424242425e-06, + "loss": 0.3919, + "step": 24350 + }, + { + "epoch": 0.98, + "learning_rate": 5.179191919191919e-06, + "loss": 0.4047, + "step": 24375 + }, + { + "epoch": 0.98, + "learning_rate": 5.1741414141414145e-06, + "loss": 0.4308, + "step": 24400 + }, + { + "epoch": 0.98, + "learning_rate": 5.169090909090909e-06, + "loss": 0.3794, + "step": 24425 + }, + { + "epoch": 0.98, + "learning_rate": 5.164040404040405e-06, + "loss": 0.3918, + "step": 24450 + }, + { + "epoch": 0.98, + "learning_rate": 5.158989898989899e-06, + "loss": 0.4171, + "step": 24475 + }, + { + "epoch": 0.98, + "learning_rate": 5.153939393939394e-06, + "loss": 0.3838, + "step": 24500 + }, + { + "epoch": 0.98, + "learning_rate": 5.1488888888888885e-06, + "loss": 0.3948, + "step": 24525 + }, + { + "epoch": 0.98, + "learning_rate": 5.1438383838383845e-06, + "loss": 0.41, + "step": 24550 + }, + { + "epoch": 0.99, + "learning_rate": 5.138787878787879e-06, + "loss": 0.3874, + "step": 24575 + }, + { + "epoch": 0.99, + "learning_rate": 5.133737373737374e-06, + "loss": 0.3965, + "step": 24600 + }, + { + "epoch": 0.99, + "learning_rate": 5.12868686868687e-06, + "loss": 0.4062, + "step": 24625 + }, + { + "epoch": 0.99, + "learning_rate": 5.123636363636364e-06, + "loss": 0.4094, + "step": 24650 + }, + { + "epoch": 0.99, + "learning_rate": 5.118585858585859e-06, + "loss": 0.3903, + "step": 24675 + }, + { + "epoch": 0.99, + "learning_rate": 5.113535353535354e-06, + "loss": 0.3958, + "step": 24700 + }, + { + "epoch": 0.99, + "learning_rate": 5.10848484848485e-06, + "loss": 0.4025, + "step": 24725 + }, + { + "epoch": 0.99, + "learning_rate": 5.103434343434344e-06, + "loss": 0.4163, + "step": 24750 + }, + { + "epoch": 0.99, + "learning_rate": 5.098383838383839e-06, + "loss": 0.4031, + "step": 24775 + }, + { + "epoch": 0.99, + "learning_rate": 5.093333333333333e-06, + "loss": 0.3995, + "step": 24800 + }, + { + "epoch": 1.0, + "learning_rate": 5.0882828282828286e-06, + "loss": 0.404, + "step": 24825 + }, + { + "epoch": 1.0, + "learning_rate": 5.083232323232324e-06, + "loss": 0.3939, + "step": 24850 + }, + { + "epoch": 1.0, + "learning_rate": 5.078181818181819e-06, + "loss": 0.402, + "step": 24875 + }, + { + "epoch": 1.0, + "learning_rate": 5.073131313131313e-06, + "loss": 0.3975, + "step": 24900 + }, + { + "epoch": 1.0, + "learning_rate": 5.068080808080808e-06, + "loss": 0.3895, + "step": 24925 + }, + { + "epoch": 1.0, + "learning_rate": 5.063030303030303e-06, + "loss": 0.3973, + "step": 24950 + }, + { + "epoch": 1.0, + "learning_rate": 5.0579797979797986e-06, + "loss": 0.3876, + "step": 24975 + }, + { + "epoch": 1.0, + "learning_rate": 5.052929292929293e-06, + "loss": 0.3831, + "step": 25000 + }, + { + "epoch": 1.0, + "eval_loss": 0.4076802432537079, + "eval_runtime": 310.8735, + "eval_samples_per_second": 16.1, + "eval_steps_per_second": 2.014, + "eval_wer": 31.695104297681482, + "step": 25000 + }, + { + "epoch": 1.0, + "learning_rate": 5.047878787878788e-06, + "loss": 0.3901, + "step": 25025 + }, + { + "epoch": 1.0, + "learning_rate": 5.042828282828284e-06, + "loss": 0.3626, + "step": 25050 + }, + { + "epoch": 1.01, + "learning_rate": 5.037777777777778e-06, + "loss": 0.4023, + "step": 25075 + }, + { + "epoch": 1.01, + "learning_rate": 5.0327272727272734e-06, + "loss": 0.3804, + "step": 25100 + }, + { + "epoch": 1.01, + "learning_rate": 5.027676767676768e-06, + "loss": 0.3772, + "step": 25125 + }, + { + "epoch": 1.01, + "learning_rate": 5.022626262626264e-06, + "loss": 0.3845, + "step": 25150 + }, + { + "epoch": 1.01, + "learning_rate": 5.017575757575758e-06, + "loss": 0.3764, + "step": 25175 + }, + { + "epoch": 1.01, + "learning_rate": 5.012525252525253e-06, + "loss": 0.38, + "step": 25200 + }, + { + "epoch": 1.01, + "learning_rate": 5.0074747474747475e-06, + "loss": 0.387, + "step": 25225 + }, + { + "epoch": 1.01, + "learning_rate": 5.0024242424242435e-06, + "loss": 0.3782, + "step": 25250 + }, + { + "epoch": 1.01, + "learning_rate": 4.997373737373738e-06, + "loss": 0.3734, + "step": 25275 + }, + { + "epoch": 1.01, + "learning_rate": 4.992323232323233e-06, + "loss": 0.4094, + "step": 25300 + }, + { + "epoch": 1.02, + "learning_rate": 4.987272727272728e-06, + "loss": 0.3939, + "step": 25325 + }, + { + "epoch": 1.02, + "learning_rate": 4.982222222222222e-06, + "loss": 0.3967, + "step": 25350 + }, + { + "epoch": 1.02, + "learning_rate": 4.9771717171717175e-06, + "loss": 0.3831, + "step": 25375 + }, + { + "epoch": 1.02, + "learning_rate": 4.972121212121213e-06, + "loss": 0.3657, + "step": 25400 + }, + { + "epoch": 1.02, + "learning_rate": 4.967070707070708e-06, + "loss": 0.3967, + "step": 25425 + }, + { + "epoch": 1.02, + "learning_rate": 4.962020202020202e-06, + "loss": 0.3957, + "step": 25450 + }, + { + "epoch": 1.02, + "learning_rate": 4.956969696969697e-06, + "loss": 0.3893, + "step": 25475 + }, + { + "epoch": 1.02, + "learning_rate": 4.951919191919192e-06, + "loss": 0.3874, + "step": 25500 + }, + { + "epoch": 1.02, + "learning_rate": 4.9468686868686875e-06, + "loss": 0.3782, + "step": 25525 + }, + { + "epoch": 1.02, + "learning_rate": 4.941818181818182e-06, + "loss": 0.3871, + "step": 25550 + }, + { + "epoch": 1.03, + "learning_rate": 4.936767676767677e-06, + "loss": 0.3951, + "step": 25575 + }, + { + "epoch": 1.03, + "learning_rate": 4.931717171717172e-06, + "loss": 0.3814, + "step": 25600 + }, + { + "epoch": 1.03, + "learning_rate": 4.926666666666667e-06, + "loss": 0.3715, + "step": 25625 + }, + { + "epoch": 1.03, + "learning_rate": 4.921616161616162e-06, + "loss": 0.3838, + "step": 25650 + }, + { + "epoch": 1.03, + "learning_rate": 4.9165656565656575e-06, + "loss": 0.3876, + "step": 25675 + }, + { + "epoch": 1.03, + "learning_rate": 4.911515151515152e-06, + "loss": 0.393, + "step": 25700 + }, + { + "epoch": 1.03, + "learning_rate": 4.906464646464647e-06, + "loss": 0.3932, + "step": 25725 + }, + { + "epoch": 1.03, + "learning_rate": 4.901414141414142e-06, + "loss": 0.3824, + "step": 25750 + }, + { + "epoch": 1.03, + "learning_rate": 4.896363636363637e-06, + "loss": 0.3721, + "step": 25775 + }, + { + "epoch": 1.03, + "learning_rate": 4.8913131313131315e-06, + "loss": 0.373, + "step": 25800 + }, + { + "epoch": 1.04, + "learning_rate": 4.886262626262627e-06, + "loss": 0.3911, + "step": 25825 + }, + { + "epoch": 1.04, + "learning_rate": 4.881212121212122e-06, + "loss": 0.375, + "step": 25850 + }, + { + "epoch": 1.04, + "learning_rate": 4.876161616161617e-06, + "loss": 0.3832, + "step": 25875 + }, + { + "epoch": 1.04, + "learning_rate": 4.871111111111111e-06, + "loss": 0.3944, + "step": 25900 + }, + { + "epoch": 1.04, + "learning_rate": 4.866060606060606e-06, + "loss": 0.3886, + "step": 25925 + }, + { + "epoch": 1.04, + "learning_rate": 4.8610101010101015e-06, + "loss": 0.3893, + "step": 25950 + }, + { + "epoch": 1.04, + "learning_rate": 4.855959595959596e-06, + "loss": 0.381, + "step": 25975 + }, + { + "epoch": 1.04, + "learning_rate": 4.850909090909091e-06, + "loss": 0.3811, + "step": 26000 + }, + { + "epoch": 1.04, + "learning_rate": 4.845858585858586e-06, + "loss": 0.3792, + "step": 26025 + }, + { + "epoch": 1.04, + "learning_rate": 4.840808080808081e-06, + "loss": 0.3789, + "step": 26050 + }, + { + "epoch": 1.05, + "learning_rate": 4.835757575757576e-06, + "loss": 0.3986, + "step": 26075 + }, + { + "epoch": 1.05, + "learning_rate": 4.8307070707070715e-06, + "loss": 0.3866, + "step": 26100 + }, + { + "epoch": 1.05, + "learning_rate": 4.825656565656566e-06, + "loss": 0.3888, + "step": 26125 + }, + { + "epoch": 1.05, + "learning_rate": 4.820606060606061e-06, + "loss": 0.3927, + "step": 26150 + }, + { + "epoch": 1.05, + "learning_rate": 4.815555555555556e-06, + "loss": 0.3709, + "step": 26175 + }, + { + "epoch": 1.05, + "learning_rate": 4.810505050505051e-06, + "loss": 0.3929, + "step": 26200 + }, + { + "epoch": 1.05, + "learning_rate": 4.8054545454545456e-06, + "loss": 0.3845, + "step": 26225 + }, + { + "epoch": 1.05, + "learning_rate": 4.800404040404041e-06, + "loss": 0.3757, + "step": 26250 + }, + { + "epoch": 1.05, + "learning_rate": 4.795353535353536e-06, + "loss": 0.3837, + "step": 26275 + }, + { + "epoch": 1.05, + "learning_rate": 4.790303030303031e-06, + "loss": 0.3939, + "step": 26300 + }, + { + "epoch": 1.06, + "learning_rate": 4.785252525252525e-06, + "loss": 0.3898, + "step": 26325 + }, + { + "epoch": 1.06, + "learning_rate": 4.7802020202020204e-06, + "loss": 0.377, + "step": 26350 + }, + { + "epoch": 1.06, + "learning_rate": 4.775151515151516e-06, + "loss": 0.3675, + "step": 26375 + }, + { + "epoch": 1.06, + "learning_rate": 4.770101010101011e-06, + "loss": 0.3781, + "step": 26400 + }, + { + "epoch": 1.06, + "learning_rate": 4.765050505050505e-06, + "loss": 0.3861, + "step": 26425 + }, + { + "epoch": 1.06, + "learning_rate": 4.76e-06, + "loss": 0.3626, + "step": 26450 + }, + { + "epoch": 1.06, + "learning_rate": 4.754949494949495e-06, + "loss": 0.3803, + "step": 26475 + }, + { + "epoch": 1.06, + "learning_rate": 4.7498989898989905e-06, + "loss": 0.3873, + "step": 26500 + }, + { + "epoch": 1.06, + "learning_rate": 4.744848484848486e-06, + "loss": 0.3894, + "step": 26525 + }, + { + "epoch": 1.06, + "learning_rate": 4.739797979797981e-06, + "loss": 0.3702, + "step": 26550 + }, + { + "epoch": 1.07, + "learning_rate": 4.734747474747475e-06, + "loss": 0.3703, + "step": 26575 + }, + { + "epoch": 1.07, + "learning_rate": 4.72969696969697e-06, + "loss": 0.3921, + "step": 26600 + }, + { + "epoch": 1.07, + "learning_rate": 4.724646464646465e-06, + "loss": 0.3711, + "step": 26625 + }, + { + "epoch": 1.07, + "learning_rate": 4.7195959595959605e-06, + "loss": 0.3698, + "step": 26650 + }, + { + "epoch": 1.07, + "learning_rate": 4.714545454545455e-06, + "loss": 0.4003, + "step": 26675 + }, + { + "epoch": 1.07, + "learning_rate": 4.70949494949495e-06, + "loss": 0.3753, + "step": 26700 + }, + { + "epoch": 1.07, + "learning_rate": 4.704444444444445e-06, + "loss": 0.3758, + "step": 26725 + }, + { + "epoch": 1.07, + "learning_rate": 4.699393939393939e-06, + "loss": 0.3859, + "step": 26750 + }, + { + "epoch": 1.07, + "learning_rate": 4.6943434343434345e-06, + "loss": 0.3941, + "step": 26775 + }, + { + "epoch": 1.07, + "learning_rate": 4.68929292929293e-06, + "loss": 0.3668, + "step": 26800 + }, + { + "epoch": 1.08, + "learning_rate": 4.684444444444444e-06, + "loss": 0.372, + "step": 26825 + }, + { + "epoch": 1.08, + "learning_rate": 4.67959595959596e-06, + "loss": 0.3784, + "step": 26850 + }, + { + "epoch": 1.08, + "learning_rate": 4.674545454545455e-06, + "loss": 0.3788, + "step": 26875 + }, + { + "epoch": 1.08, + "learning_rate": 4.6694949494949494e-06, + "loss": 0.3934, + "step": 26900 + }, + { + "epoch": 1.08, + "learning_rate": 4.664444444444445e-06, + "loss": 0.3674, + "step": 26925 + }, + { + "epoch": 1.08, + "learning_rate": 4.65939393939394e-06, + "loss": 0.3955, + "step": 26950 + }, + { + "epoch": 1.08, + "learning_rate": 4.654343434343435e-06, + "loss": 0.3911, + "step": 26975 + }, + { + "epoch": 1.08, + "learning_rate": 4.649292929292929e-06, + "loss": 0.377, + "step": 27000 + }, + { + "epoch": 1.08, + "learning_rate": 4.644242424242424e-06, + "loss": 0.3726, + "step": 27025 + }, + { + "epoch": 1.08, + "learning_rate": 4.6391919191919195e-06, + "loss": 0.3804, + "step": 27050 + }, + { + "epoch": 1.09, + "learning_rate": 4.634141414141415e-06, + "loss": 0.3942, + "step": 27075 + }, + { + "epoch": 1.09, + "learning_rate": 4.62909090909091e-06, + "loss": 0.4027, + "step": 27100 + }, + { + "epoch": 1.09, + "learning_rate": 4.624040404040405e-06, + "loss": 0.3764, + "step": 27125 + }, + { + "epoch": 1.09, + "learning_rate": 4.618989898989899e-06, + "loss": 0.3919, + "step": 27150 + }, + { + "epoch": 1.09, + "learning_rate": 4.613939393939394e-06, + "loss": 0.3839, + "step": 27175 + }, + { + "epoch": 1.09, + "learning_rate": 4.6088888888888895e-06, + "loss": 0.3623, + "step": 27200 + }, + { + "epoch": 1.09, + "learning_rate": 4.603838383838385e-06, + "loss": 0.3779, + "step": 27225 + }, + { + "epoch": 1.09, + "learning_rate": 4.598787878787879e-06, + "loss": 0.3885, + "step": 27250 + }, + { + "epoch": 1.09, + "learning_rate": 4.593737373737374e-06, + "loss": 0.3758, + "step": 27275 + }, + { + "epoch": 1.09, + "learning_rate": 4.588686868686869e-06, + "loss": 0.3776, + "step": 27300 + }, + { + "epoch": 1.1, + "learning_rate": 4.583636363636364e-06, + "loss": 0.401, + "step": 27325 + }, + { + "epoch": 1.1, + "learning_rate": 4.578585858585859e-06, + "loss": 0.3718, + "step": 27350 + }, + { + "epoch": 1.1, + "learning_rate": 4.573535353535354e-06, + "loss": 0.3863, + "step": 27375 + }, + { + "epoch": 1.1, + "learning_rate": 4.568484848484849e-06, + "loss": 0.3867, + "step": 27400 + }, + { + "epoch": 1.1, + "learning_rate": 4.563434343434344e-06, + "loss": 0.367, + "step": 27425 + }, + { + "epoch": 1.1, + "learning_rate": 4.558383838383838e-06, + "loss": 0.3986, + "step": 27450 + }, + { + "epoch": 1.1, + "learning_rate": 4.5533333333333335e-06, + "loss": 0.3798, + "step": 27475 + }, + { + "epoch": 1.1, + "learning_rate": 4.548282828282829e-06, + "loss": 0.3842, + "step": 27500 + }, + { + "epoch": 1.1, + "eval_loss": 0.4022856056690216, + "eval_runtime": 322.6887, + "eval_samples_per_second": 15.51, + "eval_steps_per_second": 1.94, + "eval_wer": 33.63155271838439, + "step": 27500 + }, + { + "epoch": 1.1, + "learning_rate": 4.543232323232323e-06, + "loss": 0.361, + "step": 27525 + }, + { + "epoch": 1.1, + "learning_rate": 4.538181818181819e-06, + "loss": 0.3699, + "step": 27550 + }, + { + "epoch": 1.11, + "learning_rate": 4.533131313131314e-06, + "loss": 0.3763, + "step": 27575 + }, + { + "epoch": 1.11, + "learning_rate": 4.528080808080808e-06, + "loss": 0.371, + "step": 27600 + }, + { + "epoch": 1.11, + "learning_rate": 4.5230303030303035e-06, + "loss": 0.3696, + "step": 27625 + }, + { + "epoch": 1.11, + "learning_rate": 4.517979797979799e-06, + "loss": 0.3897, + "step": 27650 + }, + { + "epoch": 1.11, + "learning_rate": 4.512929292929294e-06, + "loss": 0.3757, + "step": 27675 + }, + { + "epoch": 1.11, + "learning_rate": 4.507878787878788e-06, + "loss": 0.3852, + "step": 27700 + }, + { + "epoch": 1.11, + "learning_rate": 4.502828282828283e-06, + "loss": 0.3945, + "step": 27725 + }, + { + "epoch": 1.11, + "learning_rate": 4.497777777777778e-06, + "loss": 0.3839, + "step": 27750 + }, + { + "epoch": 1.11, + "learning_rate": 4.492727272727273e-06, + "loss": 0.3827, + "step": 27775 + }, + { + "epoch": 1.11, + "learning_rate": 4.487676767676768e-06, + "loss": 0.3886, + "step": 27800 + }, + { + "epoch": 1.12, + "learning_rate": 4.482626262626263e-06, + "loss": 0.3664, + "step": 27825 + }, + { + "epoch": 1.12, + "learning_rate": 4.477575757575758e-06, + "loss": 0.3928, + "step": 27850 + }, + { + "epoch": 1.12, + "learning_rate": 4.472525252525252e-06, + "loss": 0.3776, + "step": 27875 + }, + { + "epoch": 1.12, + "learning_rate": 4.4674747474747475e-06, + "loss": 0.3925, + "step": 27900 + }, + { + "epoch": 1.12, + "learning_rate": 4.462424242424243e-06, + "loss": 0.3815, + "step": 27925 + }, + { + "epoch": 1.12, + "learning_rate": 4.457373737373738e-06, + "loss": 0.3881, + "step": 27950 + }, + { + "epoch": 1.12, + "learning_rate": 4.452323232323233e-06, + "loss": 0.3703, + "step": 27975 + }, + { + "epoch": 1.12, + "learning_rate": 4.447272727272728e-06, + "loss": 0.3955, + "step": 28000 + }, + { + "epoch": 1.12, + "learning_rate": 4.442222222222222e-06, + "loss": 0.3786, + "step": 28025 + }, + { + "epoch": 1.12, + "learning_rate": 4.4371717171717176e-06, + "loss": 0.4067, + "step": 28050 + }, + { + "epoch": 1.13, + "learning_rate": 4.432121212121213e-06, + "loss": 0.3632, + "step": 28075 + }, + { + "epoch": 1.13, + "learning_rate": 4.427070707070708e-06, + "loss": 0.381, + "step": 28100 + }, + { + "epoch": 1.13, + "learning_rate": 4.422020202020202e-06, + "loss": 0.3744, + "step": 28125 + }, + { + "epoch": 1.13, + "learning_rate": 4.416969696969697e-06, + "loss": 0.3843, + "step": 28150 + }, + { + "epoch": 1.13, + "learning_rate": 4.4119191919191924e-06, + "loss": 0.3729, + "step": 28175 + }, + { + "epoch": 1.13, + "learning_rate": 4.4068686868686876e-06, + "loss": 0.3548, + "step": 28200 + }, + { + "epoch": 1.13, + "learning_rate": 4.401818181818182e-06, + "loss": 0.3733, + "step": 28225 + }, + { + "epoch": 1.13, + "learning_rate": 4.396767676767677e-06, + "loss": 0.3919, + "step": 28250 + }, + { + "epoch": 1.13, + "learning_rate": 4.391717171717172e-06, + "loss": 0.3762, + "step": 28275 + }, + { + "epoch": 1.13, + "learning_rate": 4.3866666666666665e-06, + "loss": 0.3767, + "step": 28300 + }, + { + "epoch": 1.14, + "learning_rate": 4.381616161616162e-06, + "loss": 0.3704, + "step": 28325 + }, + { + "epoch": 1.14, + "learning_rate": 4.376565656565657e-06, + "loss": 0.3963, + "step": 28350 + }, + { + "epoch": 1.14, + "learning_rate": 4.371515151515152e-06, + "loss": 0.3824, + "step": 28375 + }, + { + "epoch": 1.14, + "learning_rate": 4.366464646464647e-06, + "loss": 0.3832, + "step": 28400 + }, + { + "epoch": 1.14, + "learning_rate": 4.361414141414142e-06, + "loss": 0.366, + "step": 28425 + }, + { + "epoch": 1.14, + "learning_rate": 4.356363636363637e-06, + "loss": 0.377, + "step": 28450 + }, + { + "epoch": 1.14, + "learning_rate": 4.351313131313132e-06, + "loss": 0.3651, + "step": 28475 + }, + { + "epoch": 1.14, + "learning_rate": 4.346262626262627e-06, + "loss": 0.3938, + "step": 28500 + }, + { + "epoch": 1.14, + "learning_rate": 4.341212121212122e-06, + "loss": 0.3796, + "step": 28525 + }, + { + "epoch": 1.14, + "learning_rate": 4.336161616161616e-06, + "loss": 0.3877, + "step": 28550 + }, + { + "epoch": 1.15, + "learning_rate": 4.331111111111111e-06, + "loss": 0.3801, + "step": 28575 + }, + { + "epoch": 1.15, + "learning_rate": 4.3260606060606065e-06, + "loss": 0.3907, + "step": 28600 + }, + { + "epoch": 1.15, + "learning_rate": 4.321010101010102e-06, + "loss": 0.3832, + "step": 28625 + }, + { + "epoch": 1.15, + "learning_rate": 4.315959595959596e-06, + "loss": 0.3799, + "step": 28650 + }, + { + "epoch": 1.15, + "learning_rate": 4.310909090909091e-06, + "loss": 0.3825, + "step": 28675 + }, + { + "epoch": 1.15, + "learning_rate": 4.305858585858586e-06, + "loss": 0.3681, + "step": 28700 + }, + { + "epoch": 1.15, + "learning_rate": 4.300808080808081e-06, + "loss": 0.3675, + "step": 28725 + }, + { + "epoch": 1.15, + "learning_rate": 4.295757575757576e-06, + "loss": 0.3728, + "step": 28750 + }, + { + "epoch": 1.15, + "learning_rate": 4.290707070707071e-06, + "loss": 0.3684, + "step": 28775 + }, + { + "epoch": 1.15, + "learning_rate": 4.285656565656566e-06, + "loss": 0.3687, + "step": 28800 + }, + { + "epoch": 1.16, + "learning_rate": 4.280606060606061e-06, + "loss": 0.365, + "step": 28825 + }, + { + "epoch": 1.16, + "learning_rate": 4.275555555555556e-06, + "loss": 0.3874, + "step": 28850 + }, + { + "epoch": 1.16, + "learning_rate": 4.270505050505051e-06, + "loss": 0.3783, + "step": 28875 + }, + { + "epoch": 1.16, + "learning_rate": 4.265454545454546e-06, + "loss": 0.3832, + "step": 28900 + }, + { + "epoch": 1.16, + "learning_rate": 4.260404040404041e-06, + "loss": 0.3815, + "step": 28925 + }, + { + "epoch": 1.16, + "learning_rate": 4.255353535353536e-06, + "loss": 0.3875, + "step": 28950 + }, + { + "epoch": 1.16, + "learning_rate": 4.250303030303031e-06, + "loss": 0.3624, + "step": 28975 + }, + { + "epoch": 1.16, + "learning_rate": 4.245252525252525e-06, + "loss": 0.3646, + "step": 29000 + }, + { + "epoch": 1.16, + "learning_rate": 4.2402020202020205e-06, + "loss": 0.3803, + "step": 29025 + }, + { + "epoch": 1.16, + "learning_rate": 4.235151515151516e-06, + "loss": 0.3728, + "step": 29050 + }, + { + "epoch": 1.17, + "learning_rate": 4.23010101010101e-06, + "loss": 0.3881, + "step": 29075 + }, + { + "epoch": 1.17, + "learning_rate": 4.225050505050505e-06, + "loss": 0.375, + "step": 29100 + }, + { + "epoch": 1.17, + "learning_rate": 4.22e-06, + "loss": 0.3652, + "step": 29125 + }, + { + "epoch": 1.17, + "learning_rate": 4.214949494949495e-06, + "loss": 0.384, + "step": 29150 + }, + { + "epoch": 1.17, + "learning_rate": 4.20989898989899e-06, + "loss": 0.3605, + "step": 29175 + }, + { + "epoch": 1.17, + "learning_rate": 4.204848484848485e-06, + "loss": 0.3659, + "step": 29200 + }, + { + "epoch": 1.17, + "learning_rate": 4.19979797979798e-06, + "loss": 0.3696, + "step": 29225 + }, + { + "epoch": 1.17, + "learning_rate": 4.194747474747475e-06, + "loss": 0.3855, + "step": 29250 + }, + { + "epoch": 1.17, + "learning_rate": 4.18969696969697e-06, + "loss": 0.3844, + "step": 29275 + }, + { + "epoch": 1.17, + "learning_rate": 4.184646464646465e-06, + "loss": 0.363, + "step": 29300 + }, + { + "epoch": 1.18, + "learning_rate": 4.17959595959596e-06, + "loss": 0.376, + "step": 29325 + }, + { + "epoch": 1.18, + "learning_rate": 4.174545454545455e-06, + "loss": 0.3875, + "step": 29350 + }, + { + "epoch": 1.18, + "learning_rate": 4.16949494949495e-06, + "loss": 0.3933, + "step": 29375 + }, + { + "epoch": 1.18, + "learning_rate": 4.164444444444445e-06, + "loss": 0.3746, + "step": 29400 + }, + { + "epoch": 1.18, + "learning_rate": 4.1593939393939394e-06, + "loss": 0.3743, + "step": 29425 + }, + { + "epoch": 1.18, + "learning_rate": 4.1543434343434346e-06, + "loss": 0.3803, + "step": 29450 + }, + { + "epoch": 1.18, + "learning_rate": 4.14929292929293e-06, + "loss": 0.3782, + "step": 29475 + }, + { + "epoch": 1.18, + "learning_rate": 4.144242424242425e-06, + "loss": 0.3827, + "step": 29500 + }, + { + "epoch": 1.18, + "learning_rate": 4.139191919191919e-06, + "loss": 0.3827, + "step": 29525 + }, + { + "epoch": 1.18, + "learning_rate": 4.134141414141414e-06, + "loss": 0.3686, + "step": 29550 + }, + { + "epoch": 1.19, + "learning_rate": 4.1290909090909094e-06, + "loss": 0.3547, + "step": 29575 + }, + { + "epoch": 1.19, + "learning_rate": 4.124040404040405e-06, + "loss": 0.3831, + "step": 29600 + }, + { + "epoch": 1.19, + "learning_rate": 4.118989898989899e-06, + "loss": 0.374, + "step": 29625 + }, + { + "epoch": 1.19, + "learning_rate": 4.113939393939394e-06, + "loss": 0.3723, + "step": 29650 + }, + { + "epoch": 1.19, + "learning_rate": 4.108888888888889e-06, + "loss": 0.3813, + "step": 29675 + }, + { + "epoch": 1.19, + "learning_rate": 4.103838383838384e-06, + "loss": 0.382, + "step": 29700 + }, + { + "epoch": 1.19, + "learning_rate": 4.0987878787878795e-06, + "loss": 0.3801, + "step": 29725 + }, + { + "epoch": 1.19, + "learning_rate": 4.093737373737375e-06, + "loss": 0.3686, + "step": 29750 + }, + { + "epoch": 1.19, + "learning_rate": 4.088686868686869e-06, + "loss": 0.3743, + "step": 29775 + }, + { + "epoch": 1.19, + "learning_rate": 4.083636363636364e-06, + "loss": 0.3665, + "step": 29800 + }, + { + "epoch": 1.2, + "learning_rate": 4.078585858585859e-06, + "loss": 0.3657, + "step": 29825 + }, + { + "epoch": 1.2, + "learning_rate": 4.0735353535353535e-06, + "loss": 0.3683, + "step": 29850 + }, + { + "epoch": 1.2, + "learning_rate": 4.068484848484849e-06, + "loss": 0.3697, + "step": 29875 + }, + { + "epoch": 1.2, + "learning_rate": 4.063434343434344e-06, + "loss": 0.387, + "step": 29900 + }, + { + "epoch": 1.2, + "learning_rate": 4.058383838383839e-06, + "loss": 0.3793, + "step": 29925 + }, + { + "epoch": 1.2, + "learning_rate": 4.053333333333333e-06, + "loss": 0.3765, + "step": 29950 + }, + { + "epoch": 1.2, + "learning_rate": 4.048282828282828e-06, + "loss": 0.3854, + "step": 29975 + }, + { + "epoch": 1.2, + "learning_rate": 4.0432323232323235e-06, + "loss": 0.3848, + "step": 30000 + }, + { + "epoch": 1.2, + "eval_loss": 0.3984352946281433, + "eval_runtime": 321.4637, + "eval_samples_per_second": 15.569, + "eval_steps_per_second": 1.947, + "eval_wer": 30.10987446308645, + "step": 30000 + }, + { + "epoch": 1.2, + "learning_rate": 4.038181818181819e-06, + "loss": 0.3611, + "step": 30025 + }, + { + "epoch": 1.2, + "learning_rate": 4.033131313131313e-06, + "loss": 0.3679, + "step": 30050 + }, + { + "epoch": 1.21, + "learning_rate": 4.028080808080808e-06, + "loss": 0.3871, + "step": 30075 + }, + { + "epoch": 1.21, + "learning_rate": 4.023030303030303e-06, + "loss": 0.37, + "step": 30100 + }, + { + "epoch": 1.21, + "learning_rate": 4.017979797979798e-06, + "loss": 0.3907, + "step": 30125 + }, + { + "epoch": 1.21, + "learning_rate": 4.0129292929292935e-06, + "loss": 0.3855, + "step": 30150 + }, + { + "epoch": 1.21, + "learning_rate": 4.007878787878789e-06, + "loss": 0.3823, + "step": 30175 + }, + { + "epoch": 1.21, + "learning_rate": 4.002828282828283e-06, + "loss": 0.3737, + "step": 30200 + }, + { + "epoch": 1.21, + "learning_rate": 3.997777777777778e-06, + "loss": 0.3771, + "step": 30225 + }, + { + "epoch": 1.21, + "learning_rate": 3.992727272727273e-06, + "loss": 0.3616, + "step": 30250 + }, + { + "epoch": 1.21, + "learning_rate": 3.987676767676768e-06, + "loss": 0.3891, + "step": 30275 + }, + { + "epoch": 1.22, + "learning_rate": 3.982626262626263e-06, + "loss": 0.3803, + "step": 30300 + }, + { + "epoch": 1.22, + "learning_rate": 3.977575757575758e-06, + "loss": 0.3833, + "step": 30325 + }, + { + "epoch": 1.22, + "learning_rate": 3.972525252525253e-06, + "loss": 0.3839, + "step": 30350 + }, + { + "epoch": 1.22, + "learning_rate": 3.967474747474748e-06, + "loss": 0.3631, + "step": 30375 + }, + { + "epoch": 1.22, + "learning_rate": 3.962424242424242e-06, + "loss": 0.3719, + "step": 30400 + }, + { + "epoch": 1.22, + "learning_rate": 3.9573737373737375e-06, + "loss": 0.369, + "step": 30425 + }, + { + "epoch": 1.22, + "learning_rate": 3.952323232323233e-06, + "loss": 0.3953, + "step": 30450 + }, + { + "epoch": 1.22, + "learning_rate": 3.947272727272727e-06, + "loss": 0.3675, + "step": 30475 + }, + { + "epoch": 1.22, + "learning_rate": 3.942222222222222e-06, + "loss": 0.3801, + "step": 30500 + }, + { + "epoch": 1.22, + "learning_rate": 3.937171717171718e-06, + "loss": 0.3821, + "step": 30525 + }, + { + "epoch": 1.23, + "learning_rate": 3.932121212121212e-06, + "loss": 0.377, + "step": 30550 + }, + { + "epoch": 1.23, + "learning_rate": 3.9270707070707076e-06, + "loss": 0.3815, + "step": 30575 + }, + { + "epoch": 1.23, + "learning_rate": 3.922020202020203e-06, + "loss": 0.3986, + "step": 30600 + }, + { + "epoch": 1.23, + "learning_rate": 3.916969696969698e-06, + "loss": 0.3857, + "step": 30625 + }, + { + "epoch": 1.23, + "learning_rate": 3.911919191919192e-06, + "loss": 0.3729, + "step": 30650 + }, + { + "epoch": 1.23, + "learning_rate": 3.906868686868687e-06, + "loss": 0.365, + "step": 30675 + }, + { + "epoch": 1.23, + "learning_rate": 3.901818181818182e-06, + "loss": 0.3761, + "step": 30700 + }, + { + "epoch": 1.23, + "learning_rate": 3.896767676767677e-06, + "loss": 0.3843, + "step": 30725 + }, + { + "epoch": 1.23, + "learning_rate": 3.891717171717172e-06, + "loss": 0.3866, + "step": 30750 + }, + { + "epoch": 1.23, + "learning_rate": 3.886666666666667e-06, + "loss": 0.3839, + "step": 30775 + }, + { + "epoch": 1.24, + "learning_rate": 3.881616161616162e-06, + "loss": 0.3657, + "step": 30800 + }, + { + "epoch": 1.24, + "learning_rate": 3.8765656565656564e-06, + "loss": 0.3783, + "step": 30825 + }, + { + "epoch": 1.24, + "learning_rate": 3.871515151515152e-06, + "loss": 0.3709, + "step": 30850 + }, + { + "epoch": 1.24, + "learning_rate": 3.866666666666667e-06, + "loss": 0.3716, + "step": 30875 + }, + { + "epoch": 1.24, + "learning_rate": 3.8616161616161615e-06, + "loss": 0.3539, + "step": 30900 + }, + { + "epoch": 1.24, + "learning_rate": 3.856565656565657e-06, + "loss": 0.3722, + "step": 30925 + }, + { + "epoch": 1.24, + "learning_rate": 3.851515151515152e-06, + "loss": 0.3756, + "step": 30950 + }, + { + "epoch": 1.24, + "learning_rate": 3.846464646464647e-06, + "loss": 0.3721, + "step": 30975 + }, + { + "epoch": 1.24, + "learning_rate": 3.841414141414141e-06, + "loss": 0.3652, + "step": 31000 + }, + { + "epoch": 1.24, + "learning_rate": 3.836363636363636e-06, + "loss": 0.3591, + "step": 31025 + }, + { + "epoch": 1.25, + "learning_rate": 3.8313131313131315e-06, + "loss": 0.3523, + "step": 31050 + }, + { + "epoch": 1.25, + "learning_rate": 3.826262626262627e-06, + "loss": 0.3621, + "step": 31075 + }, + { + "epoch": 1.25, + "learning_rate": 3.821212121212122e-06, + "loss": 0.3723, + "step": 31100 + }, + { + "epoch": 1.25, + "learning_rate": 3.816161616161617e-06, + "loss": 0.408, + "step": 31125 + }, + { + "epoch": 1.25, + "learning_rate": 3.8111111111111117e-06, + "loss": 0.3633, + "step": 31150 + }, + { + "epoch": 1.25, + "learning_rate": 3.8060606060606064e-06, + "loss": 0.3777, + "step": 31175 + }, + { + "epoch": 1.25, + "learning_rate": 3.8010101010101015e-06, + "loss": 0.3545, + "step": 31200 + }, + { + "epoch": 1.25, + "learning_rate": 3.7959595959595962e-06, + "loss": 0.3702, + "step": 31225 + }, + { + "epoch": 1.25, + "learning_rate": 3.7909090909090914e-06, + "loss": 0.3834, + "step": 31250 + }, + { + "epoch": 1.25, + "learning_rate": 3.785858585858586e-06, + "loss": 0.3783, + "step": 31275 + }, + { + "epoch": 1.26, + "learning_rate": 3.7808080808080812e-06, + "loss": 0.3867, + "step": 31300 + }, + { + "epoch": 1.26, + "learning_rate": 3.775757575757576e-06, + "loss": 0.3957, + "step": 31325 + }, + { + "epoch": 1.26, + "learning_rate": 3.7707070707070707e-06, + "loss": 0.3978, + "step": 31350 + }, + { + "epoch": 1.26, + "learning_rate": 3.765656565656566e-06, + "loss": 0.3811, + "step": 31375 + }, + { + "epoch": 1.26, + "learning_rate": 3.7606060606060605e-06, + "loss": 0.3783, + "step": 31400 + }, + { + "epoch": 1.26, + "learning_rate": 3.7555555555555557e-06, + "loss": 0.376, + "step": 31425 + }, + { + "epoch": 1.26, + "learning_rate": 3.7505050505050504e-06, + "loss": 0.4037, + "step": 31450 + }, + { + "epoch": 1.26, + "learning_rate": 3.745454545454546e-06, + "loss": 0.3646, + "step": 31475 + }, + { + "epoch": 1.26, + "learning_rate": 3.740404040404041e-06, + "loss": 0.3956, + "step": 31500 + }, + { + "epoch": 1.26, + "learning_rate": 3.735353535353536e-06, + "loss": 0.3631, + "step": 31525 + }, + { + "epoch": 1.27, + "learning_rate": 3.7303030303030306e-06, + "loss": 0.3911, + "step": 31550 + }, + { + "epoch": 1.27, + "learning_rate": 3.7252525252525257e-06, + "loss": 0.3575, + "step": 31575 + }, + { + "epoch": 1.27, + "learning_rate": 3.7202020202020204e-06, + "loss": 0.3684, + "step": 31600 + }, + { + "epoch": 1.27, + "learning_rate": 3.7151515151515156e-06, + "loss": 0.3883, + "step": 31625 + }, + { + "epoch": 1.27, + "learning_rate": 3.7103030303030308e-06, + "loss": 0.3612, + "step": 31650 + }, + { + "epoch": 1.27, + "learning_rate": 3.7052525252525255e-06, + "loss": 0.3719, + "step": 31675 + }, + { + "epoch": 1.27, + "learning_rate": 3.7002020202020206e-06, + "loss": 0.3751, + "step": 31700 + }, + { + "epoch": 1.27, + "learning_rate": 3.6951515151515153e-06, + "loss": 0.3733, + "step": 31725 + }, + { + "epoch": 1.27, + "learning_rate": 3.6901010101010105e-06, + "loss": 0.3703, + "step": 31750 + }, + { + "epoch": 1.27, + "learning_rate": 3.685050505050505e-06, + "loss": 0.3749, + "step": 31775 + }, + { + "epoch": 1.28, + "learning_rate": 3.6800000000000003e-06, + "loss": 0.3645, + "step": 31800 + }, + { + "epoch": 1.28, + "learning_rate": 3.674949494949495e-06, + "loss": 0.3783, + "step": 31825 + }, + { + "epoch": 1.28, + "learning_rate": 3.66989898989899e-06, + "loss": 0.3761, + "step": 31850 + }, + { + "epoch": 1.28, + "learning_rate": 3.664848484848485e-06, + "loss": 0.3799, + "step": 31875 + }, + { + "epoch": 1.28, + "learning_rate": 3.65979797979798e-06, + "loss": 0.3971, + "step": 31900 + }, + { + "epoch": 1.28, + "learning_rate": 3.6547474747474748e-06, + "loss": 0.3596, + "step": 31925 + }, + { + "epoch": 1.28, + "learning_rate": 3.64969696969697e-06, + "loss": 0.3811, + "step": 31950 + }, + { + "epoch": 1.28, + "learning_rate": 3.644646464646465e-06, + "loss": 0.3619, + "step": 31975 + }, + { + "epoch": 1.28, + "learning_rate": 3.6395959595959602e-06, + "loss": 0.3776, + "step": 32000 + }, + { + "epoch": 1.28, + "learning_rate": 3.634545454545455e-06, + "loss": 0.3886, + "step": 32025 + }, + { + "epoch": 1.29, + "learning_rate": 3.62949494949495e-06, + "loss": 0.3691, + "step": 32050 + }, + { + "epoch": 1.29, + "learning_rate": 3.624444444444445e-06, + "loss": 0.3774, + "step": 32075 + }, + { + "epoch": 1.29, + "learning_rate": 3.61939393939394e-06, + "loss": 0.3706, + "step": 32100 + }, + { + "epoch": 1.29, + "learning_rate": 3.6143434343434347e-06, + "loss": 0.3684, + "step": 32125 + }, + { + "epoch": 1.29, + "learning_rate": 3.60929292929293e-06, + "loss": 0.3787, + "step": 32150 + }, + { + "epoch": 1.29, + "learning_rate": 3.6042424242424245e-06, + "loss": 0.3814, + "step": 32175 + }, + { + "epoch": 1.29, + "learning_rate": 3.5991919191919197e-06, + "loss": 0.3632, + "step": 32200 + }, + { + "epoch": 1.29, + "learning_rate": 3.5941414141414144e-06, + "loss": 0.3616, + "step": 32225 + }, + { + "epoch": 1.29, + "learning_rate": 3.589090909090909e-06, + "loss": 0.3776, + "step": 32250 + }, + { + "epoch": 1.29, + "learning_rate": 3.5840404040404043e-06, + "loss": 0.3877, + "step": 32275 + }, + { + "epoch": 1.3, + "learning_rate": 3.578989898989899e-06, + "loss": 0.3801, + "step": 32300 + }, + { + "epoch": 1.3, + "learning_rate": 3.573939393939394e-06, + "loss": 0.38, + "step": 32325 + }, + { + "epoch": 1.3, + "learning_rate": 3.568888888888889e-06, + "loss": 0.3855, + "step": 32350 + }, + { + "epoch": 1.3, + "learning_rate": 3.563838383838384e-06, + "loss": 0.3809, + "step": 32375 + }, + { + "epoch": 1.3, + "learning_rate": 3.5587878787878795e-06, + "loss": 0.3729, + "step": 32400 + }, + { + "epoch": 1.3, + "learning_rate": 3.5537373737373743e-06, + "loss": 0.3869, + "step": 32425 + }, + { + "epoch": 1.3, + "learning_rate": 3.548686868686869e-06, + "loss": 0.373, + "step": 32450 + }, + { + "epoch": 1.3, + "learning_rate": 3.543636363636364e-06, + "loss": 0.3739, + "step": 32475 + }, + { + "epoch": 1.3, + "learning_rate": 3.538585858585859e-06, + "loss": 0.3774, + "step": 32500 + }, + { + "epoch": 1.3, + "eval_loss": 0.39484164118766785, + "eval_runtime": 316.8768, + "eval_samples_per_second": 15.795, + "eval_steps_per_second": 1.976, + "eval_wer": 29.286409264576758, + "step": 32500 + }, + { + "epoch": 1.3, + "learning_rate": 3.533535353535354e-06, + "loss": 0.3763, + "step": 32525 + }, + { + "epoch": 1.31, + "learning_rate": 3.5284848484848487e-06, + "loss": 0.3612, + "step": 32550 + }, + { + "epoch": 1.31, + "learning_rate": 3.523434343434344e-06, + "loss": 0.3716, + "step": 32575 + }, + { + "epoch": 1.31, + "learning_rate": 3.5183838383838386e-06, + "loss": 0.3837, + "step": 32600 + }, + { + "epoch": 1.31, + "learning_rate": 3.5133333333333337e-06, + "loss": 0.3732, + "step": 32625 + }, + { + "epoch": 1.31, + "learning_rate": 3.5082828282828284e-06, + "loss": 0.3579, + "step": 32650 + }, + { + "epoch": 1.31, + "learning_rate": 3.5032323232323236e-06, + "loss": 0.3632, + "step": 32675 + }, + { + "epoch": 1.31, + "learning_rate": 3.4981818181818183e-06, + "loss": 0.3622, + "step": 32700 + }, + { + "epoch": 1.31, + "learning_rate": 3.4931313131313134e-06, + "loss": 0.372, + "step": 32725 + }, + { + "epoch": 1.31, + "learning_rate": 3.488080808080808e-06, + "loss": 0.3654, + "step": 32750 + }, + { + "epoch": 1.31, + "learning_rate": 3.483030303030303e-06, + "loss": 0.3585, + "step": 32775 + }, + { + "epoch": 1.32, + "learning_rate": 3.477979797979798e-06, + "loss": 0.3741, + "step": 32800 + }, + { + "epoch": 1.32, + "learning_rate": 3.4729292929292936e-06, + "loss": 0.3837, + "step": 32825 + }, + { + "epoch": 1.32, + "learning_rate": 3.4678787878787883e-06, + "loss": 0.3789, + "step": 32850 + }, + { + "epoch": 1.32, + "learning_rate": 3.4628282828282835e-06, + "loss": 0.3655, + "step": 32875 + }, + { + "epoch": 1.32, + "learning_rate": 3.457777777777778e-06, + "loss": 0.3971, + "step": 32900 + }, + { + "epoch": 1.32, + "learning_rate": 3.4527272727272733e-06, + "loss": 0.3546, + "step": 32925 + }, + { + "epoch": 1.32, + "learning_rate": 3.447676767676768e-06, + "loss": 0.3669, + "step": 32950 + }, + { + "epoch": 1.32, + "learning_rate": 3.442626262626263e-06, + "loss": 0.3724, + "step": 32975 + }, + { + "epoch": 1.32, + "learning_rate": 3.437575757575758e-06, + "loss": 0.3663, + "step": 33000 + }, + { + "epoch": 1.32, + "learning_rate": 3.4325252525252526e-06, + "loss": 0.3658, + "step": 33025 + }, + { + "epoch": 1.33, + "learning_rate": 3.4274747474747478e-06, + "loss": 0.3767, + "step": 33050 + }, + { + "epoch": 1.33, + "learning_rate": 3.4224242424242425e-06, + "loss": 0.3873, + "step": 33075 + }, + { + "epoch": 1.33, + "learning_rate": 3.4173737373737376e-06, + "loss": 0.3811, + "step": 33100 + }, + { + "epoch": 1.33, + "learning_rate": 3.4123232323232323e-06, + "loss": 0.3642, + "step": 33125 + }, + { + "epoch": 1.33, + "learning_rate": 3.4072727272727275e-06, + "loss": 0.3857, + "step": 33150 + }, + { + "epoch": 1.33, + "learning_rate": 3.4022222222222222e-06, + "loss": 0.3699, + "step": 33175 + }, + { + "epoch": 1.33, + "learning_rate": 3.3971717171717174e-06, + "loss": 0.3551, + "step": 33200 + }, + { + "epoch": 1.33, + "learning_rate": 3.392121212121212e-06, + "loss": 0.3643, + "step": 33225 + }, + { + "epoch": 1.33, + "learning_rate": 3.3870707070707076e-06, + "loss": 0.3619, + "step": 33250 + }, + { + "epoch": 1.33, + "learning_rate": 3.3820202020202024e-06, + "loss": 0.3629, + "step": 33275 + }, + { + "epoch": 1.34, + "learning_rate": 3.3769696969696975e-06, + "loss": 0.3771, + "step": 33300 + }, + { + "epoch": 1.34, + "learning_rate": 3.3719191919191922e-06, + "loss": 0.3686, + "step": 33325 + }, + { + "epoch": 1.34, + "learning_rate": 3.3668686868686874e-06, + "loss": 0.384, + "step": 33350 + }, + { + "epoch": 1.34, + "learning_rate": 3.361818181818182e-06, + "loss": 0.3782, + "step": 33375 + }, + { + "epoch": 1.34, + "learning_rate": 3.3567676767676772e-06, + "loss": 0.3908, + "step": 33400 + }, + { + "epoch": 1.34, + "learning_rate": 3.351717171717172e-06, + "loss": 0.3656, + "step": 33425 + }, + { + "epoch": 1.34, + "learning_rate": 3.346666666666667e-06, + "loss": 0.3744, + "step": 33450 + }, + { + "epoch": 1.34, + "learning_rate": 3.341616161616162e-06, + "loss": 0.3734, + "step": 33475 + }, + { + "epoch": 1.34, + "learning_rate": 3.336565656565657e-06, + "loss": 0.3818, + "step": 33500 + }, + { + "epoch": 1.34, + "learning_rate": 3.3315151515151517e-06, + "loss": 0.357, + "step": 33525 + }, + { + "epoch": 1.35, + "learning_rate": 3.326464646464647e-06, + "loss": 0.3672, + "step": 33550 + }, + { + "epoch": 1.35, + "learning_rate": 3.3214141414141415e-06, + "loss": 0.3844, + "step": 33575 + }, + { + "epoch": 1.35, + "learning_rate": 3.3163636363636363e-06, + "loss": 0.3595, + "step": 33600 + }, + { + "epoch": 1.35, + "learning_rate": 3.3113131313131314e-06, + "loss": 0.3811, + "step": 33625 + }, + { + "epoch": 1.35, + "learning_rate": 3.306262626262626e-06, + "loss": 0.3512, + "step": 33650 + }, + { + "epoch": 1.35, + "learning_rate": 3.3012121212121217e-06, + "loss": 0.379, + "step": 33675 + }, + { + "epoch": 1.35, + "learning_rate": 3.296161616161617e-06, + "loss": 0.3905, + "step": 33700 + }, + { + "epoch": 1.35, + "learning_rate": 3.2911111111111116e-06, + "loss": 0.3655, + "step": 33725 + }, + { + "epoch": 1.35, + "learning_rate": 3.2860606060606067e-06, + "loss": 0.3791, + "step": 33750 + }, + { + "epoch": 1.35, + "learning_rate": 3.2810101010101014e-06, + "loss": 0.3635, + "step": 33775 + }, + { + "epoch": 1.36, + "learning_rate": 3.275959595959596e-06, + "loss": 0.3685, + "step": 33800 + }, + { + "epoch": 1.36, + "learning_rate": 3.2709090909090913e-06, + "loss": 0.3658, + "step": 33825 + }, + { + "epoch": 1.36, + "learning_rate": 3.265858585858586e-06, + "loss": 0.3813, + "step": 33850 + }, + { + "epoch": 1.36, + "learning_rate": 3.260808080808081e-06, + "loss": 0.3697, + "step": 33875 + }, + { + "epoch": 1.36, + "learning_rate": 3.255757575757576e-06, + "loss": 0.3699, + "step": 33900 + }, + { + "epoch": 1.36, + "learning_rate": 3.250707070707071e-06, + "loss": 0.3908, + "step": 33925 + }, + { + "epoch": 1.36, + "learning_rate": 3.2456565656565657e-06, + "loss": 0.3789, + "step": 33950 + }, + { + "epoch": 1.36, + "learning_rate": 3.240606060606061e-06, + "loss": 0.3673, + "step": 33975 + }, + { + "epoch": 1.36, + "learning_rate": 3.2355555555555556e-06, + "loss": 0.3746, + "step": 34000 + }, + { + "epoch": 1.36, + "learning_rate": 3.2305050505050507e-06, + "loss": 0.3683, + "step": 34025 + }, + { + "epoch": 1.37, + "learning_rate": 3.2254545454545455e-06, + "loss": 0.3722, + "step": 34050 + }, + { + "epoch": 1.37, + "learning_rate": 3.2204040404040406e-06, + "loss": 0.3844, + "step": 34075 + }, + { + "epoch": 1.37, + "learning_rate": 3.2153535353535357e-06, + "loss": 0.3661, + "step": 34100 + }, + { + "epoch": 1.37, + "learning_rate": 3.210303030303031e-06, + "loss": 0.3803, + "step": 34125 + }, + { + "epoch": 1.37, + "learning_rate": 3.2052525252525256e-06, + "loss": 0.3847, + "step": 34150 + }, + { + "epoch": 1.37, + "learning_rate": 3.2002020202020207e-06, + "loss": 0.3853, + "step": 34175 + }, + { + "epoch": 1.37, + "learning_rate": 3.1951515151515155e-06, + "loss": 0.3683, + "step": 34200 + }, + { + "epoch": 1.37, + "learning_rate": 3.1901010101010106e-06, + "loss": 0.379, + "step": 34225 + }, + { + "epoch": 1.37, + "learning_rate": 3.1850505050505053e-06, + "loss": 0.3779, + "step": 34250 + }, + { + "epoch": 1.37, + "learning_rate": 3.1800000000000005e-06, + "loss": 0.3689, + "step": 34275 + }, + { + "epoch": 1.38, + "learning_rate": 3.174949494949495e-06, + "loss": 0.3779, + "step": 34300 + }, + { + "epoch": 1.38, + "learning_rate": 3.1698989898989903e-06, + "loss": 0.3603, + "step": 34325 + }, + { + "epoch": 1.38, + "learning_rate": 3.164848484848485e-06, + "loss": 0.3832, + "step": 34350 + }, + { + "epoch": 1.38, + "learning_rate": 3.1597979797979798e-06, + "loss": 0.3902, + "step": 34375 + }, + { + "epoch": 1.38, + "learning_rate": 3.154747474747475e-06, + "loss": 0.37, + "step": 34400 + }, + { + "epoch": 1.38, + "learning_rate": 3.1496969696969696e-06, + "loss": 0.3629, + "step": 34425 + }, + { + "epoch": 1.38, + "learning_rate": 3.1446464646464648e-06, + "loss": 0.3733, + "step": 34450 + }, + { + "epoch": 1.38, + "learning_rate": 3.1395959595959595e-06, + "loss": 0.3633, + "step": 34475 + }, + { + "epoch": 1.38, + "learning_rate": 3.1345454545454546e-06, + "loss": 0.3804, + "step": 34500 + }, + { + "epoch": 1.38, + "learning_rate": 3.1294949494949494e-06, + "loss": 0.3715, + "step": 34525 + }, + { + "epoch": 1.39, + "learning_rate": 3.124444444444445e-06, + "loss": 0.3571, + "step": 34550 + }, + { + "epoch": 1.39, + "learning_rate": 3.11939393939394e-06, + "loss": 0.3838, + "step": 34575 + }, + { + "epoch": 1.39, + "learning_rate": 3.114343434343435e-06, + "loss": 0.3638, + "step": 34600 + }, + { + "epoch": 1.39, + "learning_rate": 3.1092929292929295e-06, + "loss": 0.3643, + "step": 34625 + }, + { + "epoch": 1.39, + "learning_rate": 3.1042424242424247e-06, + "loss": 0.3621, + "step": 34650 + }, + { + "epoch": 1.39, + "learning_rate": 3.0991919191919194e-06, + "loss": 0.3687, + "step": 34675 + }, + { + "epoch": 1.39, + "learning_rate": 3.0941414141414145e-06, + "loss": 0.3607, + "step": 34700 + }, + { + "epoch": 1.39, + "learning_rate": 3.0890909090909092e-06, + "loss": 0.3902, + "step": 34725 + }, + { + "epoch": 1.39, + "learning_rate": 3.0840404040404044e-06, + "loss": 0.3709, + "step": 34750 + }, + { + "epoch": 1.39, + "learning_rate": 3.078989898989899e-06, + "loss": 0.3906, + "step": 34775 + }, + { + "epoch": 1.4, + "learning_rate": 3.0739393939393942e-06, + "loss": 0.3538, + "step": 34800 + }, + { + "epoch": 1.4, + "learning_rate": 3.068888888888889e-06, + "loss": 0.3618, + "step": 34825 + }, + { + "epoch": 1.4, + "learning_rate": 3.063838383838384e-06, + "loss": 0.3723, + "step": 34850 + }, + { + "epoch": 1.4, + "learning_rate": 3.058787878787879e-06, + "loss": 0.3607, + "step": 34875 + }, + { + "epoch": 1.4, + "learning_rate": 3.053737373737374e-06, + "loss": 0.363, + "step": 34900 + }, + { + "epoch": 1.4, + "learning_rate": 3.0486868686868687e-06, + "loss": 0.3426, + "step": 34925 + }, + { + "epoch": 1.4, + "learning_rate": 3.0436363636363634e-06, + "loss": 0.3637, + "step": 34950 + }, + { + "epoch": 1.4, + "learning_rate": 3.038585858585859e-06, + "loss": 0.3681, + "step": 34975 + }, + { + "epoch": 1.4, + "learning_rate": 3.033535353535354e-06, + "loss": 0.3667, + "step": 35000 + }, + { + "epoch": 1.4, + "eval_loss": 0.3912336826324463, + "eval_runtime": 305.76, + "eval_samples_per_second": 16.369, + "eval_steps_per_second": 2.047, + "eval_wer": 29.516599824390706, + "step": 35000 + }, + { + "epoch": 1.4, + "learning_rate": 3.028484848484849e-06, + "loss": 0.371, + "step": 35025 + }, + { + "epoch": 1.41, + "learning_rate": 3.023434343434344e-06, + "loss": 0.3572, + "step": 35050 + }, + { + "epoch": 1.41, + "learning_rate": 3.0183838383838387e-06, + "loss": 0.3677, + "step": 35075 + }, + { + "epoch": 1.41, + "learning_rate": 3.013333333333334e-06, + "loss": 0.3687, + "step": 35100 + }, + { + "epoch": 1.41, + "learning_rate": 3.0082828282828286e-06, + "loss": 0.3723, + "step": 35125 + }, + { + "epoch": 1.41, + "learning_rate": 3.0032323232323237e-06, + "loss": 0.3641, + "step": 35150 + }, + { + "epoch": 1.41, + "learning_rate": 2.9981818181818184e-06, + "loss": 0.3574, + "step": 35175 + }, + { + "epoch": 1.41, + "learning_rate": 2.993131313131313e-06, + "loss": 0.3686, + "step": 35200 + }, + { + "epoch": 1.41, + "learning_rate": 2.9880808080808083e-06, + "loss": 0.3802, + "step": 35225 + }, + { + "epoch": 1.41, + "learning_rate": 2.983030303030303e-06, + "loss": 0.3695, + "step": 35250 + }, + { + "epoch": 1.41, + "learning_rate": 2.977979797979798e-06, + "loss": 0.3799, + "step": 35275 + }, + { + "epoch": 1.42, + "learning_rate": 2.972929292929293e-06, + "loss": 0.3693, + "step": 35300 + }, + { + "epoch": 1.42, + "learning_rate": 2.967878787878788e-06, + "loss": 0.3745, + "step": 35325 + }, + { + "epoch": 1.42, + "learning_rate": 2.9628282828282827e-06, + "loss": 0.3884, + "step": 35350 + }, + { + "epoch": 1.42, + "learning_rate": 2.957777777777778e-06, + "loss": 0.3866, + "step": 35375 + }, + { + "epoch": 1.42, + "learning_rate": 2.952727272727273e-06, + "loss": 0.3682, + "step": 35400 + }, + { + "epoch": 1.42, + "learning_rate": 2.947676767676768e-06, + "loss": 0.3848, + "step": 35425 + }, + { + "epoch": 1.42, + "learning_rate": 2.942626262626263e-06, + "loss": 0.3718, + "step": 35450 + }, + { + "epoch": 1.42, + "learning_rate": 2.937575757575758e-06, + "loss": 0.3725, + "step": 35475 + }, + { + "epoch": 1.42, + "learning_rate": 2.9325252525252528e-06, + "loss": 0.3892, + "step": 35500 + }, + { + "epoch": 1.42, + "learning_rate": 2.927474747474748e-06, + "loss": 0.3646, + "step": 35525 + }, + { + "epoch": 1.43, + "learning_rate": 2.9224242424242426e-06, + "loss": 0.3628, + "step": 35550 + }, + { + "epoch": 1.43, + "learning_rate": 2.9173737373737378e-06, + "loss": 0.3609, + "step": 35575 + }, + { + "epoch": 1.43, + "learning_rate": 2.9123232323232325e-06, + "loss": 0.3547, + "step": 35600 + }, + { + "epoch": 1.43, + "learning_rate": 2.9072727272727276e-06, + "loss": 0.3778, + "step": 35625 + }, + { + "epoch": 1.43, + "learning_rate": 2.9022222222222223e-06, + "loss": 0.3585, + "step": 35650 + }, + { + "epoch": 1.43, + "learning_rate": 2.8973737373737375e-06, + "loss": 0.369, + "step": 35675 + }, + { + "epoch": 1.43, + "learning_rate": 2.8923232323232327e-06, + "loss": 0.3617, + "step": 35700 + }, + { + "epoch": 1.43, + "learning_rate": 2.8872727272727274e-06, + "loss": 0.3639, + "step": 35725 + }, + { + "epoch": 1.43, + "learning_rate": 2.8822222222222225e-06, + "loss": 0.3638, + "step": 35750 + }, + { + "epoch": 1.43, + "learning_rate": 2.8771717171717173e-06, + "loss": 0.3639, + "step": 35775 + }, + { + "epoch": 1.44, + "learning_rate": 2.8721212121212124e-06, + "loss": 0.3808, + "step": 35800 + }, + { + "epoch": 1.44, + "learning_rate": 2.867070707070707e-06, + "loss": 0.375, + "step": 35825 + }, + { + "epoch": 1.44, + "learning_rate": 2.862020202020202e-06, + "loss": 0.3533, + "step": 35850 + }, + { + "epoch": 1.44, + "learning_rate": 2.856969696969697e-06, + "loss": 0.3687, + "step": 35875 + }, + { + "epoch": 1.44, + "learning_rate": 2.8519191919191925e-06, + "loss": 0.3734, + "step": 35900 + }, + { + "epoch": 1.44, + "learning_rate": 2.8468686868686873e-06, + "loss": 0.3532, + "step": 35925 + }, + { + "epoch": 1.44, + "learning_rate": 2.8418181818181824e-06, + "loss": 0.3764, + "step": 35950 + }, + { + "epoch": 1.44, + "learning_rate": 2.836767676767677e-06, + "loss": 0.3668, + "step": 35975 + }, + { + "epoch": 1.44, + "learning_rate": 2.8317171717171723e-06, + "loss": 0.3666, + "step": 36000 + }, + { + "epoch": 1.44, + "learning_rate": 2.826666666666667e-06, + "loss": 0.3726, + "step": 36025 + }, + { + "epoch": 1.45, + "learning_rate": 2.8216161616161617e-06, + "loss": 0.3732, + "step": 36050 + }, + { + "epoch": 1.45, + "learning_rate": 2.816565656565657e-06, + "loss": 0.3792, + "step": 36075 + }, + { + "epoch": 1.45, + "learning_rate": 2.8115151515151516e-06, + "loss": 0.3611, + "step": 36100 + }, + { + "epoch": 1.45, + "learning_rate": 2.8064646464646467e-06, + "loss": 0.3788, + "step": 36125 + }, + { + "epoch": 1.45, + "learning_rate": 2.8014141414141414e-06, + "loss": 0.3708, + "step": 36150 + }, + { + "epoch": 1.45, + "learning_rate": 2.7963636363636366e-06, + "loss": 0.3748, + "step": 36175 + }, + { + "epoch": 1.45, + "learning_rate": 2.7913131313131313e-06, + "loss": 0.3703, + "step": 36200 + }, + { + "epoch": 1.45, + "learning_rate": 2.7862626262626264e-06, + "loss": 0.3886, + "step": 36225 + }, + { + "epoch": 1.45, + "learning_rate": 2.781212121212121e-06, + "loss": 0.3808, + "step": 36250 + }, + { + "epoch": 1.45, + "learning_rate": 2.7761616161616163e-06, + "loss": 0.3718, + "step": 36275 + }, + { + "epoch": 1.46, + "learning_rate": 2.771111111111111e-06, + "loss": 0.3705, + "step": 36300 + }, + { + "epoch": 1.46, + "learning_rate": 2.7660606060606066e-06, + "loss": 0.3652, + "step": 36325 + }, + { + "epoch": 1.46, + "learning_rate": 2.7610101010101013e-06, + "loss": 0.3868, + "step": 36350 + }, + { + "epoch": 1.46, + "learning_rate": 2.7559595959595965e-06, + "loss": 0.3726, + "step": 36375 + }, + { + "epoch": 1.46, + "learning_rate": 2.750909090909091e-06, + "loss": 0.3618, + "step": 36400 + }, + { + "epoch": 1.46, + "learning_rate": 2.7458585858585863e-06, + "loss": 0.3691, + "step": 36425 + }, + { + "epoch": 1.46, + "learning_rate": 2.740808080808081e-06, + "loss": 0.3828, + "step": 36450 + }, + { + "epoch": 1.46, + "learning_rate": 2.735757575757576e-06, + "loss": 0.3493, + "step": 36475 + }, + { + "epoch": 1.46, + "learning_rate": 2.730707070707071e-06, + "loss": 0.3479, + "step": 36500 + }, + { + "epoch": 1.46, + "learning_rate": 2.725656565656566e-06, + "loss": 0.3757, + "step": 36525 + }, + { + "epoch": 1.47, + "learning_rate": 2.7206060606060608e-06, + "loss": 0.382, + "step": 36550 + }, + { + "epoch": 1.47, + "learning_rate": 2.715555555555556e-06, + "loss": 0.3821, + "step": 36575 + }, + { + "epoch": 1.47, + "learning_rate": 2.7105050505050506e-06, + "loss": 0.3745, + "step": 36600 + }, + { + "epoch": 1.47, + "learning_rate": 2.7054545454545453e-06, + "loss": 0.3865, + "step": 36625 + }, + { + "epoch": 1.47, + "learning_rate": 2.7004040404040405e-06, + "loss": 0.3973, + "step": 36650 + }, + { + "epoch": 1.47, + "learning_rate": 2.695353535353535e-06, + "loss": 0.3608, + "step": 36675 + }, + { + "epoch": 1.47, + "learning_rate": 2.6903030303030304e-06, + "loss": 0.3895, + "step": 36700 + }, + { + "epoch": 1.47, + "learning_rate": 2.685252525252525e-06, + "loss": 0.3636, + "step": 36725 + }, + { + "epoch": 1.47, + "learning_rate": 2.6802020202020206e-06, + "loss": 0.3612, + "step": 36750 + }, + { + "epoch": 1.47, + "learning_rate": 2.6751515151515158e-06, + "loss": 0.3774, + "step": 36775 + }, + { + "epoch": 1.48, + "learning_rate": 2.6701010101010105e-06, + "loss": 0.3648, + "step": 36800 + }, + { + "epoch": 1.48, + "learning_rate": 2.6650505050505056e-06, + "loss": 0.3923, + "step": 36825 + }, + { + "epoch": 1.48, + "learning_rate": 2.6600000000000004e-06, + "loss": 0.3753, + "step": 36850 + }, + { + "epoch": 1.48, + "learning_rate": 2.654949494949495e-06, + "loss": 0.359, + "step": 36875 + }, + { + "epoch": 1.48, + "learning_rate": 2.6498989898989902e-06, + "loss": 0.3599, + "step": 36900 + }, + { + "epoch": 1.48, + "learning_rate": 2.644848484848485e-06, + "loss": 0.3582, + "step": 36925 + }, + { + "epoch": 1.48, + "learning_rate": 2.63979797979798e-06, + "loss": 0.377, + "step": 36950 + }, + { + "epoch": 1.48, + "learning_rate": 2.634747474747475e-06, + "loss": 0.3565, + "step": 36975 + }, + { + "epoch": 1.48, + "learning_rate": 2.62969696969697e-06, + "loss": 0.3517, + "step": 37000 + }, + { + "epoch": 1.48, + "learning_rate": 2.6246464646464647e-06, + "loss": 0.3668, + "step": 37025 + }, + { + "epoch": 1.49, + "learning_rate": 2.61959595959596e-06, + "loss": 0.3779, + "step": 37050 + }, + { + "epoch": 1.49, + "learning_rate": 2.6145454545454545e-06, + "loss": 0.3635, + "step": 37075 + }, + { + "epoch": 1.49, + "learning_rate": 2.6094949494949497e-06, + "loss": 0.3662, + "step": 37100 + }, + { + "epoch": 1.49, + "learning_rate": 2.6044444444444444e-06, + "loss": 0.3695, + "step": 37125 + }, + { + "epoch": 1.49, + "learning_rate": 2.5993939393939395e-06, + "loss": 0.3585, + "step": 37150 + }, + { + "epoch": 1.49, + "learning_rate": 2.5943434343434347e-06, + "loss": 0.3716, + "step": 37175 + }, + { + "epoch": 1.49, + "learning_rate": 2.58929292929293e-06, + "loss": 0.3694, + "step": 37200 + }, + { + "epoch": 1.49, + "learning_rate": 2.5842424242424246e-06, + "loss": 0.3676, + "step": 37225 + }, + { + "epoch": 1.49, + "learning_rate": 2.5791919191919197e-06, + "loss": 0.3785, + "step": 37250 + }, + { + "epoch": 1.49, + "learning_rate": 2.5741414141414144e-06, + "loss": 0.3505, + "step": 37275 + }, + { + "epoch": 1.5, + "learning_rate": 2.5690909090909096e-06, + "loss": 0.3643, + "step": 37300 + }, + { + "epoch": 1.5, + "learning_rate": 2.5640404040404043e-06, + "loss": 0.3612, + "step": 37325 + }, + { + "epoch": 1.5, + "learning_rate": 2.5589898989898994e-06, + "loss": 0.3833, + "step": 37350 + }, + { + "epoch": 1.5, + "learning_rate": 2.553939393939394e-06, + "loss": 0.3497, + "step": 37375 + }, + { + "epoch": 1.5, + "learning_rate": 2.5488888888888893e-06, + "loss": 0.358, + "step": 37400 + }, + { + "epoch": 1.5, + "learning_rate": 2.543838383838384e-06, + "loss": 0.3683, + "step": 37425 + }, + { + "epoch": 1.5, + "learning_rate": 2.5387878787878787e-06, + "loss": 0.3678, + "step": 37450 + }, + { + "epoch": 1.5, + "learning_rate": 2.533737373737374e-06, + "loss": 0.367, + "step": 37475 + }, + { + "epoch": 1.5, + "learning_rate": 2.5286868686868686e-06, + "loss": 0.3674, + "step": 37500 + }, + { + "epoch": 1.5, + "eval_loss": 0.3881114423274994, + "eval_runtime": 315.0434, + "eval_samples_per_second": 15.887, + "eval_steps_per_second": 1.987, + "eval_wer": 29.611523766582025, + "step": 37500 + }, + { + "epoch": 1.5, + "learning_rate": 2.5236363636363637e-06, + "loss": 0.3705, + "step": 37525 + }, + { + "epoch": 1.51, + "learning_rate": 2.5185858585858584e-06, + "loss": 0.3774, + "step": 37550 + }, + { + "epoch": 1.51, + "learning_rate": 2.5135353535353536e-06, + "loss": 0.3828, + "step": 37575 + }, + { + "epoch": 1.51, + "learning_rate": 2.508484848484849e-06, + "loss": 0.3841, + "step": 37600 + }, + { + "epoch": 1.51, + "learning_rate": 2.503434343434344e-06, + "loss": 0.365, + "step": 37625 + }, + { + "epoch": 1.51, + "learning_rate": 2.4983838383838386e-06, + "loss": 0.3662, + "step": 37650 + }, + { + "epoch": 1.51, + "learning_rate": 2.4935353535353538e-06, + "loss": 0.3612, + "step": 37675 + }, + { + "epoch": 1.51, + "learning_rate": 2.4884848484848485e-06, + "loss": 0.3737, + "step": 37700 + }, + { + "epoch": 1.51, + "learning_rate": 2.4834343434343436e-06, + "loss": 0.3698, + "step": 37725 + }, + { + "epoch": 1.51, + "learning_rate": 2.4783838383838384e-06, + "loss": 0.3605, + "step": 37750 + }, + { + "epoch": 1.51, + "learning_rate": 2.4733333333333335e-06, + "loss": 0.3811, + "step": 37775 + }, + { + "epoch": 1.52, + "learning_rate": 2.4682828282828287e-06, + "loss": 0.3475, + "step": 37800 + }, + { + "epoch": 1.52, + "learning_rate": 2.4632323232323234e-06, + "loss": 0.384, + "step": 37825 + }, + { + "epoch": 1.52, + "learning_rate": 2.4581818181818185e-06, + "loss": 0.3673, + "step": 37850 + }, + { + "epoch": 1.52, + "learning_rate": 2.4531313131313132e-06, + "loss": 0.3607, + "step": 37875 + }, + { + "epoch": 1.52, + "learning_rate": 2.4480808080808084e-06, + "loss": 0.3692, + "step": 37900 + }, + { + "epoch": 1.52, + "learning_rate": 2.443030303030303e-06, + "loss": 0.3598, + "step": 37925 + }, + { + "epoch": 1.52, + "learning_rate": 2.4379797979797982e-06, + "loss": 0.375, + "step": 37950 + }, + { + "epoch": 1.52, + "learning_rate": 2.432929292929293e-06, + "loss": 0.3648, + "step": 37975 + }, + { + "epoch": 1.52, + "learning_rate": 2.427878787878788e-06, + "loss": 0.371, + "step": 38000 + }, + { + "epoch": 1.52, + "learning_rate": 2.4228282828282832e-06, + "loss": 0.3652, + "step": 38025 + }, + { + "epoch": 1.53, + "learning_rate": 2.417777777777778e-06, + "loss": 0.366, + "step": 38050 + }, + { + "epoch": 1.53, + "learning_rate": 2.412727272727273e-06, + "loss": 0.3743, + "step": 38075 + }, + { + "epoch": 1.53, + "learning_rate": 2.407676767676768e-06, + "loss": 0.3759, + "step": 38100 + }, + { + "epoch": 1.53, + "learning_rate": 2.402626262626263e-06, + "loss": 0.3602, + "step": 38125 + }, + { + "epoch": 1.53, + "learning_rate": 2.3975757575757577e-06, + "loss": 0.3499, + "step": 38150 + }, + { + "epoch": 1.53, + "learning_rate": 2.392525252525253e-06, + "loss": 0.379, + "step": 38175 + }, + { + "epoch": 1.53, + "learning_rate": 2.3874747474747476e-06, + "loss": 0.3714, + "step": 38200 + }, + { + "epoch": 1.53, + "learning_rate": 2.3824242424242427e-06, + "loss": 0.3651, + "step": 38225 + }, + { + "epoch": 1.53, + "learning_rate": 2.377373737373738e-06, + "loss": 0.3924, + "step": 38250 + }, + { + "epoch": 1.53, + "learning_rate": 2.3723232323232326e-06, + "loss": 0.3603, + "step": 38275 + }, + { + "epoch": 1.54, + "learning_rate": 2.3672727272727277e-06, + "loss": 0.3641, + "step": 38300 + }, + { + "epoch": 1.54, + "learning_rate": 2.3622222222222224e-06, + "loss": 0.3601, + "step": 38325 + }, + { + "epoch": 1.54, + "learning_rate": 2.357171717171717e-06, + "loss": 0.3579, + "step": 38350 + }, + { + "epoch": 1.54, + "learning_rate": 2.3521212121212123e-06, + "loss": 0.3695, + "step": 38375 + }, + { + "epoch": 1.54, + "learning_rate": 2.347070707070707e-06, + "loss": 0.3897, + "step": 38400 + }, + { + "epoch": 1.54, + "learning_rate": 2.342020202020202e-06, + "loss": 0.3636, + "step": 38425 + }, + { + "epoch": 1.54, + "learning_rate": 2.3369696969696973e-06, + "loss": 0.3608, + "step": 38450 + }, + { + "epoch": 1.54, + "learning_rate": 2.331919191919192e-06, + "loss": 0.3822, + "step": 38475 + }, + { + "epoch": 1.54, + "learning_rate": 2.326868686868687e-06, + "loss": 0.3553, + "step": 38500 + }, + { + "epoch": 1.54, + "learning_rate": 2.321818181818182e-06, + "loss": 0.3531, + "step": 38525 + }, + { + "epoch": 1.55, + "learning_rate": 2.316767676767677e-06, + "loss": 0.3777, + "step": 38550 + }, + { + "epoch": 1.55, + "learning_rate": 2.3117171717171717e-06, + "loss": 0.3587, + "step": 38575 + }, + { + "epoch": 1.55, + "learning_rate": 2.306666666666667e-06, + "loss": 0.351, + "step": 38600 + }, + { + "epoch": 1.55, + "learning_rate": 2.3016161616161616e-06, + "loss": 0.3717, + "step": 38625 + }, + { + "epoch": 1.55, + "learning_rate": 2.2965656565656568e-06, + "loss": 0.3726, + "step": 38650 + }, + { + "epoch": 1.55, + "learning_rate": 2.291515151515152e-06, + "loss": 0.3658, + "step": 38675 + }, + { + "epoch": 1.55, + "learning_rate": 2.2864646464646466e-06, + "loss": 0.3675, + "step": 38700 + }, + { + "epoch": 1.55, + "learning_rate": 2.2814141414141418e-06, + "loss": 0.3596, + "step": 38725 + }, + { + "epoch": 1.55, + "learning_rate": 2.2763636363636365e-06, + "loss": 0.3791, + "step": 38750 + }, + { + "epoch": 1.55, + "learning_rate": 2.2713131313131316e-06, + "loss": 0.3683, + "step": 38775 + }, + { + "epoch": 1.56, + "learning_rate": 2.2662626262626263e-06, + "loss": 0.3827, + "step": 38800 + }, + { + "epoch": 1.56, + "learning_rate": 2.2612121212121215e-06, + "loss": 0.3748, + "step": 38825 + }, + { + "epoch": 1.56, + "learning_rate": 2.256161616161616e-06, + "loss": 0.371, + "step": 38850 + }, + { + "epoch": 1.56, + "learning_rate": 2.2511111111111113e-06, + "loss": 0.3624, + "step": 38875 + }, + { + "epoch": 1.56, + "learning_rate": 2.2460606060606065e-06, + "loss": 0.3662, + "step": 38900 + }, + { + "epoch": 1.56, + "learning_rate": 2.241010101010101e-06, + "loss": 0.3618, + "step": 38925 + }, + { + "epoch": 1.56, + "learning_rate": 2.2359595959595964e-06, + "loss": 0.366, + "step": 38950 + }, + { + "epoch": 1.56, + "learning_rate": 2.230909090909091e-06, + "loss": 0.3647, + "step": 38975 + }, + { + "epoch": 1.56, + "learning_rate": 2.225858585858586e-06, + "loss": 0.3719, + "step": 39000 + }, + { + "epoch": 1.56, + "learning_rate": 2.220808080808081e-06, + "loss": 0.3861, + "step": 39025 + }, + { + "epoch": 1.57, + "learning_rate": 2.2157575757575757e-06, + "loss": 0.374, + "step": 39050 + }, + { + "epoch": 1.57, + "learning_rate": 2.2107070707070712e-06, + "loss": 0.3668, + "step": 39075 + }, + { + "epoch": 1.57, + "learning_rate": 2.205656565656566e-06, + "loss": 0.3666, + "step": 39100 + }, + { + "epoch": 1.57, + "learning_rate": 2.2006060606060607e-06, + "loss": 0.3709, + "step": 39125 + }, + { + "epoch": 1.57, + "learning_rate": 2.195555555555556e-06, + "loss": 0.3439, + "step": 39150 + }, + { + "epoch": 1.57, + "learning_rate": 2.1905050505050505e-06, + "loss": 0.3771, + "step": 39175 + }, + { + "epoch": 1.57, + "learning_rate": 2.1854545454545457e-06, + "loss": 0.3647, + "step": 39200 + }, + { + "epoch": 1.57, + "learning_rate": 2.1804040404040404e-06, + "loss": 0.3765, + "step": 39225 + }, + { + "epoch": 1.57, + "learning_rate": 2.1753535353535355e-06, + "loss": 0.3626, + "step": 39250 + }, + { + "epoch": 1.57, + "learning_rate": 2.1703030303030303e-06, + "loss": 0.3637, + "step": 39275 + }, + { + "epoch": 1.58, + "learning_rate": 2.1652525252525254e-06, + "loss": 0.351, + "step": 39300 + }, + { + "epoch": 1.58, + "learning_rate": 2.1602020202020205e-06, + "loss": 0.3615, + "step": 39325 + }, + { + "epoch": 1.58, + "learning_rate": 2.1551515151515153e-06, + "loss": 0.361, + "step": 39350 + }, + { + "epoch": 1.58, + "learning_rate": 2.1501010101010104e-06, + "loss": 0.349, + "step": 39375 + }, + { + "epoch": 1.58, + "learning_rate": 2.145050505050505e-06, + "loss": 0.3675, + "step": 39400 + }, + { + "epoch": 1.58, + "learning_rate": 2.1400000000000003e-06, + "loss": 0.3569, + "step": 39425 + }, + { + "epoch": 1.58, + "learning_rate": 2.134949494949495e-06, + "loss": 0.347, + "step": 39450 + }, + { + "epoch": 1.58, + "learning_rate": 2.12989898989899e-06, + "loss": 0.3669, + "step": 39475 + }, + { + "epoch": 1.58, + "learning_rate": 2.1248484848484853e-06, + "loss": 0.3688, + "step": 39500 + }, + { + "epoch": 1.58, + "learning_rate": 2.11979797979798e-06, + "loss": 0.3631, + "step": 39525 + }, + { + "epoch": 1.59, + "learning_rate": 2.114747474747475e-06, + "loss": 0.3549, + "step": 39550 + }, + { + "epoch": 1.59, + "learning_rate": 2.10969696969697e-06, + "loss": 0.3504, + "step": 39575 + }, + { + "epoch": 1.59, + "learning_rate": 2.104646464646465e-06, + "loss": 0.3579, + "step": 39600 + }, + { + "epoch": 1.59, + "learning_rate": 2.0995959595959597e-06, + "loss": 0.3856, + "step": 39625 + }, + { + "epoch": 1.59, + "learning_rate": 2.094545454545455e-06, + "loss": 0.3729, + "step": 39650 + }, + { + "epoch": 1.59, + "learning_rate": 2.0894949494949496e-06, + "loss": 0.3809, + "step": 39675 + }, + { + "epoch": 1.59, + "learning_rate": 2.0846464646464648e-06, + "loss": 0.3682, + "step": 39700 + }, + { + "epoch": 1.59, + "learning_rate": 2.07959595959596e-06, + "loss": 0.3707, + "step": 39725 + }, + { + "epoch": 1.59, + "learning_rate": 2.0745454545454546e-06, + "loss": 0.35, + "step": 39750 + }, + { + "epoch": 1.59, + "learning_rate": 2.0694949494949493e-06, + "loss": 0.3763, + "step": 39775 + }, + { + "epoch": 1.6, + "learning_rate": 2.064444444444445e-06, + "loss": 0.3857, + "step": 39800 + }, + { + "epoch": 1.6, + "learning_rate": 2.0593939393939396e-06, + "loss": 0.3519, + "step": 39825 + }, + { + "epoch": 1.6, + "learning_rate": 2.0543434343434348e-06, + "loss": 0.3685, + "step": 39850 + }, + { + "epoch": 1.6, + "learning_rate": 2.0492929292929295e-06, + "loss": 0.3894, + "step": 39875 + }, + { + "epoch": 1.6, + "learning_rate": 2.0442424242424242e-06, + "loss": 0.3639, + "step": 39900 + }, + { + "epoch": 1.6, + "learning_rate": 2.0391919191919194e-06, + "loss": 0.3852, + "step": 39925 + }, + { + "epoch": 1.6, + "learning_rate": 2.034141414141414e-06, + "loss": 0.3704, + "step": 39950 + }, + { + "epoch": 1.6, + "learning_rate": 2.0290909090909092e-06, + "loss": 0.3497, + "step": 39975 + }, + { + "epoch": 1.6, + "learning_rate": 2.024040404040404e-06, + "loss": 0.3721, + "step": 40000 + }, + { + "epoch": 1.6, + "eval_loss": 0.38509780168533325, + "eval_runtime": 317.4006, + "eval_samples_per_second": 15.769, + "eval_steps_per_second": 1.972, + "eval_wer": 30.406511782434325, + "step": 40000 + }, + { + "epoch": 1.6, + "learning_rate": 2.018989898989899e-06, + "loss": 0.3682, + "step": 40025 + }, + { + "epoch": 1.61, + "learning_rate": 2.0139393939393942e-06, + "loss": 0.3679, + "step": 40050 + }, + { + "epoch": 1.61, + "learning_rate": 2.008888888888889e-06, + "loss": 0.3719, + "step": 40075 + }, + { + "epoch": 1.61, + "learning_rate": 2.003838383838384e-06, + "loss": 0.3647, + "step": 40100 + }, + { + "epoch": 1.61, + "learning_rate": 1.998787878787879e-06, + "loss": 0.3515, + "step": 40125 + }, + { + "epoch": 1.61, + "learning_rate": 1.993737373737374e-06, + "loss": 0.3651, + "step": 40150 + }, + { + "epoch": 1.61, + "learning_rate": 1.9886868686868687e-06, + "loss": 0.3716, + "step": 40175 + }, + { + "epoch": 1.61, + "learning_rate": 1.983636363636364e-06, + "loss": 0.3559, + "step": 40200 + }, + { + "epoch": 1.61, + "learning_rate": 1.9785858585858585e-06, + "loss": 0.3673, + "step": 40225 + }, + { + "epoch": 1.61, + "learning_rate": 1.9735353535353537e-06, + "loss": 0.3724, + "step": 40250 + }, + { + "epoch": 1.62, + "learning_rate": 1.968484848484849e-06, + "loss": 0.3587, + "step": 40275 + }, + { + "epoch": 1.62, + "learning_rate": 1.9634343434343435e-06, + "loss": 0.3762, + "step": 40300 + }, + { + "epoch": 1.62, + "learning_rate": 1.9583838383838387e-06, + "loss": 0.3616, + "step": 40325 + }, + { + "epoch": 1.62, + "learning_rate": 1.9533333333333334e-06, + "loss": 0.3605, + "step": 40350 + }, + { + "epoch": 1.62, + "learning_rate": 1.9482828282828286e-06, + "loss": 0.3805, + "step": 40375 + }, + { + "epoch": 1.62, + "learning_rate": 1.9432323232323233e-06, + "loss": 0.3777, + "step": 40400 + }, + { + "epoch": 1.62, + "learning_rate": 1.9381818181818184e-06, + "loss": 0.3648, + "step": 40425 + }, + { + "epoch": 1.62, + "learning_rate": 1.9331313131313136e-06, + "loss": 0.3803, + "step": 40450 + }, + { + "epoch": 1.62, + "learning_rate": 1.9280808080808083e-06, + "loss": 0.3942, + "step": 40475 + }, + { + "epoch": 1.62, + "learning_rate": 1.9230303030303034e-06, + "loss": 0.3739, + "step": 40500 + }, + { + "epoch": 1.63, + "learning_rate": 1.917979797979798e-06, + "loss": 0.3552, + "step": 40525 + }, + { + "epoch": 1.63, + "learning_rate": 1.9129292929292933e-06, + "loss": 0.367, + "step": 40550 + }, + { + "epoch": 1.63, + "learning_rate": 1.907878787878788e-06, + "loss": 0.3621, + "step": 40575 + }, + { + "epoch": 1.63, + "learning_rate": 1.902828282828283e-06, + "loss": 0.3791, + "step": 40600 + }, + { + "epoch": 1.63, + "learning_rate": 1.8977777777777779e-06, + "loss": 0.3655, + "step": 40625 + }, + { + "epoch": 1.63, + "learning_rate": 1.8927272727272728e-06, + "loss": 0.3467, + "step": 40650 + }, + { + "epoch": 1.63, + "learning_rate": 1.887676767676768e-06, + "loss": 0.3754, + "step": 40675 + }, + { + "epoch": 1.63, + "learning_rate": 1.8826262626262629e-06, + "loss": 0.3749, + "step": 40700 + }, + { + "epoch": 1.63, + "learning_rate": 1.8775757575757578e-06, + "loss": 0.3766, + "step": 40725 + }, + { + "epoch": 1.63, + "learning_rate": 1.8725252525252527e-06, + "loss": 0.3737, + "step": 40750 + }, + { + "epoch": 1.64, + "learning_rate": 1.8674747474747477e-06, + "loss": 0.3661, + "step": 40775 + }, + { + "epoch": 1.64, + "learning_rate": 1.8624242424242426e-06, + "loss": 0.396, + "step": 40800 + }, + { + "epoch": 1.64, + "learning_rate": 1.8573737373737375e-06, + "loss": 0.3857, + "step": 40825 + }, + { + "epoch": 1.64, + "learning_rate": 1.8523232323232325e-06, + "loss": 0.3655, + "step": 40850 + }, + { + "epoch": 1.64, + "learning_rate": 1.8472727272727276e-06, + "loss": 0.3718, + "step": 40875 + }, + { + "epoch": 1.64, + "learning_rate": 1.8422222222222225e-06, + "loss": 0.3662, + "step": 40900 + }, + { + "epoch": 1.64, + "learning_rate": 1.8371717171717175e-06, + "loss": 0.3759, + "step": 40925 + }, + { + "epoch": 1.64, + "learning_rate": 1.8321212121212124e-06, + "loss": 0.3694, + "step": 40950 + }, + { + "epoch": 1.64, + "learning_rate": 1.8270707070707071e-06, + "loss": 0.3765, + "step": 40975 + }, + { + "epoch": 1.64, + "learning_rate": 1.822020202020202e-06, + "loss": 0.3684, + "step": 41000 + }, + { + "epoch": 1.65, + "learning_rate": 1.816969696969697e-06, + "loss": 0.3709, + "step": 41025 + }, + { + "epoch": 1.65, + "learning_rate": 1.811919191919192e-06, + "loss": 0.3516, + "step": 41050 + }, + { + "epoch": 1.65, + "learning_rate": 1.8068686868686868e-06, + "loss": 0.3558, + "step": 41075 + }, + { + "epoch": 1.65, + "learning_rate": 1.801818181818182e-06, + "loss": 0.3525, + "step": 41100 + }, + { + "epoch": 1.65, + "learning_rate": 1.796767676767677e-06, + "loss": 0.3709, + "step": 41125 + }, + { + "epoch": 1.65, + "learning_rate": 1.7917171717171719e-06, + "loss": 0.3559, + "step": 41150 + }, + { + "epoch": 1.65, + "learning_rate": 1.7866666666666668e-06, + "loss": 0.3896, + "step": 41175 + }, + { + "epoch": 1.65, + "learning_rate": 1.7816161616161617e-06, + "loss": 0.3619, + "step": 41200 + }, + { + "epoch": 1.65, + "learning_rate": 1.7765656565656566e-06, + "loss": 0.3749, + "step": 41225 + }, + { + "epoch": 1.65, + "learning_rate": 1.7715151515151516e-06, + "loss": 0.3763, + "step": 41250 + }, + { + "epoch": 1.66, + "learning_rate": 1.7664646464646465e-06, + "loss": 0.3526, + "step": 41275 + }, + { + "epoch": 1.66, + "learning_rate": 1.7614141414141417e-06, + "loss": 0.366, + "step": 41300 + }, + { + "epoch": 1.66, + "learning_rate": 1.7563636363636366e-06, + "loss": 0.367, + "step": 41325 + }, + { + "epoch": 1.66, + "learning_rate": 1.7513131313131315e-06, + "loss": 0.3867, + "step": 41350 + }, + { + "epoch": 1.66, + "learning_rate": 1.7462626262626264e-06, + "loss": 0.3798, + "step": 41375 + }, + { + "epoch": 1.66, + "learning_rate": 1.7412121212121214e-06, + "loss": 0.36, + "step": 41400 + }, + { + "epoch": 1.66, + "learning_rate": 1.7361616161616163e-06, + "loss": 0.3643, + "step": 41425 + }, + { + "epoch": 1.66, + "learning_rate": 1.7311111111111112e-06, + "loss": 0.3475, + "step": 41450 + }, + { + "epoch": 1.66, + "learning_rate": 1.7260606060606062e-06, + "loss": 0.3631, + "step": 41475 + }, + { + "epoch": 1.66, + "learning_rate": 1.721010101010101e-06, + "loss": 0.3672, + "step": 41500 + }, + { + "epoch": 1.67, + "learning_rate": 1.7159595959595962e-06, + "loss": 0.368, + "step": 41525 + }, + { + "epoch": 1.67, + "learning_rate": 1.7109090909090912e-06, + "loss": 0.3634, + "step": 41550 + }, + { + "epoch": 1.67, + "learning_rate": 1.7058585858585861e-06, + "loss": 0.3569, + "step": 41575 + }, + { + "epoch": 1.67, + "learning_rate": 1.700808080808081e-06, + "loss": 0.3395, + "step": 41600 + }, + { + "epoch": 1.67, + "learning_rate": 1.695757575757576e-06, + "loss": 0.3582, + "step": 41625 + }, + { + "epoch": 1.67, + "learning_rate": 1.6907070707070707e-06, + "loss": 0.3674, + "step": 41650 + }, + { + "epoch": 1.67, + "learning_rate": 1.6856565656565656e-06, + "loss": 0.377, + "step": 41675 + }, + { + "epoch": 1.67, + "learning_rate": 1.680808080808081e-06, + "loss": 0.3689, + "step": 41700 + }, + { + "epoch": 1.67, + "learning_rate": 1.675757575757576e-06, + "loss": 0.3744, + "step": 41725 + }, + { + "epoch": 1.67, + "learning_rate": 1.6707070707070707e-06, + "loss": 0.3565, + "step": 41750 + }, + { + "epoch": 1.68, + "learning_rate": 1.6656565656565656e-06, + "loss": 0.3623, + "step": 41775 + }, + { + "epoch": 1.68, + "learning_rate": 1.6606060606060605e-06, + "loss": 0.3758, + "step": 41800 + }, + { + "epoch": 1.68, + "learning_rate": 1.6555555555555559e-06, + "loss": 0.3699, + "step": 41825 + }, + { + "epoch": 1.68, + "learning_rate": 1.6505050505050508e-06, + "loss": 0.3665, + "step": 41850 + }, + { + "epoch": 1.68, + "learning_rate": 1.6454545454545455e-06, + "loss": 0.3513, + "step": 41875 + }, + { + "epoch": 1.68, + "learning_rate": 1.6404040404040405e-06, + "loss": 0.3731, + "step": 41900 + }, + { + "epoch": 1.68, + "learning_rate": 1.6353535353535354e-06, + "loss": 0.3793, + "step": 41925 + }, + { + "epoch": 1.68, + "learning_rate": 1.6303030303030303e-06, + "loss": 0.3615, + "step": 41950 + }, + { + "epoch": 1.68, + "learning_rate": 1.6252525252525253e-06, + "loss": 0.3517, + "step": 41975 + }, + { + "epoch": 1.68, + "learning_rate": 1.6202020202020202e-06, + "loss": 0.3619, + "step": 42000 + }, + { + "epoch": 1.69, + "learning_rate": 1.6151515151515153e-06, + "loss": 0.3916, + "step": 42025 + }, + { + "epoch": 1.69, + "learning_rate": 1.6101010101010103e-06, + "loss": 0.3582, + "step": 42050 + }, + { + "epoch": 1.69, + "learning_rate": 1.6050505050505052e-06, + "loss": 0.3558, + "step": 42075 + }, + { + "epoch": 1.69, + "learning_rate": 1.6000000000000001e-06, + "loss": 0.3679, + "step": 42100 + }, + { + "epoch": 1.69, + "learning_rate": 1.594949494949495e-06, + "loss": 0.3584, + "step": 42125 + }, + { + "epoch": 1.69, + "learning_rate": 1.58989898989899e-06, + "loss": 0.3667, + "step": 42150 + }, + { + "epoch": 1.69, + "learning_rate": 1.584848484848485e-06, + "loss": 0.3477, + "step": 42175 + }, + { + "epoch": 1.69, + "learning_rate": 1.5797979797979799e-06, + "loss": 0.3554, + "step": 42200 + }, + { + "epoch": 1.69, + "learning_rate": 1.5747474747474748e-06, + "loss": 0.3663, + "step": 42225 + }, + { + "epoch": 1.69, + "learning_rate": 1.56969696969697e-06, + "loss": 0.3485, + "step": 42250 + }, + { + "epoch": 1.7, + "learning_rate": 1.5646464646464649e-06, + "loss": 0.3515, + "step": 42275 + }, + { + "epoch": 1.7, + "learning_rate": 1.5595959595959598e-06, + "loss": 0.3592, + "step": 42300 + }, + { + "epoch": 1.7, + "learning_rate": 1.5545454545454547e-06, + "loss": 0.3737, + "step": 42325 + }, + { + "epoch": 1.7, + "learning_rate": 1.5494949494949497e-06, + "loss": 0.3788, + "step": 42350 + }, + { + "epoch": 1.7, + "learning_rate": 1.5444444444444446e-06, + "loss": 0.3592, + "step": 42375 + }, + { + "epoch": 1.7, + "learning_rate": 1.5393939393939395e-06, + "loss": 0.342, + "step": 42400 + }, + { + "epoch": 1.7, + "learning_rate": 1.5343434343434345e-06, + "loss": 0.3619, + "step": 42425 + }, + { + "epoch": 1.7, + "learning_rate": 1.5292929292929296e-06, + "loss": 0.3524, + "step": 42450 + }, + { + "epoch": 1.7, + "learning_rate": 1.5242424242424245e-06, + "loss": 0.3443, + "step": 42475 + }, + { + "epoch": 1.7, + "learning_rate": 1.5191919191919195e-06, + "loss": 0.3533, + "step": 42500 + }, + { + "epoch": 1.7, + "eval_loss": 0.3833695948123932, + "eval_runtime": 310.9704, + "eval_samples_per_second": 16.095, + "eval_steps_per_second": 2.013, + "eval_wer": 27.969339566672204, + "step": 42500 + }, + { + "epoch": 1.71, + "learning_rate": 1.5141414141414144e-06, + "loss": 0.3873, + "step": 42525 + }, + { + "epoch": 1.71, + "learning_rate": 1.5090909090909091e-06, + "loss": 0.3634, + "step": 42550 + }, + { + "epoch": 1.71, + "learning_rate": 1.504040404040404e-06, + "loss": 0.3539, + "step": 42575 + }, + { + "epoch": 1.71, + "learning_rate": 1.498989898989899e-06, + "loss": 0.3574, + "step": 42600 + }, + { + "epoch": 1.71, + "learning_rate": 1.493939393939394e-06, + "loss": 0.3717, + "step": 42625 + }, + { + "epoch": 1.71, + "learning_rate": 1.4888888888888888e-06, + "loss": 0.3548, + "step": 42650 + }, + { + "epoch": 1.71, + "learning_rate": 1.483838383838384e-06, + "loss": 0.3441, + "step": 42675 + }, + { + "epoch": 1.71, + "learning_rate": 1.478787878787879e-06, + "loss": 0.3601, + "step": 42700 + }, + { + "epoch": 1.71, + "learning_rate": 1.4737373737373739e-06, + "loss": 0.3734, + "step": 42725 + }, + { + "epoch": 1.71, + "learning_rate": 1.4686868686868688e-06, + "loss": 0.3636, + "step": 42750 + }, + { + "epoch": 1.72, + "learning_rate": 1.4636363636363637e-06, + "loss": 0.366, + "step": 42775 + }, + { + "epoch": 1.72, + "learning_rate": 1.4585858585858586e-06, + "loss": 0.3627, + "step": 42800 + }, + { + "epoch": 1.72, + "learning_rate": 1.4535353535353536e-06, + "loss": 0.3757, + "step": 42825 + }, + { + "epoch": 1.72, + "learning_rate": 1.4484848484848485e-06, + "loss": 0.3681, + "step": 42850 + }, + { + "epoch": 1.72, + "learning_rate": 1.4434343434343437e-06, + "loss": 0.3629, + "step": 42875 + }, + { + "epoch": 1.72, + "learning_rate": 1.4383838383838386e-06, + "loss": 0.3865, + "step": 42900 + }, + { + "epoch": 1.72, + "learning_rate": 1.4333333333333335e-06, + "loss": 0.3495, + "step": 42925 + }, + { + "epoch": 1.72, + "learning_rate": 1.4282828282828284e-06, + "loss": 0.3639, + "step": 42950 + }, + { + "epoch": 1.72, + "learning_rate": 1.4232323232323234e-06, + "loss": 0.3836, + "step": 42975 + }, + { + "epoch": 1.72, + "learning_rate": 1.4181818181818183e-06, + "loss": 0.339, + "step": 43000 + }, + { + "epoch": 1.73, + "learning_rate": 1.4131313131313132e-06, + "loss": 0.3689, + "step": 43025 + }, + { + "epoch": 1.73, + "learning_rate": 1.4080808080808082e-06, + "loss": 0.3676, + "step": 43050 + }, + { + "epoch": 1.73, + "learning_rate": 1.403030303030303e-06, + "loss": 0.3709, + "step": 43075 + }, + { + "epoch": 1.73, + "learning_rate": 1.3979797979797982e-06, + "loss": 0.3642, + "step": 43100 + }, + { + "epoch": 1.73, + "learning_rate": 1.3929292929292932e-06, + "loss": 0.3747, + "step": 43125 + }, + { + "epoch": 1.73, + "learning_rate": 1.3878787878787881e-06, + "loss": 0.377, + "step": 43150 + }, + { + "epoch": 1.73, + "learning_rate": 1.382828282828283e-06, + "loss": 0.3567, + "step": 43175 + }, + { + "epoch": 1.73, + "learning_rate": 1.377777777777778e-06, + "loss": 0.3613, + "step": 43200 + }, + { + "epoch": 1.73, + "learning_rate": 1.3727272727272727e-06, + "loss": 0.3624, + "step": 43225 + }, + { + "epoch": 1.73, + "learning_rate": 1.3676767676767676e-06, + "loss": 0.3782, + "step": 43250 + }, + { + "epoch": 1.74, + "learning_rate": 1.3626262626262626e-06, + "loss": 0.3644, + "step": 43275 + }, + { + "epoch": 1.74, + "learning_rate": 1.357575757575758e-06, + "loss": 0.3648, + "step": 43300 + }, + { + "epoch": 1.74, + "learning_rate": 1.3525252525252528e-06, + "loss": 0.3521, + "step": 43325 + }, + { + "epoch": 1.74, + "learning_rate": 1.3474747474747476e-06, + "loss": 0.3833, + "step": 43350 + }, + { + "epoch": 1.74, + "learning_rate": 1.3424242424242425e-06, + "loss": 0.3597, + "step": 43375 + }, + { + "epoch": 1.74, + "learning_rate": 1.3373737373737374e-06, + "loss": 0.3648, + "step": 43400 + }, + { + "epoch": 1.74, + "learning_rate": 1.3323232323232324e-06, + "loss": 0.3674, + "step": 43425 + }, + { + "epoch": 1.74, + "learning_rate": 1.3272727272727273e-06, + "loss": 0.3361, + "step": 43450 + }, + { + "epoch": 1.74, + "learning_rate": 1.3222222222222222e-06, + "loss": 0.36, + "step": 43475 + }, + { + "epoch": 1.74, + "learning_rate": 1.3171717171717172e-06, + "loss": 0.3592, + "step": 43500 + }, + { + "epoch": 1.75, + "learning_rate": 1.3121212121212123e-06, + "loss": 0.3741, + "step": 43525 + }, + { + "epoch": 1.75, + "learning_rate": 1.3070707070707072e-06, + "loss": 0.36, + "step": 43550 + }, + { + "epoch": 1.75, + "learning_rate": 1.3020202020202022e-06, + "loss": 0.3622, + "step": 43575 + }, + { + "epoch": 1.75, + "learning_rate": 1.296969696969697e-06, + "loss": 0.3577, + "step": 43600 + }, + { + "epoch": 1.75, + "learning_rate": 1.291919191919192e-06, + "loss": 0.3591, + "step": 43625 + }, + { + "epoch": 1.75, + "learning_rate": 1.286868686868687e-06, + "loss": 0.3711, + "step": 43650 + }, + { + "epoch": 1.75, + "learning_rate": 1.2818181818181819e-06, + "loss": 0.3559, + "step": 43675 + }, + { + "epoch": 1.75, + "learning_rate": 1.276969696969697e-06, + "loss": 0.3399, + "step": 43700 + }, + { + "epoch": 1.75, + "learning_rate": 1.271919191919192e-06, + "loss": 0.3564, + "step": 43725 + }, + { + "epoch": 1.75, + "learning_rate": 1.266868686868687e-06, + "loss": 0.3511, + "step": 43750 + }, + { + "epoch": 1.76, + "learning_rate": 1.2618181818181819e-06, + "loss": 0.3581, + "step": 43775 + }, + { + "epoch": 1.76, + "learning_rate": 1.2567676767676768e-06, + "loss": 0.3699, + "step": 43800 + }, + { + "epoch": 1.76, + "learning_rate": 1.251717171717172e-06, + "loss": 0.3608, + "step": 43825 + }, + { + "epoch": 1.76, + "learning_rate": 1.2466666666666667e-06, + "loss": 0.4034, + "step": 43850 + }, + { + "epoch": 1.76, + "learning_rate": 1.2416161616161618e-06, + "loss": 0.3626, + "step": 43875 + }, + { + "epoch": 1.76, + "learning_rate": 1.2365656565656567e-06, + "loss": 0.3781, + "step": 43900 + }, + { + "epoch": 1.76, + "learning_rate": 1.2315151515151517e-06, + "loss": 0.3429, + "step": 43925 + }, + { + "epoch": 1.76, + "learning_rate": 1.2264646464646466e-06, + "loss": 0.3661, + "step": 43950 + }, + { + "epoch": 1.76, + "learning_rate": 1.2214141414141415e-06, + "loss": 0.3534, + "step": 43975 + }, + { + "epoch": 1.76, + "learning_rate": 1.2163636363636365e-06, + "loss": 0.3589, + "step": 44000 + }, + { + "epoch": 1.77, + "learning_rate": 1.2113131313131314e-06, + "loss": 0.3432, + "step": 44025 + }, + { + "epoch": 1.77, + "learning_rate": 1.2062626262626263e-06, + "loss": 0.3779, + "step": 44050 + }, + { + "epoch": 1.77, + "learning_rate": 1.2012121212121213e-06, + "loss": 0.3539, + "step": 44075 + }, + { + "epoch": 1.77, + "learning_rate": 1.1961616161616164e-06, + "loss": 0.3715, + "step": 44100 + }, + { + "epoch": 1.77, + "learning_rate": 1.1911111111111111e-06, + "loss": 0.3593, + "step": 44125 + }, + { + "epoch": 1.77, + "learning_rate": 1.186060606060606e-06, + "loss": 0.375, + "step": 44150 + }, + { + "epoch": 1.77, + "learning_rate": 1.181010101010101e-06, + "loss": 0.3881, + "step": 44175 + }, + { + "epoch": 1.77, + "learning_rate": 1.1759595959595961e-06, + "loss": 0.3624, + "step": 44200 + }, + { + "epoch": 1.77, + "learning_rate": 1.170909090909091e-06, + "loss": 0.3858, + "step": 44225 + }, + { + "epoch": 1.77, + "learning_rate": 1.165858585858586e-06, + "loss": 0.3705, + "step": 44250 + }, + { + "epoch": 1.78, + "learning_rate": 1.160808080808081e-06, + "loss": 0.3474, + "step": 44275 + }, + { + "epoch": 1.78, + "learning_rate": 1.1557575757575759e-06, + "loss": 0.3674, + "step": 44300 + }, + { + "epoch": 1.78, + "learning_rate": 1.1507070707070708e-06, + "loss": 0.3706, + "step": 44325 + }, + { + "epoch": 1.78, + "learning_rate": 1.1456565656565657e-06, + "loss": 0.3674, + "step": 44350 + }, + { + "epoch": 1.78, + "learning_rate": 1.1406060606060606e-06, + "loss": 0.367, + "step": 44375 + }, + { + "epoch": 1.78, + "learning_rate": 1.1355555555555558e-06, + "loss": 0.3647, + "step": 44400 + }, + { + "epoch": 1.78, + "learning_rate": 1.1305050505050507e-06, + "loss": 0.3667, + "step": 44425 + }, + { + "epoch": 1.78, + "learning_rate": 1.1254545454545457e-06, + "loss": 0.3557, + "step": 44450 + }, + { + "epoch": 1.78, + "learning_rate": 1.1204040404040404e-06, + "loss": 0.3523, + "step": 44475 + }, + { + "epoch": 1.78, + "learning_rate": 1.1153535353535353e-06, + "loss": 0.3559, + "step": 44500 + }, + { + "epoch": 1.79, + "learning_rate": 1.1103030303030304e-06, + "loss": 0.3484, + "step": 44525 + }, + { + "epoch": 1.79, + "learning_rate": 1.1052525252525254e-06, + "loss": 0.372, + "step": 44550 + }, + { + "epoch": 1.79, + "learning_rate": 1.1002020202020203e-06, + "loss": 0.3515, + "step": 44575 + }, + { + "epoch": 1.79, + "learning_rate": 1.0951515151515152e-06, + "loss": 0.3759, + "step": 44600 + }, + { + "epoch": 1.79, + "learning_rate": 1.0901010101010102e-06, + "loss": 0.3682, + "step": 44625 + }, + { + "epoch": 1.79, + "learning_rate": 1.085050505050505e-06, + "loss": 0.362, + "step": 44650 + }, + { + "epoch": 1.79, + "learning_rate": 1.08e-06, + "loss": 0.3558, + "step": 44675 + }, + { + "epoch": 1.79, + "learning_rate": 1.074949494949495e-06, + "loss": 0.3483, + "step": 44700 + }, + { + "epoch": 1.79, + "learning_rate": 1.0698989898989901e-06, + "loss": 0.3358, + "step": 44725 + }, + { + "epoch": 1.79, + "learning_rate": 1.064848484848485e-06, + "loss": 0.3726, + "step": 44750 + }, + { + "epoch": 1.8, + "learning_rate": 1.05979797979798e-06, + "loss": 0.3698, + "step": 44775 + }, + { + "epoch": 1.8, + "learning_rate": 1.0547474747474747e-06, + "loss": 0.3674, + "step": 44800 + }, + { + "epoch": 1.8, + "learning_rate": 1.0496969696969696e-06, + "loss": 0.3718, + "step": 44825 + }, + { + "epoch": 1.8, + "learning_rate": 1.0446464646464648e-06, + "loss": 0.3684, + "step": 44850 + }, + { + "epoch": 1.8, + "learning_rate": 1.0395959595959597e-06, + "loss": 0.3546, + "step": 44875 + }, + { + "epoch": 1.8, + "learning_rate": 1.0345454545454546e-06, + "loss": 0.357, + "step": 44900 + }, + { + "epoch": 1.8, + "learning_rate": 1.0294949494949496e-06, + "loss": 0.3537, + "step": 44925 + }, + { + "epoch": 1.8, + "learning_rate": 1.0244444444444445e-06, + "loss": 0.3616, + "step": 44950 + }, + { + "epoch": 1.8, + "learning_rate": 1.0193939393939394e-06, + "loss": 0.349, + "step": 44975 + }, + { + "epoch": 1.8, + "learning_rate": 1.0143434343434344e-06, + "loss": 0.3594, + "step": 45000 + }, + { + "epoch": 1.8, + "eval_loss": 0.38151976466178894, + "eval_runtime": 308.7744, + "eval_samples_per_second": 16.209, + "eval_steps_per_second": 2.027, + "eval_wer": 28.856878426161035, + "step": 45000 + }, + { + "epoch": 1.81, + "learning_rate": 1.0092929292929293e-06, + "loss": 0.3538, + "step": 45025 + }, + { + "epoch": 1.81, + "learning_rate": 1.0042424242424244e-06, + "loss": 0.3699, + "step": 45050 + }, + { + "epoch": 1.81, + "learning_rate": 9.991919191919194e-07, + "loss": 0.3676, + "step": 45075 + }, + { + "epoch": 1.81, + "learning_rate": 9.941414141414143e-07, + "loss": 0.3679, + "step": 45100 + }, + { + "epoch": 1.81, + "learning_rate": 9.890909090909092e-07, + "loss": 0.3621, + "step": 45125 + }, + { + "epoch": 1.81, + "learning_rate": 9.840404040404042e-07, + "loss": 0.3517, + "step": 45150 + }, + { + "epoch": 1.81, + "learning_rate": 9.78989898989899e-07, + "loss": 0.3819, + "step": 45175 + }, + { + "epoch": 1.81, + "learning_rate": 9.73939393939394e-07, + "loss": 0.3628, + "step": 45200 + }, + { + "epoch": 1.81, + "learning_rate": 9.68888888888889e-07, + "loss": 0.3475, + "step": 45225 + }, + { + "epoch": 1.81, + "learning_rate": 9.638383838383839e-07, + "loss": 0.3486, + "step": 45250 + }, + { + "epoch": 1.82, + "learning_rate": 9.587878787878788e-07, + "loss": 0.3573, + "step": 45275 + }, + { + "epoch": 1.82, + "learning_rate": 9.537373737373737e-07, + "loss": 0.3664, + "step": 45300 + }, + { + "epoch": 1.82, + "learning_rate": 9.486868686868688e-07, + "loss": 0.3648, + "step": 45325 + }, + { + "epoch": 1.82, + "learning_rate": 9.436363636363636e-07, + "loss": 0.3614, + "step": 45350 + }, + { + "epoch": 1.82, + "learning_rate": 9.385858585858588e-07, + "loss": 0.3586, + "step": 45375 + }, + { + "epoch": 1.82, + "learning_rate": 9.335353535353536e-07, + "loss": 0.3629, + "step": 45400 + }, + { + "epoch": 1.82, + "learning_rate": 9.284848484848485e-07, + "loss": 0.38, + "step": 45425 + }, + { + "epoch": 1.82, + "learning_rate": 9.234343434343434e-07, + "loss": 0.3636, + "step": 45450 + }, + { + "epoch": 1.82, + "learning_rate": 9.183838383838385e-07, + "loss": 0.3382, + "step": 45475 + }, + { + "epoch": 1.82, + "learning_rate": 9.133333333333334e-07, + "loss": 0.3504, + "step": 45500 + }, + { + "epoch": 1.83, + "learning_rate": 9.082828282828283e-07, + "loss": 0.3541, + "step": 45525 + }, + { + "epoch": 1.83, + "learning_rate": 9.032323232323233e-07, + "loss": 0.3672, + "step": 45550 + }, + { + "epoch": 1.83, + "learning_rate": 8.981818181818183e-07, + "loss": 0.3681, + "step": 45575 + }, + { + "epoch": 1.83, + "learning_rate": 8.931313131313132e-07, + "loss": 0.3692, + "step": 45600 + }, + { + "epoch": 1.83, + "learning_rate": 8.880808080808082e-07, + "loss": 0.3579, + "step": 45625 + }, + { + "epoch": 1.83, + "learning_rate": 8.830303030303031e-07, + "loss": 0.3597, + "step": 45650 + }, + { + "epoch": 1.83, + "learning_rate": 8.77979797979798e-07, + "loss": 0.3499, + "step": 45675 + }, + { + "epoch": 1.83, + "learning_rate": 8.729292929292931e-07, + "loss": 0.3556, + "step": 45700 + }, + { + "epoch": 1.83, + "learning_rate": 8.680808080808082e-07, + "loss": 0.3659, + "step": 45725 + }, + { + "epoch": 1.83, + "learning_rate": 8.630303030303031e-07, + "loss": 0.3677, + "step": 45750 + }, + { + "epoch": 1.84, + "learning_rate": 8.579797979797981e-07, + "loss": 0.352, + "step": 45775 + }, + { + "epoch": 1.84, + "learning_rate": 8.529292929292931e-07, + "loss": 0.3722, + "step": 45800 + }, + { + "epoch": 1.84, + "learning_rate": 8.47878787878788e-07, + "loss": 0.353, + "step": 45825 + }, + { + "epoch": 1.84, + "learning_rate": 8.428282828282828e-07, + "loss": 0.3546, + "step": 45850 + }, + { + "epoch": 1.84, + "learning_rate": 8.37777777777778e-07, + "loss": 0.3588, + "step": 45875 + }, + { + "epoch": 1.84, + "learning_rate": 8.327272727272728e-07, + "loss": 0.367, + "step": 45900 + }, + { + "epoch": 1.84, + "learning_rate": 8.276767676767677e-07, + "loss": 0.3414, + "step": 45925 + }, + { + "epoch": 1.84, + "learning_rate": 8.226262626262626e-07, + "loss": 0.3635, + "step": 45950 + }, + { + "epoch": 1.84, + "learning_rate": 8.175757575757576e-07, + "loss": 0.3416, + "step": 45975 + }, + { + "epoch": 1.84, + "learning_rate": 8.125252525252526e-07, + "loss": 0.3722, + "step": 46000 + }, + { + "epoch": 1.85, + "learning_rate": 8.074747474747475e-07, + "loss": 0.3616, + "step": 46025 + }, + { + "epoch": 1.85, + "learning_rate": 8.024242424242425e-07, + "loss": 0.3517, + "step": 46050 + }, + { + "epoch": 1.85, + "learning_rate": 7.973737373737374e-07, + "loss": 0.3687, + "step": 46075 + }, + { + "epoch": 1.85, + "learning_rate": 7.923232323232324e-07, + "loss": 0.3546, + "step": 46100 + }, + { + "epoch": 1.85, + "learning_rate": 7.872727272727274e-07, + "loss": 0.3582, + "step": 46125 + }, + { + "epoch": 1.85, + "learning_rate": 7.822222222222223e-07, + "loss": 0.357, + "step": 46150 + }, + { + "epoch": 1.85, + "learning_rate": 7.771717171717172e-07, + "loss": 0.3703, + "step": 46175 + }, + { + "epoch": 1.85, + "learning_rate": 7.721212121212123e-07, + "loss": 0.3619, + "step": 46200 + }, + { + "epoch": 1.85, + "learning_rate": 7.670707070707072e-07, + "loss": 0.3441, + "step": 46225 + }, + { + "epoch": 1.85, + "learning_rate": 7.62020202020202e-07, + "loss": 0.3565, + "step": 46250 + }, + { + "epoch": 1.86, + "learning_rate": 7.56969696969697e-07, + "loss": 0.3517, + "step": 46275 + }, + { + "epoch": 1.86, + "learning_rate": 7.51919191919192e-07, + "loss": 0.3505, + "step": 46300 + }, + { + "epoch": 1.86, + "learning_rate": 7.468686868686869e-07, + "loss": 0.3691, + "step": 46325 + }, + { + "epoch": 1.86, + "learning_rate": 7.418181818181819e-07, + "loss": 0.3626, + "step": 46350 + }, + { + "epoch": 1.86, + "learning_rate": 7.367676767676768e-07, + "loss": 0.3582, + "step": 46375 + }, + { + "epoch": 1.86, + "learning_rate": 7.317171717171717e-07, + "loss": 0.3677, + "step": 46400 + }, + { + "epoch": 1.86, + "learning_rate": 7.266666666666668e-07, + "loss": 0.3636, + "step": 46425 + }, + { + "epoch": 1.86, + "learning_rate": 7.216161616161617e-07, + "loss": 0.3677, + "step": 46450 + }, + { + "epoch": 1.86, + "learning_rate": 7.165656565656566e-07, + "loss": 0.3497, + "step": 46475 + }, + { + "epoch": 1.86, + "learning_rate": 7.115151515151516e-07, + "loss": 0.3627, + "step": 46500 + }, + { + "epoch": 1.87, + "learning_rate": 7.064646464646466e-07, + "loss": 0.3588, + "step": 46525 + }, + { + "epoch": 1.87, + "learning_rate": 7.014141414141415e-07, + "loss": 0.3537, + "step": 46550 + }, + { + "epoch": 1.87, + "learning_rate": 6.963636363636364e-07, + "loss": 0.357, + "step": 46575 + }, + { + "epoch": 1.87, + "learning_rate": 6.913131313131313e-07, + "loss": 0.3552, + "step": 46600 + }, + { + "epoch": 1.87, + "learning_rate": 6.862626262626264e-07, + "loss": 0.3761, + "step": 46625 + }, + { + "epoch": 1.87, + "learning_rate": 6.812121212121213e-07, + "loss": 0.3831, + "step": 46650 + }, + { + "epoch": 1.87, + "learning_rate": 6.761616161616162e-07, + "loss": 0.3443, + "step": 46675 + }, + { + "epoch": 1.87, + "learning_rate": 6.711111111111111e-07, + "loss": 0.3653, + "step": 46700 + }, + { + "epoch": 1.87, + "learning_rate": 6.66060606060606e-07, + "loss": 0.3495, + "step": 46725 + }, + { + "epoch": 1.87, + "learning_rate": 6.610101010101011e-07, + "loss": 0.3669, + "step": 46750 + }, + { + "epoch": 1.88, + "learning_rate": 6.55959595959596e-07, + "loss": 0.3691, + "step": 46775 + }, + { + "epoch": 1.88, + "learning_rate": 6.50909090909091e-07, + "loss": 0.3505, + "step": 46800 + }, + { + "epoch": 1.88, + "learning_rate": 6.458585858585859e-07, + "loss": 0.3646, + "step": 46825 + }, + { + "epoch": 1.88, + "learning_rate": 6.408080808080809e-07, + "loss": 0.3684, + "step": 46850 + }, + { + "epoch": 1.88, + "learning_rate": 6.357575757575759e-07, + "loss": 0.3579, + "step": 46875 + }, + { + "epoch": 1.88, + "learning_rate": 6.307070707070708e-07, + "loss": 0.3586, + "step": 46900 + }, + { + "epoch": 1.88, + "learning_rate": 6.256565656565656e-07, + "loss": 0.3602, + "step": 46925 + }, + { + "epoch": 1.88, + "learning_rate": 6.206060606060606e-07, + "loss": 0.3524, + "step": 46950 + }, + { + "epoch": 1.88, + "learning_rate": 6.155555555555556e-07, + "loss": 0.3422, + "step": 46975 + }, + { + "epoch": 1.88, + "learning_rate": 6.105050505050505e-07, + "loss": 0.3642, + "step": 47000 + }, + { + "epoch": 1.89, + "learning_rate": 6.054545454545455e-07, + "loss": 0.3673, + "step": 47025 + }, + { + "epoch": 1.89, + "learning_rate": 6.004040404040405e-07, + "loss": 0.3477, + "step": 47050 + }, + { + "epoch": 1.89, + "learning_rate": 5.953535353535354e-07, + "loss": 0.3442, + "step": 47075 + }, + { + "epoch": 1.89, + "learning_rate": 5.903030303030303e-07, + "loss": 0.3736, + "step": 47100 + }, + { + "epoch": 1.89, + "learning_rate": 5.852525252525253e-07, + "loss": 0.3658, + "step": 47125 + }, + { + "epoch": 1.89, + "learning_rate": 5.802020202020202e-07, + "loss": 0.3574, + "step": 47150 + }, + { + "epoch": 1.89, + "learning_rate": 5.751515151515151e-07, + "loss": 0.357, + "step": 47175 + }, + { + "epoch": 1.89, + "learning_rate": 5.701010101010102e-07, + "loss": 0.3691, + "step": 47200 + }, + { + "epoch": 1.89, + "learning_rate": 5.650505050505051e-07, + "loss": 0.3572, + "step": 47225 + }, + { + "epoch": 1.89, + "learning_rate": 5.6e-07, + "loss": 0.3423, + "step": 47250 + }, + { + "epoch": 1.9, + "learning_rate": 5.54949494949495e-07, + "loss": 0.3505, + "step": 47275 + }, + { + "epoch": 1.9, + "learning_rate": 5.4989898989899e-07, + "loss": 0.3661, + "step": 47300 + }, + { + "epoch": 1.9, + "learning_rate": 5.448484848484848e-07, + "loss": 0.3482, + "step": 47325 + }, + { + "epoch": 1.9, + "learning_rate": 5.397979797979799e-07, + "loss": 0.366, + "step": 47350 + }, + { + "epoch": 1.9, + "learning_rate": 5.347474747474748e-07, + "loss": 0.3585, + "step": 47375 + }, + { + "epoch": 1.9, + "learning_rate": 5.296969696969697e-07, + "loss": 0.3755, + "step": 47400 + }, + { + "epoch": 1.9, + "learning_rate": 5.246464646464647e-07, + "loss": 0.356, + "step": 47425 + }, + { + "epoch": 1.9, + "learning_rate": 5.195959595959597e-07, + "loss": 0.3426, + "step": 47450 + }, + { + "epoch": 1.9, + "learning_rate": 5.145454545454546e-07, + "loss": 0.3696, + "step": 47475 + }, + { + "epoch": 1.9, + "learning_rate": 5.094949494949496e-07, + "loss": 0.3628, + "step": 47500 + }, + { + "epoch": 1.9, + "eval_loss": 0.38016417622566223, + "eval_runtime": 305.1241, + "eval_samples_per_second": 16.403, + "eval_steps_per_second": 2.052, + "eval_wer": 28.12596407128788, + "step": 47500 + }, + { + "epoch": 1.91, + "learning_rate": 5.044444444444445e-07, + "loss": 0.349, + "step": 47525 + }, + { + "epoch": 1.91, + "learning_rate": 4.993939393939394e-07, + "loss": 0.3586, + "step": 47550 + }, + { + "epoch": 1.91, + "learning_rate": 4.943434343434344e-07, + "loss": 0.3719, + "step": 47575 + }, + { + "epoch": 1.91, + "learning_rate": 4.892929292929293e-07, + "loss": 0.3709, + "step": 47600 + }, + { + "epoch": 1.91, + "learning_rate": 4.842424242424243e-07, + "loss": 0.3573, + "step": 47625 + }, + { + "epoch": 1.91, + "learning_rate": 4.791919191919193e-07, + "loss": 0.3461, + "step": 47650 + }, + { + "epoch": 1.91, + "learning_rate": 4.741414141414142e-07, + "loss": 0.3678, + "step": 47675 + }, + { + "epoch": 1.91, + "learning_rate": 4.690909090909091e-07, + "loss": 0.3563, + "step": 47700 + }, + { + "epoch": 1.91, + "learning_rate": 4.640404040404041e-07, + "loss": 0.3588, + "step": 47725 + }, + { + "epoch": 1.91, + "learning_rate": 4.5898989898989904e-07, + "loss": 0.3578, + "step": 47750 + }, + { + "epoch": 1.92, + "learning_rate": 4.5414141414141417e-07, + "loss": 0.3741, + "step": 47775 + }, + { + "epoch": 1.92, + "learning_rate": 4.4909090909090916e-07, + "loss": 0.3793, + "step": 47800 + }, + { + "epoch": 1.92, + "learning_rate": 4.440404040404041e-07, + "loss": 0.3776, + "step": 47825 + }, + { + "epoch": 1.92, + "learning_rate": 4.38989898989899e-07, + "loss": 0.3486, + "step": 47850 + }, + { + "epoch": 1.92, + "learning_rate": 4.33939393939394e-07, + "loss": 0.362, + "step": 47875 + }, + { + "epoch": 1.92, + "learning_rate": 4.288888888888889e-07, + "loss": 0.3597, + "step": 47900 + }, + { + "epoch": 1.92, + "learning_rate": 4.2383838383838387e-07, + "loss": 0.3692, + "step": 47925 + }, + { + "epoch": 1.92, + "learning_rate": 4.187878787878788e-07, + "loss": 0.3558, + "step": 47950 + }, + { + "epoch": 1.92, + "learning_rate": 4.137373737373738e-07, + "loss": 0.3565, + "step": 47975 + }, + { + "epoch": 1.92, + "learning_rate": 4.086868686868687e-07, + "loss": 0.3516, + "step": 48000 + }, + { + "epoch": 1.93, + "learning_rate": 4.036363636363637e-07, + "loss": 0.3644, + "step": 48025 + }, + { + "epoch": 1.93, + "learning_rate": 3.985858585858586e-07, + "loss": 0.3622, + "step": 48050 + }, + { + "epoch": 1.93, + "learning_rate": 3.935353535353536e-07, + "loss": 0.3378, + "step": 48075 + }, + { + "epoch": 1.93, + "learning_rate": 3.884848484848485e-07, + "loss": 0.3791, + "step": 48100 + }, + { + "epoch": 1.93, + "learning_rate": 3.834343434343435e-07, + "loss": 0.3635, + "step": 48125 + }, + { + "epoch": 1.93, + "learning_rate": 3.783838383838384e-07, + "loss": 0.3637, + "step": 48150 + }, + { + "epoch": 1.93, + "learning_rate": 3.733333333333334e-07, + "loss": 0.3659, + "step": 48175 + }, + { + "epoch": 1.93, + "learning_rate": 3.682828282828283e-07, + "loss": 0.354, + "step": 48200 + }, + { + "epoch": 1.93, + "learning_rate": 3.632323232323232e-07, + "loss": 0.3786, + "step": 48225 + }, + { + "epoch": 1.93, + "learning_rate": 3.581818181818182e-07, + "loss": 0.3566, + "step": 48250 + }, + { + "epoch": 1.94, + "learning_rate": 3.531313131313131e-07, + "loss": 0.3541, + "step": 48275 + }, + { + "epoch": 1.94, + "learning_rate": 3.480808080808081e-07, + "loss": 0.3627, + "step": 48300 + }, + { + "epoch": 1.94, + "learning_rate": 3.4303030303030304e-07, + "loss": 0.3565, + "step": 48325 + }, + { + "epoch": 1.94, + "learning_rate": 3.37979797979798e-07, + "loss": 0.3752, + "step": 48350 + }, + { + "epoch": 1.94, + "learning_rate": 3.3292929292929295e-07, + "loss": 0.3762, + "step": 48375 + }, + { + "epoch": 1.94, + "learning_rate": 3.2787878787878794e-07, + "loss": 0.3475, + "step": 48400 + }, + { + "epoch": 1.94, + "learning_rate": 3.228282828282828e-07, + "loss": 0.3726, + "step": 48425 + }, + { + "epoch": 1.94, + "learning_rate": 3.177777777777778e-07, + "loss": 0.3556, + "step": 48450 + }, + { + "epoch": 1.94, + "learning_rate": 3.1272727272727273e-07, + "loss": 0.4022, + "step": 48475 + }, + { + "epoch": 1.94, + "learning_rate": 3.076767676767677e-07, + "loss": 0.3513, + "step": 48500 + }, + { + "epoch": 1.95, + "learning_rate": 3.0262626262626265e-07, + "loss": 0.355, + "step": 48525 + }, + { + "epoch": 1.95, + "learning_rate": 2.975757575757576e-07, + "loss": 0.3733, + "step": 48550 + }, + { + "epoch": 1.95, + "learning_rate": 2.9252525252525256e-07, + "loss": 0.3635, + "step": 48575 + }, + { + "epoch": 1.95, + "learning_rate": 2.874747474747475e-07, + "loss": 0.3639, + "step": 48600 + }, + { + "epoch": 1.95, + "learning_rate": 2.8242424242424243e-07, + "loss": 0.3438, + "step": 48625 + }, + { + "epoch": 1.95, + "learning_rate": 2.773737373737374e-07, + "loss": 0.3616, + "step": 48650 + }, + { + "epoch": 1.95, + "learning_rate": 2.7232323232323234e-07, + "loss": 0.3639, + "step": 48675 + }, + { + "epoch": 1.95, + "learning_rate": 2.6727272727272733e-07, + "loss": 0.3542, + "step": 48700 + }, + { + "epoch": 1.95, + "learning_rate": 2.6222222222222226e-07, + "loss": 0.3455, + "step": 48725 + }, + { + "epoch": 1.95, + "learning_rate": 2.571717171717172e-07, + "loss": 0.3833, + "step": 48750 + }, + { + "epoch": 1.96, + "learning_rate": 2.521212121212122e-07, + "loss": 0.359, + "step": 48775 + }, + { + "epoch": 1.96, + "learning_rate": 2.470707070707071e-07, + "loss": 0.3734, + "step": 48800 + }, + { + "epoch": 1.96, + "learning_rate": 2.4202020202020204e-07, + "loss": 0.3745, + "step": 48825 + }, + { + "epoch": 1.96, + "learning_rate": 2.3696969696969697e-07, + "loss": 0.3558, + "step": 48850 + }, + { + "epoch": 1.96, + "learning_rate": 2.3191919191919193e-07, + "loss": 0.3513, + "step": 48875 + }, + { + "epoch": 1.96, + "learning_rate": 2.2686868686868689e-07, + "loss": 0.3703, + "step": 48900 + }, + { + "epoch": 1.96, + "learning_rate": 2.2181818181818182e-07, + "loss": 0.3623, + "step": 48925 + }, + { + "epoch": 1.96, + "learning_rate": 2.1676767676767677e-07, + "loss": 0.3853, + "step": 48950 + }, + { + "epoch": 1.96, + "learning_rate": 2.1171717171717173e-07, + "loss": 0.3714, + "step": 48975 + }, + { + "epoch": 1.96, + "learning_rate": 2.066666666666667e-07, + "loss": 0.3584, + "step": 49000 + }, + { + "epoch": 1.97, + "learning_rate": 2.0161616161616162e-07, + "loss": 0.3547, + "step": 49025 + }, + { + "epoch": 1.97, + "learning_rate": 1.9656565656565658e-07, + "loss": 0.3564, + "step": 49050 + }, + { + "epoch": 1.97, + "learning_rate": 1.9151515151515154e-07, + "loss": 0.3501, + "step": 49075 + }, + { + "epoch": 1.97, + "learning_rate": 1.864646464646465e-07, + "loss": 0.3717, + "step": 49100 + }, + { + "epoch": 1.97, + "learning_rate": 1.8141414141414143e-07, + "loss": 0.3698, + "step": 49125 + }, + { + "epoch": 1.97, + "learning_rate": 1.7636363636363639e-07, + "loss": 0.3603, + "step": 49150 + }, + { + "epoch": 1.97, + "learning_rate": 1.7131313131313134e-07, + "loss": 0.37, + "step": 49175 + }, + { + "epoch": 1.97, + "learning_rate": 1.662626262626263e-07, + "loss": 0.3386, + "step": 49200 + }, + { + "epoch": 1.97, + "learning_rate": 1.612121212121212e-07, + "loss": 0.3509, + "step": 49225 + }, + { + "epoch": 1.97, + "learning_rate": 1.5616161616161617e-07, + "loss": 0.3479, + "step": 49250 + }, + { + "epoch": 1.98, + "learning_rate": 1.5111111111111112e-07, + "loss": 0.3466, + "step": 49275 + }, + { + "epoch": 1.98, + "learning_rate": 1.4606060606060608e-07, + "loss": 0.3577, + "step": 49300 + }, + { + "epoch": 1.98, + "learning_rate": 1.41010101010101e-07, + "loss": 0.366, + "step": 49325 + }, + { + "epoch": 1.98, + "learning_rate": 1.3595959595959597e-07, + "loss": 0.387, + "step": 49350 + }, + { + "epoch": 1.98, + "learning_rate": 1.3090909090909093e-07, + "loss": 0.3762, + "step": 49375 + }, + { + "epoch": 1.98, + "learning_rate": 1.2585858585858586e-07, + "loss": 0.3528, + "step": 49400 + }, + { + "epoch": 1.98, + "learning_rate": 1.2080808080808082e-07, + "loss": 0.372, + "step": 49425 + }, + { + "epoch": 1.98, + "learning_rate": 1.1575757575757578e-07, + "loss": 0.3442, + "step": 49450 + }, + { + "epoch": 1.98, + "learning_rate": 1.1070707070707072e-07, + "loss": 0.3603, + "step": 49475 + }, + { + "epoch": 1.98, + "learning_rate": 1.0565656565656568e-07, + "loss": 0.3604, + "step": 49500 + }, + { + "epoch": 1.99, + "learning_rate": 1.0060606060606061e-07, + "loss": 0.3561, + "step": 49525 + }, + { + "epoch": 1.99, + "learning_rate": 9.555555555555556e-08, + "loss": 0.3634, + "step": 49550 + }, + { + "epoch": 1.99, + "learning_rate": 9.050505050505051e-08, + "loss": 0.361, + "step": 49575 + }, + { + "epoch": 1.99, + "learning_rate": 8.545454545454546e-08, + "loss": 0.3529, + "step": 49600 + }, + { + "epoch": 1.99, + "learning_rate": 8.040404040404042e-08, + "loss": 0.358, + "step": 49625 + }, + { + "epoch": 1.99, + "learning_rate": 7.535353535353536e-08, + "loss": 0.352, + "step": 49650 + }, + { + "epoch": 1.99, + "learning_rate": 7.03030303030303e-08, + "loss": 0.3733, + "step": 49675 + }, + { + "epoch": 1.99, + "learning_rate": 6.525252525252525e-08, + "loss": 0.3568, + "step": 49700 + }, + { + "epoch": 1.99, + "learning_rate": 6.020202020202021e-08, + "loss": 0.3649, + "step": 49725 + }, + { + "epoch": 1.99, + "learning_rate": 5.515151515151516e-08, + "loss": 0.3645, + "step": 49750 + }, + { + "epoch": 2.0, + "learning_rate": 5.0101010101010105e-08, + "loss": 0.3589, + "step": 49775 + }, + { + "epoch": 2.0, + "learning_rate": 4.5252525252525257e-08, + "loss": 0.3687, + "step": 49800 + }, + { + "epoch": 2.0, + "learning_rate": 4.020202020202021e-08, + "loss": 0.3764, + "step": 49825 + }, + { + "epoch": 2.0, + "learning_rate": 3.515151515151515e-08, + "loss": 0.3622, + "step": 49850 + }, + { + "epoch": 2.0, + "learning_rate": 3.0101010101010104e-08, + "loss": 0.349, + "step": 49875 + }, + { + "epoch": 2.0, + "learning_rate": 2.5050505050505052e-08, + "loss": 0.3612, + "step": 49900 + }, + { + "epoch": 2.0, + "learning_rate": 2e-08, + "loss": 0.358, + "step": 49925 + }, + { + "epoch": 2.0, + "learning_rate": 1.4949494949494952e-08, + "loss": 0.3431, + "step": 49950 + }, + { + "epoch": 2.0, + "learning_rate": 9.8989898989899e-09, + "loss": 0.353, + "step": 49975 + }, + { + "epoch": 2.0, + "learning_rate": 4.848484848484849e-09, + "loss": 0.3392, + "step": 50000 + }, + { + "epoch": 2.0, + "eval_loss": 0.37952831387519836, + "eval_runtime": 312.4104, + "eval_samples_per_second": 16.021, + "eval_steps_per_second": 2.004, + "eval_wer": 28.726358005647974, + "step": 50000 + }, + { + "epoch": 2.0, + "step": 50000, + "total_flos": 9.7854051981312e+19, + "train_loss": 0.47914609115600587, + "train_runtime": 101277.4875, + "train_samples_per_second": 31.596, + "train_steps_per_second": 0.494 + } + ], + "logging_steps": 25, + "max_steps": 50000, + "num_input_tokens_seen": 0, + "num_train_epochs": 3, + "save_steps": 2500, + "total_flos": 9.7854051981312e+19, + "train_batch_size": 64, + "trial_name": null, + "trial_params": null +}