{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "eval_steps": 500, "global_step": 9981, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 6.666666666666668e-08, "loss": 4.1142, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.3333333333333336e-07, "loss": 4.2466, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.0000000000000002e-07, "loss": 4.3258, "step": 3 }, { "epoch": 0.0, "learning_rate": 2.666666666666667e-07, "loss": 4.0749, "step": 4 }, { "epoch": 0.0, "learning_rate": 3.3333333333333335e-07, "loss": 4.2308, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.0000000000000003e-07, "loss": 4.2258, "step": 6 }, { "epoch": 0.0, "learning_rate": 4.666666666666667e-07, "loss": 4.2295, "step": 7 }, { "epoch": 0.0, "learning_rate": 5.333333333333335e-07, "loss": 4.2409, "step": 8 }, { "epoch": 0.0, "learning_rate": 6.000000000000001e-07, "loss": 4.1947, "step": 9 }, { "epoch": 0.0, "learning_rate": 6.666666666666667e-07, "loss": 4.3093, "step": 10 }, { "epoch": 0.0, "learning_rate": 7.333333333333334e-07, "loss": 4.3633, "step": 11 }, { "epoch": 0.0, "learning_rate": 8.000000000000001e-07, "loss": 4.0784, "step": 12 }, { "epoch": 0.0, "learning_rate": 8.666666666666668e-07, "loss": 4.2004, "step": 13 }, { "epoch": 0.0, "learning_rate": 9.333333333333334e-07, "loss": 4.1177, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.0000000000000002e-06, "loss": 4.0068, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.066666666666667e-06, "loss": 3.9262, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.1333333333333334e-06, "loss": 3.869, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.2000000000000002e-06, "loss": 3.8189, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.2666666666666669e-06, "loss": 3.633, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.3333333333333334e-06, "loss": 3.8466, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.4000000000000001e-06, "loss": 3.8185, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.4666666666666669e-06, "loss": 3.6195, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.5333333333333334e-06, "loss": 3.4017, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.6000000000000001e-06, "loss": 3.359, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.6666666666666667e-06, "loss": 3.2968, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.7333333333333336e-06, "loss": 3.2485, "step": 26 }, { "epoch": 0.0, "learning_rate": 1.8000000000000001e-06, "loss": 3.1204, "step": 27 }, { "epoch": 0.0, "learning_rate": 1.8666666666666669e-06, "loss": 3.1333, "step": 28 }, { "epoch": 0.0, "learning_rate": 1.9333333333333336e-06, "loss": 3.0454, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.0000000000000003e-06, "loss": 3.0848, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.0666666666666666e-06, "loss": 2.9496, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.133333333333334e-06, "loss": 2.8949, "step": 32 }, { "epoch": 0.0, "learning_rate": 2.2e-06, "loss": 3.0362, "step": 33 }, { "epoch": 0.0, "learning_rate": 2.266666666666667e-06, "loss": 2.9358, "step": 34 }, { "epoch": 0.0, "learning_rate": 2.3333333333333336e-06, "loss": 2.8306, "step": 35 }, { "epoch": 0.0, "learning_rate": 2.4000000000000003e-06, "loss": 2.9399, "step": 36 }, { "epoch": 0.0, "learning_rate": 2.466666666666667e-06, "loss": 2.8777, "step": 37 }, { "epoch": 0.0, "learning_rate": 2.5333333333333338e-06, "loss": 2.8169, "step": 38 }, { "epoch": 0.0, "learning_rate": 2.6e-06, "loss": 2.9271, "step": 39 }, { "epoch": 0.0, "learning_rate": 2.666666666666667e-06, "loss": 2.7725, "step": 40 }, { "epoch": 0.0, "learning_rate": 2.7333333333333336e-06, "loss": 2.7331, "step": 41 }, { "epoch": 0.0, "learning_rate": 2.8000000000000003e-06, "loss": 2.7108, "step": 42 }, { "epoch": 0.0, "learning_rate": 2.866666666666667e-06, "loss": 2.7805, "step": 43 }, { "epoch": 0.0, "learning_rate": 2.9333333333333338e-06, "loss": 2.8082, "step": 44 }, { "epoch": 0.0, "learning_rate": 3e-06, "loss": 2.7276, "step": 45 }, { "epoch": 0.0, "learning_rate": 3.066666666666667e-06, "loss": 2.7896, "step": 46 }, { "epoch": 0.0, "learning_rate": 3.133333333333334e-06, "loss": 2.6992, "step": 47 }, { "epoch": 0.0, "learning_rate": 3.2000000000000003e-06, "loss": 2.7146, "step": 48 }, { "epoch": 0.0, "learning_rate": 3.266666666666667e-06, "loss": 2.7177, "step": 49 }, { "epoch": 0.01, "learning_rate": 3.3333333333333333e-06, "loss": 2.6813, "step": 50 }, { "epoch": 0.01, "learning_rate": 3.4000000000000005e-06, "loss": 2.7586, "step": 51 }, { "epoch": 0.01, "learning_rate": 3.4666666666666672e-06, "loss": 2.6945, "step": 52 }, { "epoch": 0.01, "learning_rate": 3.5333333333333335e-06, "loss": 2.7163, "step": 53 }, { "epoch": 0.01, "learning_rate": 3.6000000000000003e-06, "loss": 2.6308, "step": 54 }, { "epoch": 0.01, "learning_rate": 3.6666666666666666e-06, "loss": 2.7072, "step": 55 }, { "epoch": 0.01, "learning_rate": 3.7333333333333337e-06, "loss": 2.6572, "step": 56 }, { "epoch": 0.01, "learning_rate": 3.8000000000000005e-06, "loss": 2.7382, "step": 57 }, { "epoch": 0.01, "learning_rate": 3.866666666666667e-06, "loss": 2.694, "step": 58 }, { "epoch": 0.01, "learning_rate": 3.9333333333333335e-06, "loss": 2.631, "step": 59 }, { "epoch": 0.01, "learning_rate": 4.000000000000001e-06, "loss": 2.6968, "step": 60 }, { "epoch": 0.01, "learning_rate": 4.066666666666667e-06, "loss": 2.6535, "step": 61 }, { "epoch": 0.01, "learning_rate": 4.133333333333333e-06, "loss": 2.7222, "step": 62 }, { "epoch": 0.01, "learning_rate": 4.2000000000000004e-06, "loss": 2.6363, "step": 63 }, { "epoch": 0.01, "learning_rate": 4.266666666666668e-06, "loss": 2.656, "step": 64 }, { "epoch": 0.01, "learning_rate": 4.333333333333334e-06, "loss": 2.5842, "step": 65 }, { "epoch": 0.01, "learning_rate": 4.4e-06, "loss": 2.7143, "step": 66 }, { "epoch": 0.01, "learning_rate": 4.4666666666666665e-06, "loss": 2.6362, "step": 67 }, { "epoch": 0.01, "learning_rate": 4.533333333333334e-06, "loss": 2.6539, "step": 68 }, { "epoch": 0.01, "learning_rate": 4.600000000000001e-06, "loss": 2.6775, "step": 69 }, { "epoch": 0.01, "learning_rate": 4.666666666666667e-06, "loss": 2.6523, "step": 70 }, { "epoch": 0.01, "learning_rate": 4.7333333333333335e-06, "loss": 2.5923, "step": 71 }, { "epoch": 0.01, "learning_rate": 4.800000000000001e-06, "loss": 2.6019, "step": 72 }, { "epoch": 0.01, "learning_rate": 4.866666666666667e-06, "loss": 2.6448, "step": 73 }, { "epoch": 0.01, "learning_rate": 4.933333333333334e-06, "loss": 2.6055, "step": 74 }, { "epoch": 0.01, "learning_rate": 5e-06, "loss": 2.6413, "step": 75 }, { "epoch": 0.01, "learning_rate": 5.0666666666666676e-06, "loss": 2.5562, "step": 76 }, { "epoch": 0.01, "learning_rate": 5.133333333333334e-06, "loss": 2.4563, "step": 77 }, { "epoch": 0.01, "learning_rate": 5.2e-06, "loss": 2.6777, "step": 78 }, { "epoch": 0.01, "learning_rate": 5.2666666666666665e-06, "loss": 2.5709, "step": 79 }, { "epoch": 0.01, "learning_rate": 5.333333333333334e-06, "loss": 2.5779, "step": 80 }, { "epoch": 0.01, "learning_rate": 5.400000000000001e-06, "loss": 2.5311, "step": 81 }, { "epoch": 0.01, "learning_rate": 5.466666666666667e-06, "loss": 2.6191, "step": 82 }, { "epoch": 0.01, "learning_rate": 5.533333333333334e-06, "loss": 2.6819, "step": 83 }, { "epoch": 0.01, "learning_rate": 5.600000000000001e-06, "loss": 2.7007, "step": 84 }, { "epoch": 0.01, "learning_rate": 5.666666666666667e-06, "loss": 2.5976, "step": 85 }, { "epoch": 0.01, "learning_rate": 5.733333333333334e-06, "loss": 2.5264, "step": 86 }, { "epoch": 0.01, "learning_rate": 5.8e-06, "loss": 2.6639, "step": 87 }, { "epoch": 0.01, "learning_rate": 5.8666666666666675e-06, "loss": 2.5967, "step": 88 }, { "epoch": 0.01, "learning_rate": 5.933333333333335e-06, "loss": 2.5573, "step": 89 }, { "epoch": 0.01, "learning_rate": 6e-06, "loss": 2.5966, "step": 90 }, { "epoch": 0.01, "learning_rate": 6.066666666666667e-06, "loss": 2.5812, "step": 91 }, { "epoch": 0.01, "learning_rate": 6.133333333333334e-06, "loss": 2.5866, "step": 92 }, { "epoch": 0.01, "learning_rate": 6.200000000000001e-06, "loss": 2.5836, "step": 93 }, { "epoch": 0.01, "learning_rate": 6.266666666666668e-06, "loss": 2.5052, "step": 94 }, { "epoch": 0.01, "learning_rate": 6.333333333333333e-06, "loss": 2.571, "step": 95 }, { "epoch": 0.01, "learning_rate": 6.4000000000000006e-06, "loss": 2.5081, "step": 96 }, { "epoch": 0.01, "learning_rate": 6.466666666666667e-06, "loss": 2.7358, "step": 97 }, { "epoch": 0.01, "learning_rate": 6.533333333333334e-06, "loss": 2.5592, "step": 98 }, { "epoch": 0.01, "learning_rate": 6.600000000000001e-06, "loss": 2.6436, "step": 99 }, { "epoch": 0.01, "learning_rate": 6.666666666666667e-06, "loss": 2.6079, "step": 100 }, { "epoch": 0.01, "learning_rate": 6.733333333333334e-06, "loss": 2.6632, "step": 101 }, { "epoch": 0.01, "learning_rate": 6.800000000000001e-06, "loss": 2.5882, "step": 102 }, { "epoch": 0.01, "learning_rate": 6.866666666666667e-06, "loss": 2.5879, "step": 103 }, { "epoch": 0.01, "learning_rate": 6.9333333333333344e-06, "loss": 2.5556, "step": 104 }, { "epoch": 0.01, "learning_rate": 7e-06, "loss": 2.6596, "step": 105 }, { "epoch": 0.01, "learning_rate": 7.066666666666667e-06, "loss": 2.6304, "step": 106 }, { "epoch": 0.01, "learning_rate": 7.133333333333334e-06, "loss": 2.593, "step": 107 }, { "epoch": 0.01, "learning_rate": 7.2000000000000005e-06, "loss": 2.631, "step": 108 }, { "epoch": 0.01, "learning_rate": 7.266666666666668e-06, "loss": 2.584, "step": 109 }, { "epoch": 0.01, "learning_rate": 7.333333333333333e-06, "loss": 2.5902, "step": 110 }, { "epoch": 0.01, "learning_rate": 7.4e-06, "loss": 2.5394, "step": 111 }, { "epoch": 0.01, "learning_rate": 7.4666666666666675e-06, "loss": 2.6151, "step": 112 }, { "epoch": 0.01, "learning_rate": 7.533333333333334e-06, "loss": 2.6419, "step": 113 }, { "epoch": 0.01, "learning_rate": 7.600000000000001e-06, "loss": 2.5713, "step": 114 }, { "epoch": 0.01, "learning_rate": 7.666666666666667e-06, "loss": 2.5264, "step": 115 }, { "epoch": 0.01, "learning_rate": 7.733333333333334e-06, "loss": 2.5903, "step": 116 }, { "epoch": 0.01, "learning_rate": 7.800000000000002e-06, "loss": 2.6182, "step": 117 }, { "epoch": 0.01, "learning_rate": 7.866666666666667e-06, "loss": 2.5885, "step": 118 }, { "epoch": 0.01, "learning_rate": 7.933333333333334e-06, "loss": 2.449, "step": 119 }, { "epoch": 0.01, "learning_rate": 8.000000000000001e-06, "loss": 2.5506, "step": 120 }, { "epoch": 0.01, "learning_rate": 8.066666666666667e-06, "loss": 2.6025, "step": 121 }, { "epoch": 0.01, "learning_rate": 8.133333333333334e-06, "loss": 2.5889, "step": 122 }, { "epoch": 0.01, "learning_rate": 8.2e-06, "loss": 2.6266, "step": 123 }, { "epoch": 0.01, "learning_rate": 8.266666666666667e-06, "loss": 2.5498, "step": 124 }, { "epoch": 0.01, "learning_rate": 8.333333333333334e-06, "loss": 2.6943, "step": 125 }, { "epoch": 0.01, "learning_rate": 8.400000000000001e-06, "loss": 2.6428, "step": 126 }, { "epoch": 0.01, "learning_rate": 8.466666666666668e-06, "loss": 2.4686, "step": 127 }, { "epoch": 0.01, "learning_rate": 8.533333333333335e-06, "loss": 2.6462, "step": 128 }, { "epoch": 0.01, "learning_rate": 8.6e-06, "loss": 2.4836, "step": 129 }, { "epoch": 0.01, "learning_rate": 8.666666666666668e-06, "loss": 2.527, "step": 130 }, { "epoch": 0.01, "learning_rate": 8.733333333333333e-06, "loss": 2.4329, "step": 131 }, { "epoch": 0.01, "learning_rate": 8.8e-06, "loss": 2.6084, "step": 132 }, { "epoch": 0.01, "learning_rate": 8.866666666666668e-06, "loss": 2.5556, "step": 133 }, { "epoch": 0.01, "learning_rate": 8.933333333333333e-06, "loss": 2.4995, "step": 134 }, { "epoch": 0.01, "learning_rate": 9e-06, "loss": 2.7182, "step": 135 }, { "epoch": 0.01, "learning_rate": 9.066666666666667e-06, "loss": 2.5174, "step": 136 }, { "epoch": 0.01, "learning_rate": 9.133333333333335e-06, "loss": 2.603, "step": 137 }, { "epoch": 0.01, "learning_rate": 9.200000000000002e-06, "loss": 2.6448, "step": 138 }, { "epoch": 0.01, "learning_rate": 9.266666666666667e-06, "loss": 2.5595, "step": 139 }, { "epoch": 0.01, "learning_rate": 9.333333333333334e-06, "loss": 2.5287, "step": 140 }, { "epoch": 0.01, "learning_rate": 9.4e-06, "loss": 2.5496, "step": 141 }, { "epoch": 0.01, "learning_rate": 9.466666666666667e-06, "loss": 2.4992, "step": 142 }, { "epoch": 0.01, "learning_rate": 9.533333333333334e-06, "loss": 2.4817, "step": 143 }, { "epoch": 0.01, "learning_rate": 9.600000000000001e-06, "loss": 2.478, "step": 144 }, { "epoch": 0.01, "learning_rate": 9.666666666666667e-06, "loss": 2.4938, "step": 145 }, { "epoch": 0.01, "learning_rate": 9.733333333333334e-06, "loss": 2.5876, "step": 146 }, { "epoch": 0.01, "learning_rate": 9.800000000000001e-06, "loss": 2.5809, "step": 147 }, { "epoch": 0.01, "learning_rate": 9.866666666666668e-06, "loss": 2.5978, "step": 148 }, { "epoch": 0.01, "learning_rate": 9.933333333333334e-06, "loss": 2.4569, "step": 149 }, { "epoch": 0.02, "learning_rate": 1e-05, "loss": 2.6287, "step": 150 }, { "epoch": 0.02, "learning_rate": 1.0066666666666666e-05, "loss": 2.4724, "step": 151 }, { "epoch": 0.02, "learning_rate": 1.0133333333333335e-05, "loss": 2.6302, "step": 152 }, { "epoch": 0.02, "learning_rate": 1.02e-05, "loss": 2.606, "step": 153 }, { "epoch": 0.02, "learning_rate": 1.0266666666666668e-05, "loss": 2.4868, "step": 154 }, { "epoch": 0.02, "learning_rate": 1.0333333333333335e-05, "loss": 2.529, "step": 155 }, { "epoch": 0.02, "learning_rate": 1.04e-05, "loss": 2.5403, "step": 156 }, { "epoch": 0.02, "learning_rate": 1.0466666666666668e-05, "loss": 2.5015, "step": 157 }, { "epoch": 0.02, "learning_rate": 1.0533333333333333e-05, "loss": 2.5648, "step": 158 }, { "epoch": 0.02, "learning_rate": 1.0600000000000002e-05, "loss": 2.5538, "step": 159 }, { "epoch": 0.02, "learning_rate": 1.0666666666666667e-05, "loss": 2.4636, "step": 160 }, { "epoch": 0.02, "learning_rate": 1.0733333333333333e-05, "loss": 2.4366, "step": 161 }, { "epoch": 0.02, "learning_rate": 1.0800000000000002e-05, "loss": 2.4564, "step": 162 }, { "epoch": 0.02, "learning_rate": 1.0866666666666667e-05, "loss": 2.5978, "step": 163 }, { "epoch": 0.02, "learning_rate": 1.0933333333333334e-05, "loss": 2.5548, "step": 164 }, { "epoch": 0.02, "learning_rate": 1.1000000000000001e-05, "loss": 2.4894, "step": 165 }, { "epoch": 0.02, "learning_rate": 1.1066666666666669e-05, "loss": 2.5585, "step": 166 }, { "epoch": 0.02, "learning_rate": 1.1133333333333334e-05, "loss": 2.5138, "step": 167 }, { "epoch": 0.02, "learning_rate": 1.1200000000000001e-05, "loss": 2.4752, "step": 168 }, { "epoch": 0.02, "learning_rate": 1.1266666666666668e-05, "loss": 2.4226, "step": 169 }, { "epoch": 0.02, "learning_rate": 1.1333333333333334e-05, "loss": 2.6133, "step": 170 }, { "epoch": 0.02, "learning_rate": 1.14e-05, "loss": 2.4469, "step": 171 }, { "epoch": 0.02, "learning_rate": 1.1466666666666668e-05, "loss": 2.4937, "step": 172 }, { "epoch": 0.02, "learning_rate": 1.1533333333333334e-05, "loss": 2.5308, "step": 173 }, { "epoch": 0.02, "learning_rate": 1.16e-05, "loss": 2.6064, "step": 174 }, { "epoch": 0.02, "learning_rate": 1.1666666666666668e-05, "loss": 2.4965, "step": 175 }, { "epoch": 0.02, "learning_rate": 1.1733333333333335e-05, "loss": 2.6625, "step": 176 }, { "epoch": 0.02, "learning_rate": 1.18e-05, "loss": 2.4847, "step": 177 }, { "epoch": 0.02, "learning_rate": 1.186666666666667e-05, "loss": 2.5045, "step": 178 }, { "epoch": 0.02, "learning_rate": 1.1933333333333335e-05, "loss": 2.5201, "step": 179 }, { "epoch": 0.02, "learning_rate": 1.2e-05, "loss": 2.5224, "step": 180 }, { "epoch": 0.02, "learning_rate": 1.206666666666667e-05, "loss": 2.526, "step": 181 }, { "epoch": 0.02, "learning_rate": 1.2133333333333335e-05, "loss": 2.4803, "step": 182 }, { "epoch": 0.02, "learning_rate": 1.22e-05, "loss": 2.5252, "step": 183 }, { "epoch": 0.02, "learning_rate": 1.2266666666666667e-05, "loss": 2.5662, "step": 184 }, { "epoch": 0.02, "learning_rate": 1.2333333333333334e-05, "loss": 2.5612, "step": 185 }, { "epoch": 0.02, "learning_rate": 1.2400000000000002e-05, "loss": 2.5887, "step": 186 }, { "epoch": 0.02, "learning_rate": 1.2466666666666667e-05, "loss": 2.45, "step": 187 }, { "epoch": 0.02, "learning_rate": 1.2533333333333336e-05, "loss": 2.4882, "step": 188 }, { "epoch": 0.02, "learning_rate": 1.2600000000000001e-05, "loss": 2.537, "step": 189 }, { "epoch": 0.02, "learning_rate": 1.2666666666666667e-05, "loss": 2.5389, "step": 190 }, { "epoch": 0.02, "learning_rate": 1.2733333333333336e-05, "loss": 2.3777, "step": 191 }, { "epoch": 0.02, "learning_rate": 1.2800000000000001e-05, "loss": 2.4905, "step": 192 }, { "epoch": 0.02, "learning_rate": 1.2866666666666667e-05, "loss": 2.5256, "step": 193 }, { "epoch": 0.02, "learning_rate": 1.2933333333333334e-05, "loss": 2.5367, "step": 194 }, { "epoch": 0.02, "learning_rate": 1.3000000000000001e-05, "loss": 2.5348, "step": 195 }, { "epoch": 0.02, "learning_rate": 1.3066666666666668e-05, "loss": 2.4419, "step": 196 }, { "epoch": 0.02, "learning_rate": 1.3133333333333334e-05, "loss": 2.5714, "step": 197 }, { "epoch": 0.02, "learning_rate": 1.3200000000000002e-05, "loss": 2.5416, "step": 198 }, { "epoch": 0.02, "learning_rate": 1.3266666666666668e-05, "loss": 2.5707, "step": 199 }, { "epoch": 0.02, "learning_rate": 1.3333333333333333e-05, "loss": 2.531, "step": 200 }, { "epoch": 0.02, "learning_rate": 1.3400000000000002e-05, "loss": 2.5062, "step": 201 }, { "epoch": 0.02, "learning_rate": 1.3466666666666668e-05, "loss": 2.6095, "step": 202 }, { "epoch": 0.02, "learning_rate": 1.3533333333333333e-05, "loss": 2.4759, "step": 203 }, { "epoch": 0.02, "learning_rate": 1.3600000000000002e-05, "loss": 2.5454, "step": 204 }, { "epoch": 0.02, "learning_rate": 1.3666666666666667e-05, "loss": 2.518, "step": 205 }, { "epoch": 0.02, "learning_rate": 1.3733333333333335e-05, "loss": 2.5329, "step": 206 }, { "epoch": 0.02, "learning_rate": 1.38e-05, "loss": 2.4992, "step": 207 }, { "epoch": 0.02, "learning_rate": 1.3866666666666669e-05, "loss": 2.482, "step": 208 }, { "epoch": 0.02, "learning_rate": 1.3933333333333334e-05, "loss": 2.5622, "step": 209 }, { "epoch": 0.02, "learning_rate": 1.4e-05, "loss": 2.5993, "step": 210 }, { "epoch": 0.02, "learning_rate": 1.4066666666666669e-05, "loss": 2.6138, "step": 211 }, { "epoch": 0.02, "learning_rate": 1.4133333333333334e-05, "loss": 2.5508, "step": 212 }, { "epoch": 0.02, "learning_rate": 1.4200000000000001e-05, "loss": 2.5047, "step": 213 }, { "epoch": 0.02, "learning_rate": 1.4266666666666668e-05, "loss": 2.5221, "step": 214 }, { "epoch": 0.02, "learning_rate": 1.4333333333333334e-05, "loss": 2.5561, "step": 215 }, { "epoch": 0.02, "learning_rate": 1.4400000000000001e-05, "loss": 2.4706, "step": 216 }, { "epoch": 0.02, "learning_rate": 1.4466666666666668e-05, "loss": 2.5358, "step": 217 }, { "epoch": 0.02, "learning_rate": 1.4533333333333335e-05, "loss": 2.4321, "step": 218 }, { "epoch": 0.02, "learning_rate": 1.46e-05, "loss": 2.569, "step": 219 }, { "epoch": 0.02, "learning_rate": 1.4666666666666666e-05, "loss": 2.5549, "step": 220 }, { "epoch": 0.02, "learning_rate": 1.4733333333333335e-05, "loss": 2.4971, "step": 221 }, { "epoch": 0.02, "learning_rate": 1.48e-05, "loss": 2.5886, "step": 222 }, { "epoch": 0.02, "learning_rate": 1.4866666666666668e-05, "loss": 2.5319, "step": 223 }, { "epoch": 0.02, "learning_rate": 1.4933333333333335e-05, "loss": 2.5261, "step": 224 }, { "epoch": 0.02, "learning_rate": 1.5000000000000002e-05, "loss": 2.5296, "step": 225 }, { "epoch": 0.02, "learning_rate": 1.5066666666666668e-05, "loss": 2.4627, "step": 226 }, { "epoch": 0.02, "learning_rate": 1.5133333333333335e-05, "loss": 2.4887, "step": 227 }, { "epoch": 0.02, "learning_rate": 1.5200000000000002e-05, "loss": 2.4638, "step": 228 }, { "epoch": 0.02, "learning_rate": 1.5266666666666667e-05, "loss": 2.5179, "step": 229 }, { "epoch": 0.02, "learning_rate": 1.5333333333333334e-05, "loss": 2.6529, "step": 230 }, { "epoch": 0.02, "learning_rate": 1.54e-05, "loss": 2.6809, "step": 231 }, { "epoch": 0.02, "learning_rate": 1.546666666666667e-05, "loss": 2.5372, "step": 232 }, { "epoch": 0.02, "learning_rate": 1.5533333333333333e-05, "loss": 2.4777, "step": 233 }, { "epoch": 0.02, "learning_rate": 1.5600000000000003e-05, "loss": 2.5449, "step": 234 }, { "epoch": 0.02, "learning_rate": 1.5666666666666667e-05, "loss": 2.4774, "step": 235 }, { "epoch": 0.02, "learning_rate": 1.5733333333333334e-05, "loss": 2.5766, "step": 236 }, { "epoch": 0.02, "learning_rate": 1.58e-05, "loss": 2.5015, "step": 237 }, { "epoch": 0.02, "learning_rate": 1.586666666666667e-05, "loss": 2.5134, "step": 238 }, { "epoch": 0.02, "learning_rate": 1.5933333333333336e-05, "loss": 2.5379, "step": 239 }, { "epoch": 0.02, "learning_rate": 1.6000000000000003e-05, "loss": 2.6054, "step": 240 }, { "epoch": 0.02, "learning_rate": 1.606666666666667e-05, "loss": 2.522, "step": 241 }, { "epoch": 0.02, "learning_rate": 1.6133333333333334e-05, "loss": 2.5019, "step": 242 }, { "epoch": 0.02, "learning_rate": 1.62e-05, "loss": 2.5331, "step": 243 }, { "epoch": 0.02, "learning_rate": 1.6266666666666668e-05, "loss": 2.5916, "step": 244 }, { "epoch": 0.02, "learning_rate": 1.6333333333333335e-05, "loss": 2.5598, "step": 245 }, { "epoch": 0.02, "learning_rate": 1.64e-05, "loss": 2.4894, "step": 246 }, { "epoch": 0.02, "learning_rate": 1.646666666666667e-05, "loss": 2.6247, "step": 247 }, { "epoch": 0.02, "learning_rate": 1.6533333333333333e-05, "loss": 2.5145, "step": 248 }, { "epoch": 0.02, "learning_rate": 1.66e-05, "loss": 2.4985, "step": 249 }, { "epoch": 0.03, "learning_rate": 1.6666666666666667e-05, "loss": 2.5125, "step": 250 }, { "epoch": 0.03, "learning_rate": 1.6733333333333335e-05, "loss": 2.5301, "step": 251 }, { "epoch": 0.03, "learning_rate": 1.6800000000000002e-05, "loss": 2.5707, "step": 252 }, { "epoch": 0.03, "learning_rate": 1.686666666666667e-05, "loss": 2.6231, "step": 253 }, { "epoch": 0.03, "learning_rate": 1.6933333333333336e-05, "loss": 2.5282, "step": 254 }, { "epoch": 0.03, "learning_rate": 1.7e-05, "loss": 2.4811, "step": 255 }, { "epoch": 0.03, "learning_rate": 1.706666666666667e-05, "loss": 2.5375, "step": 256 }, { "epoch": 0.03, "learning_rate": 1.7133333333333334e-05, "loss": 2.5679, "step": 257 }, { "epoch": 0.03, "learning_rate": 1.72e-05, "loss": 2.4971, "step": 258 }, { "epoch": 0.03, "learning_rate": 1.726666666666667e-05, "loss": 2.5541, "step": 259 }, { "epoch": 0.03, "learning_rate": 1.7333333333333336e-05, "loss": 2.5327, "step": 260 }, { "epoch": 0.03, "learning_rate": 1.7400000000000003e-05, "loss": 2.5249, "step": 261 }, { "epoch": 0.03, "learning_rate": 1.7466666666666667e-05, "loss": 2.4568, "step": 262 }, { "epoch": 0.03, "learning_rate": 1.7533333333333337e-05, "loss": 2.5094, "step": 263 }, { "epoch": 0.03, "learning_rate": 1.76e-05, "loss": 2.492, "step": 264 }, { "epoch": 0.03, "learning_rate": 1.7666666666666668e-05, "loss": 2.6031, "step": 265 }, { "epoch": 0.03, "learning_rate": 1.7733333333333335e-05, "loss": 2.5785, "step": 266 }, { "epoch": 0.03, "learning_rate": 1.7800000000000002e-05, "loss": 2.5742, "step": 267 }, { "epoch": 0.03, "learning_rate": 1.7866666666666666e-05, "loss": 2.533, "step": 268 }, { "epoch": 0.03, "learning_rate": 1.7933333333333333e-05, "loss": 2.4925, "step": 269 }, { "epoch": 0.03, "learning_rate": 1.8e-05, "loss": 2.5669, "step": 270 }, { "epoch": 0.03, "learning_rate": 1.8066666666666668e-05, "loss": 2.5425, "step": 271 }, { "epoch": 0.03, "learning_rate": 1.8133333333333335e-05, "loss": 2.5786, "step": 272 }, { "epoch": 0.03, "learning_rate": 1.8200000000000002e-05, "loss": 2.4624, "step": 273 }, { "epoch": 0.03, "learning_rate": 1.826666666666667e-05, "loss": 2.5207, "step": 274 }, { "epoch": 0.03, "learning_rate": 1.8333333333333333e-05, "loss": 2.4979, "step": 275 }, { "epoch": 0.03, "learning_rate": 1.8400000000000003e-05, "loss": 2.5153, "step": 276 }, { "epoch": 0.03, "learning_rate": 1.8466666666666667e-05, "loss": 2.4946, "step": 277 }, { "epoch": 0.03, "learning_rate": 1.8533333333333334e-05, "loss": 2.4198, "step": 278 }, { "epoch": 0.03, "learning_rate": 1.86e-05, "loss": 2.5295, "step": 279 }, { "epoch": 0.03, "learning_rate": 1.866666666666667e-05, "loss": 2.507, "step": 280 }, { "epoch": 0.03, "learning_rate": 1.8733333333333336e-05, "loss": 2.492, "step": 281 }, { "epoch": 0.03, "learning_rate": 1.88e-05, "loss": 2.4671, "step": 282 }, { "epoch": 0.03, "learning_rate": 1.886666666666667e-05, "loss": 2.5449, "step": 283 }, { "epoch": 0.03, "learning_rate": 1.8933333333333334e-05, "loss": 2.4647, "step": 284 }, { "epoch": 0.03, "learning_rate": 1.9e-05, "loss": 2.5323, "step": 285 }, { "epoch": 0.03, "learning_rate": 1.9066666666666668e-05, "loss": 2.5811, "step": 286 }, { "epoch": 0.03, "learning_rate": 1.9133333333333335e-05, "loss": 2.4839, "step": 287 }, { "epoch": 0.03, "learning_rate": 1.9200000000000003e-05, "loss": 2.5328, "step": 288 }, { "epoch": 0.03, "learning_rate": 1.926666666666667e-05, "loss": 2.5326, "step": 289 }, { "epoch": 0.03, "learning_rate": 1.9333333333333333e-05, "loss": 2.5704, "step": 290 }, { "epoch": 0.03, "learning_rate": 1.94e-05, "loss": 2.5132, "step": 291 }, { "epoch": 0.03, "learning_rate": 1.9466666666666668e-05, "loss": 2.604, "step": 292 }, { "epoch": 0.03, "learning_rate": 1.9533333333333335e-05, "loss": 2.5654, "step": 293 }, { "epoch": 0.03, "learning_rate": 1.9600000000000002e-05, "loss": 2.5277, "step": 294 }, { "epoch": 0.03, "learning_rate": 1.9666666666666666e-05, "loss": 2.3933, "step": 295 }, { "epoch": 0.03, "learning_rate": 1.9733333333333336e-05, "loss": 2.5401, "step": 296 }, { "epoch": 0.03, "learning_rate": 1.98e-05, "loss": 2.3431, "step": 297 }, { "epoch": 0.03, "learning_rate": 1.9866666666666667e-05, "loss": 2.4149, "step": 298 }, { "epoch": 0.03, "learning_rate": 1.9933333333333334e-05, "loss": 2.505, "step": 299 }, { "epoch": 0.03, "learning_rate": 2e-05, "loss": 2.6363, "step": 300 }, { "epoch": 0.03, "learning_rate": 1.9999999473462502e-05, "loss": 2.5307, "step": 301 }, { "epoch": 0.03, "learning_rate": 1.9999997893850064e-05, "loss": 2.5656, "step": 302 }, { "epoch": 0.03, "learning_rate": 1.999999526116285e-05, "loss": 2.555, "step": 303 }, { "epoch": 0.03, "learning_rate": 1.999999157540114e-05, "loss": 2.4498, "step": 304 }, { "epoch": 0.03, "learning_rate": 1.9999986836565317e-05, "loss": 2.6986, "step": 305 }, { "epoch": 0.03, "learning_rate": 1.9999981044655885e-05, "loss": 2.4816, "step": 306 }, { "epoch": 0.03, "learning_rate": 1.9999974199673452e-05, "loss": 2.4785, "step": 307 }, { "epoch": 0.03, "learning_rate": 1.9999966301618744e-05, "loss": 2.4968, "step": 308 }, { "epoch": 0.03, "learning_rate": 1.999995735049258e-05, "loss": 2.5629, "step": 309 }, { "epoch": 0.03, "learning_rate": 1.9999947346295915e-05, "loss": 2.5939, "step": 310 }, { "epoch": 0.03, "learning_rate": 1.99999362890298e-05, "loss": 2.4865, "step": 311 }, { "epoch": 0.03, "learning_rate": 1.9999924178695397e-05, "loss": 2.582, "step": 312 }, { "epoch": 0.03, "learning_rate": 1.999991101529398e-05, "loss": 2.6115, "step": 313 }, { "epoch": 0.03, "learning_rate": 1.999989679882694e-05, "loss": 2.5391, "step": 314 }, { "epoch": 0.03, "learning_rate": 1.9999881529295767e-05, "loss": 2.5998, "step": 315 }, { "epoch": 0.03, "learning_rate": 1.999986520670208e-05, "loss": 2.6243, "step": 316 }, { "epoch": 0.03, "learning_rate": 1.9999847831047585e-05, "loss": 2.4599, "step": 317 }, { "epoch": 0.03, "learning_rate": 1.9999829402334118e-05, "loss": 2.5385, "step": 318 }, { "epoch": 0.03, "learning_rate": 1.9999809920563626e-05, "loss": 2.4378, "step": 319 }, { "epoch": 0.03, "learning_rate": 1.9999789385738148e-05, "loss": 2.5138, "step": 320 }, { "epoch": 0.03, "learning_rate": 1.9999767797859853e-05, "loss": 2.5044, "step": 321 }, { "epoch": 0.03, "learning_rate": 1.9999745156931018e-05, "loss": 2.6465, "step": 322 }, { "epoch": 0.03, "learning_rate": 1.9999721462954018e-05, "loss": 2.5958, "step": 323 }, { "epoch": 0.03, "learning_rate": 1.9999696715931356e-05, "loss": 2.5258, "step": 324 }, { "epoch": 0.03, "learning_rate": 1.9999670915865635e-05, "loss": 2.5275, "step": 325 }, { "epoch": 0.03, "learning_rate": 1.9999644062759576e-05, "loss": 2.462, "step": 326 }, { "epoch": 0.03, "learning_rate": 1.9999616156616e-05, "loss": 2.487, "step": 327 }, { "epoch": 0.03, "learning_rate": 1.9999587197437852e-05, "loss": 2.5236, "step": 328 }, { "epoch": 0.03, "learning_rate": 1.9999557185228172e-05, "loss": 2.5199, "step": 329 }, { "epoch": 0.03, "learning_rate": 1.9999526119990133e-05, "loss": 2.5379, "step": 330 }, { "epoch": 0.03, "learning_rate": 1.9999494001727e-05, "loss": 2.5502, "step": 331 }, { "epoch": 0.03, "learning_rate": 1.999946083044215e-05, "loss": 2.5739, "step": 332 }, { "epoch": 0.03, "learning_rate": 1.999942660613909e-05, "loss": 2.515, "step": 333 }, { "epoch": 0.03, "learning_rate": 1.9999391328821415e-05, "loss": 2.5159, "step": 334 }, { "epoch": 0.03, "learning_rate": 1.9999354998492838e-05, "loss": 2.5727, "step": 335 }, { "epoch": 0.03, "learning_rate": 1.9999317615157187e-05, "loss": 2.5665, "step": 336 }, { "epoch": 0.03, "learning_rate": 1.99992791788184e-05, "loss": 2.4275, "step": 337 }, { "epoch": 0.03, "learning_rate": 1.9999239689480526e-05, "loss": 2.485, "step": 338 }, { "epoch": 0.03, "learning_rate": 1.9999199147147723e-05, "loss": 2.5728, "step": 339 }, { "epoch": 0.03, "learning_rate": 1.9999157551824258e-05, "loss": 2.511, "step": 340 }, { "epoch": 0.03, "learning_rate": 1.999911490351451e-05, "loss": 2.6095, "step": 341 }, { "epoch": 0.03, "learning_rate": 1.9999071202222974e-05, "loss": 2.5097, "step": 342 }, { "epoch": 0.03, "learning_rate": 1.9999026447954252e-05, "loss": 2.5294, "step": 343 }, { "epoch": 0.03, "learning_rate": 1.9998980640713056e-05, "loss": 2.5359, "step": 344 }, { "epoch": 0.03, "learning_rate": 1.999893378050421e-05, "loss": 2.5947, "step": 345 }, { "epoch": 0.03, "learning_rate": 1.9998885867332646e-05, "loss": 2.5955, "step": 346 }, { "epoch": 0.03, "learning_rate": 1.9998836901203416e-05, "loss": 2.5543, "step": 347 }, { "epoch": 0.03, "learning_rate": 1.9998786882121667e-05, "loss": 2.5647, "step": 348 }, { "epoch": 0.03, "learning_rate": 1.9998735810092676e-05, "loss": 2.5203, "step": 349 }, { "epoch": 0.04, "learning_rate": 1.9998683685121816e-05, "loss": 2.5167, "step": 350 }, { "epoch": 0.04, "learning_rate": 1.9998630507214578e-05, "loss": 2.4052, "step": 351 }, { "epoch": 0.04, "learning_rate": 1.999857627637656e-05, "loss": 2.5254, "step": 352 }, { "epoch": 0.04, "learning_rate": 1.9998520992613475e-05, "loss": 2.5367, "step": 353 }, { "epoch": 0.04, "learning_rate": 1.9998464655931144e-05, "loss": 2.4931, "step": 354 }, { "epoch": 0.04, "learning_rate": 1.9998407266335498e-05, "loss": 2.4881, "step": 355 }, { "epoch": 0.04, "learning_rate": 1.9998348823832582e-05, "loss": 2.5302, "step": 356 }, { "epoch": 0.04, "learning_rate": 1.9998289328428553e-05, "loss": 2.4631, "step": 357 }, { "epoch": 0.04, "learning_rate": 1.9998228780129675e-05, "loss": 2.4864, "step": 358 }, { "epoch": 0.04, "learning_rate": 1.9998167178942318e-05, "loss": 2.5266, "step": 359 }, { "epoch": 0.04, "learning_rate": 1.999810452487298e-05, "loss": 2.4915, "step": 360 }, { "epoch": 0.04, "learning_rate": 1.9998040817928248e-05, "loss": 2.5352, "step": 361 }, { "epoch": 0.04, "learning_rate": 1.9997976058114837e-05, "loss": 2.5273, "step": 362 }, { "epoch": 0.04, "learning_rate": 1.9997910245439568e-05, "loss": 2.5303, "step": 363 }, { "epoch": 0.04, "learning_rate": 1.999784337990937e-05, "loss": 2.5215, "step": 364 }, { "epoch": 0.04, "learning_rate": 1.999777546153128e-05, "loss": 2.4489, "step": 365 }, { "epoch": 0.04, "learning_rate": 1.9997706490312455e-05, "loss": 2.455, "step": 366 }, { "epoch": 0.04, "learning_rate": 1.9997636466260163e-05, "loss": 2.584, "step": 367 }, { "epoch": 0.04, "learning_rate": 1.9997565389381765e-05, "loss": 2.5838, "step": 368 }, { "epoch": 0.04, "learning_rate": 1.9997493259684754e-05, "loss": 2.5447, "step": 369 }, { "epoch": 0.04, "learning_rate": 1.9997420077176727e-05, "loss": 2.486, "step": 370 }, { "epoch": 0.04, "learning_rate": 1.999734584186539e-05, "loss": 2.4638, "step": 371 }, { "epoch": 0.04, "learning_rate": 1.9997270553758557e-05, "loss": 2.5974, "step": 372 }, { "epoch": 0.04, "learning_rate": 1.999719421286416e-05, "loss": 2.4976, "step": 373 }, { "epoch": 0.04, "learning_rate": 1.9997116819190238e-05, "loss": 2.5544, "step": 374 }, { "epoch": 0.04, "learning_rate": 1.999703837274494e-05, "loss": 2.3968, "step": 375 }, { "epoch": 0.04, "learning_rate": 1.999695887353652e-05, "loss": 2.6879, "step": 376 }, { "epoch": 0.04, "learning_rate": 1.9996878321573363e-05, "loss": 2.496, "step": 377 }, { "epoch": 0.04, "learning_rate": 1.9996796716863943e-05, "loss": 2.4768, "step": 378 }, { "epoch": 0.04, "learning_rate": 1.9996714059416857e-05, "loss": 2.5219, "step": 379 }, { "epoch": 0.04, "learning_rate": 1.999663034924081e-05, "loss": 2.5442, "step": 380 }, { "epoch": 0.04, "learning_rate": 1.9996545586344616e-05, "loss": 2.5981, "step": 381 }, { "epoch": 0.04, "learning_rate": 1.99964597707372e-05, "loss": 2.5783, "step": 382 }, { "epoch": 0.04, "learning_rate": 1.9996372902427598e-05, "loss": 2.5177, "step": 383 }, { "epoch": 0.04, "learning_rate": 1.9996284981424963e-05, "loss": 2.5465, "step": 384 }, { "epoch": 0.04, "learning_rate": 1.999619600773855e-05, "loss": 2.5295, "step": 385 }, { "epoch": 0.04, "learning_rate": 1.999610598137773e-05, "loss": 2.5512, "step": 386 }, { "epoch": 0.04, "learning_rate": 1.9996014902351983e-05, "loss": 2.4786, "step": 387 }, { "epoch": 0.04, "learning_rate": 1.9995922770670897e-05, "loss": 2.4029, "step": 388 }, { "epoch": 0.04, "learning_rate": 1.999582958634418e-05, "loss": 2.5599, "step": 389 }, { "epoch": 0.04, "learning_rate": 1.999573534938164e-05, "loss": 2.4123, "step": 390 }, { "epoch": 0.04, "learning_rate": 1.9995640059793206e-05, "loss": 2.5963, "step": 391 }, { "epoch": 0.04, "learning_rate": 1.9995543717588908e-05, "loss": 2.4379, "step": 392 }, { "epoch": 0.04, "learning_rate": 1.9995446322778894e-05, "loss": 2.3748, "step": 393 }, { "epoch": 0.04, "learning_rate": 1.999534787537342e-05, "loss": 2.5341, "step": 394 }, { "epoch": 0.04, "learning_rate": 1.9995248375382853e-05, "loss": 2.4378, "step": 395 }, { "epoch": 0.04, "learning_rate": 1.9995147822817667e-05, "loss": 2.6469, "step": 396 }, { "epoch": 0.04, "learning_rate": 1.999504621768846e-05, "loss": 2.4613, "step": 397 }, { "epoch": 0.04, "learning_rate": 1.9994943560005924e-05, "loss": 2.523, "step": 398 }, { "epoch": 0.04, "learning_rate": 1.999483984978088e-05, "loss": 2.5012, "step": 399 }, { "epoch": 0.04, "learning_rate": 1.9994735087024232e-05, "loss": 2.4657, "step": 400 }, { "epoch": 0.04, "learning_rate": 1.9994629271747027e-05, "loss": 2.4376, "step": 401 }, { "epoch": 0.04, "learning_rate": 1.9994522403960404e-05, "loss": 2.5781, "step": 402 }, { "epoch": 0.04, "learning_rate": 1.9994414483675614e-05, "loss": 2.4739, "step": 403 }, { "epoch": 0.04, "learning_rate": 1.9994305510904026e-05, "loss": 2.6079, "step": 404 }, { "epoch": 0.04, "learning_rate": 1.9994195485657113e-05, "loss": 2.458, "step": 405 }, { "epoch": 0.04, "learning_rate": 1.999408440794646e-05, "loss": 2.5382, "step": 406 }, { "epoch": 0.04, "learning_rate": 1.999397227778377e-05, "loss": 2.4843, "step": 407 }, { "epoch": 0.04, "learning_rate": 1.9993859095180848e-05, "loss": 2.4869, "step": 408 }, { "epoch": 0.04, "learning_rate": 1.999374486014961e-05, "loss": 2.5266, "step": 409 }, { "epoch": 0.04, "learning_rate": 1.999362957270209e-05, "loss": 2.5052, "step": 410 }, { "epoch": 0.04, "learning_rate": 1.9993513232850428e-05, "loss": 2.4692, "step": 411 }, { "epoch": 0.04, "learning_rate": 1.9993395840606875e-05, "loss": 2.4712, "step": 412 }, { "epoch": 0.04, "learning_rate": 1.999327739598379e-05, "loss": 2.4573, "step": 413 }, { "epoch": 0.04, "learning_rate": 1.9993157898993654e-05, "loss": 2.5959, "step": 414 }, { "epoch": 0.04, "learning_rate": 1.9993037349649042e-05, "loss": 2.3877, "step": 415 }, { "epoch": 0.04, "learning_rate": 1.9992915747962653e-05, "loss": 2.5971, "step": 416 }, { "epoch": 0.04, "learning_rate": 1.999279309394729e-05, "loss": 2.4907, "step": 417 }, { "epoch": 0.04, "learning_rate": 1.9992669387615878e-05, "loss": 2.536, "step": 418 }, { "epoch": 0.04, "learning_rate": 1.999254462898143e-05, "loss": 2.5011, "step": 419 }, { "epoch": 0.04, "learning_rate": 1.99924188180571e-05, "loss": 2.549, "step": 420 }, { "epoch": 0.04, "learning_rate": 1.9992291954856125e-05, "loss": 2.4392, "step": 421 }, { "epoch": 0.04, "learning_rate": 1.9992164039391867e-05, "loss": 2.4971, "step": 422 }, { "epoch": 0.04, "learning_rate": 1.99920350716778e-05, "loss": 2.4399, "step": 423 }, { "epoch": 0.04, "learning_rate": 1.9991905051727504e-05, "loss": 2.508, "step": 424 }, { "epoch": 0.04, "learning_rate": 1.9991773979554667e-05, "loss": 2.3993, "step": 425 }, { "epoch": 0.04, "learning_rate": 1.9991641855173095e-05, "loss": 2.6448, "step": 426 }, { "epoch": 0.04, "learning_rate": 1.9991508678596704e-05, "loss": 2.5285, "step": 427 }, { "epoch": 0.04, "learning_rate": 1.999137444983952e-05, "loss": 2.5185, "step": 428 }, { "epoch": 0.04, "learning_rate": 1.999123916891567e-05, "loss": 2.5133, "step": 429 }, { "epoch": 0.04, "learning_rate": 1.99911028358394e-05, "loss": 2.4964, "step": 430 }, { "epoch": 0.04, "learning_rate": 1.999096545062508e-05, "loss": 2.6085, "step": 431 }, { "epoch": 0.04, "learning_rate": 1.9990827013287164e-05, "loss": 2.5334, "step": 432 }, { "epoch": 0.04, "learning_rate": 1.9990687523840234e-05, "loss": 2.438, "step": 433 }, { "epoch": 0.04, "learning_rate": 1.9990546982298986e-05, "loss": 2.5391, "step": 434 }, { "epoch": 0.04, "learning_rate": 1.9990405388678216e-05, "loss": 2.4862, "step": 435 }, { "epoch": 0.04, "learning_rate": 1.999026274299283e-05, "loss": 2.5381, "step": 436 }, { "epoch": 0.04, "learning_rate": 1.9990119045257854e-05, "loss": 2.5539, "step": 437 }, { "epoch": 0.04, "learning_rate": 1.9989974295488422e-05, "loss": 2.4969, "step": 438 }, { "epoch": 0.04, "learning_rate": 1.9989828493699773e-05, "loss": 2.4687, "step": 439 }, { "epoch": 0.04, "learning_rate": 1.9989681639907267e-05, "loss": 2.4548, "step": 440 }, { "epoch": 0.04, "learning_rate": 1.998953373412636e-05, "loss": 2.4988, "step": 441 }, { "epoch": 0.04, "learning_rate": 1.9989384776372637e-05, "loss": 2.3674, "step": 442 }, { "epoch": 0.04, "learning_rate": 1.9989234766661777e-05, "loss": 2.4785, "step": 443 }, { "epoch": 0.04, "learning_rate": 1.9989083705009583e-05, "loss": 2.5715, "step": 444 }, { "epoch": 0.04, "learning_rate": 1.998893159143196e-05, "loss": 2.5831, "step": 445 }, { "epoch": 0.04, "learning_rate": 1.9988778425944924e-05, "loss": 2.5044, "step": 446 }, { "epoch": 0.04, "learning_rate": 1.998862420856461e-05, "loss": 2.6119, "step": 447 }, { "epoch": 0.04, "learning_rate": 1.9988468939307252e-05, "loss": 2.4603, "step": 448 }, { "epoch": 0.04, "learning_rate": 1.9988312618189208e-05, "loss": 2.5048, "step": 449 }, { "epoch": 0.05, "learning_rate": 1.9988155245226934e-05, "loss": 2.4734, "step": 450 }, { "epoch": 0.05, "learning_rate": 1.998799682043701e-05, "loss": 2.4875, "step": 451 }, { "epoch": 0.05, "learning_rate": 1.9987837343836108e-05, "loss": 2.5163, "step": 452 }, { "epoch": 0.05, "learning_rate": 1.998767681544103e-05, "loss": 2.5104, "step": 453 }, { "epoch": 0.05, "learning_rate": 1.9987515235268682e-05, "loss": 2.5435, "step": 454 }, { "epoch": 0.05, "learning_rate": 1.9987352603336076e-05, "loss": 2.4723, "step": 455 }, { "epoch": 0.05, "learning_rate": 1.998718891966034e-05, "loss": 2.456, "step": 456 }, { "epoch": 0.05, "learning_rate": 1.9987024184258705e-05, "loss": 2.5365, "step": 457 }, { "epoch": 0.05, "learning_rate": 1.9986858397148526e-05, "loss": 2.615, "step": 458 }, { "epoch": 0.05, "learning_rate": 1.998669155834726e-05, "loss": 2.5073, "step": 459 }, { "epoch": 0.05, "learning_rate": 1.998652366787248e-05, "loss": 2.5643, "step": 460 }, { "epoch": 0.05, "learning_rate": 1.9986354725741857e-05, "loss": 2.4613, "step": 461 }, { "epoch": 0.05, "learning_rate": 1.9986184731973193e-05, "loss": 2.4603, "step": 462 }, { "epoch": 0.05, "learning_rate": 1.998601368658438e-05, "loss": 2.4177, "step": 463 }, { "epoch": 0.05, "learning_rate": 1.9985841589593434e-05, "loss": 2.4737, "step": 464 }, { "epoch": 0.05, "learning_rate": 1.9985668441018478e-05, "loss": 2.5948, "step": 465 }, { "epoch": 0.05, "learning_rate": 1.998549424087775e-05, "loss": 2.4667, "step": 466 }, { "epoch": 0.05, "learning_rate": 1.9985318989189585e-05, "loss": 2.4201, "step": 467 }, { "epoch": 0.05, "learning_rate": 1.998514268597245e-05, "loss": 2.4639, "step": 468 }, { "epoch": 0.05, "learning_rate": 1.99849653312449e-05, "loss": 2.5545, "step": 469 }, { "epoch": 0.05, "learning_rate": 1.9984786925025617e-05, "loss": 2.5149, "step": 470 }, { "epoch": 0.05, "learning_rate": 1.998460746733339e-05, "loss": 2.4898, "step": 471 }, { "epoch": 0.05, "learning_rate": 1.9984426958187115e-05, "loss": 2.4624, "step": 472 }, { "epoch": 0.05, "learning_rate": 1.99842453976058e-05, "loss": 2.493, "step": 473 }, { "epoch": 0.05, "learning_rate": 1.9984062785608568e-05, "loss": 2.4814, "step": 474 }, { "epoch": 0.05, "learning_rate": 1.998387912221465e-05, "loss": 2.5352, "step": 475 }, { "epoch": 0.05, "learning_rate": 1.998369440744338e-05, "loss": 2.519, "step": 476 }, { "epoch": 0.05, "learning_rate": 1.998350864131422e-05, "loss": 2.5346, "step": 477 }, { "epoch": 0.05, "learning_rate": 1.998332182384672e-05, "loss": 2.4182, "step": 478 }, { "epoch": 0.05, "learning_rate": 1.9983133955060567e-05, "loss": 2.487, "step": 479 }, { "epoch": 0.05, "learning_rate": 1.9982945034975537e-05, "loss": 2.5514, "step": 480 }, { "epoch": 0.05, "learning_rate": 1.9982755063611522e-05, "loss": 2.4571, "step": 481 }, { "epoch": 0.05, "learning_rate": 1.9982564040988536e-05, "loss": 2.5098, "step": 482 }, { "epoch": 0.05, "learning_rate": 1.998237196712669e-05, "loss": 2.4514, "step": 483 }, { "epoch": 0.05, "learning_rate": 1.998217884204621e-05, "loss": 2.454, "step": 484 }, { "epoch": 0.05, "learning_rate": 1.9981984665767435e-05, "loss": 2.4763, "step": 485 }, { "epoch": 0.05, "learning_rate": 1.9981789438310814e-05, "loss": 2.5675, "step": 486 }, { "epoch": 0.05, "learning_rate": 1.9981593159696905e-05, "loss": 2.3775, "step": 487 }, { "epoch": 0.05, "learning_rate": 1.9981395829946376e-05, "loss": 2.5676, "step": 488 }, { "epoch": 0.05, "learning_rate": 1.9981197449080012e-05, "loss": 2.4557, "step": 489 }, { "epoch": 0.05, "learning_rate": 1.9980998017118704e-05, "loss": 2.4516, "step": 490 }, { "epoch": 0.05, "learning_rate": 1.9980797534083444e-05, "loss": 2.4759, "step": 491 }, { "epoch": 0.05, "learning_rate": 1.9980595999995354e-05, "loss": 2.5353, "step": 492 }, { "epoch": 0.05, "learning_rate": 1.9980393414875654e-05, "loss": 2.5315, "step": 493 }, { "epoch": 0.05, "learning_rate": 1.998018977874568e-05, "loss": 2.4876, "step": 494 }, { "epoch": 0.05, "learning_rate": 1.9979985091626868e-05, "loss": 2.5313, "step": 495 }, { "epoch": 0.05, "learning_rate": 1.9979779353540785e-05, "loss": 2.5437, "step": 496 }, { "epoch": 0.05, "learning_rate": 1.997957256450909e-05, "loss": 2.5609, "step": 497 }, { "epoch": 0.05, "learning_rate": 1.997936472455356e-05, "loss": 2.449, "step": 498 }, { "epoch": 0.05, "learning_rate": 1.9979155833696082e-05, "loss": 2.6204, "step": 499 }, { "epoch": 0.05, "learning_rate": 1.9978945891958656e-05, "loss": 2.4763, "step": 500 }, { "epoch": 0.05, "learning_rate": 1.9978734899363387e-05, "loss": 2.4951, "step": 501 }, { "epoch": 0.05, "learning_rate": 1.9978522855932498e-05, "loss": 2.4856, "step": 502 }, { "epoch": 0.05, "learning_rate": 1.9978309761688316e-05, "loss": 2.4736, "step": 503 }, { "epoch": 0.05, "learning_rate": 1.997809561665328e-05, "loss": 2.4864, "step": 504 }, { "epoch": 0.05, "learning_rate": 1.9977880420849945e-05, "loss": 2.6175, "step": 505 }, { "epoch": 0.05, "learning_rate": 1.997766417430097e-05, "loss": 2.5319, "step": 506 }, { "epoch": 0.05, "learning_rate": 1.9977446877029134e-05, "loss": 2.463, "step": 507 }, { "epoch": 0.05, "learning_rate": 1.997722852905731e-05, "loss": 2.5182, "step": 508 }, { "epoch": 0.05, "learning_rate": 1.9977009130408495e-05, "loss": 2.5305, "step": 509 }, { "epoch": 0.05, "learning_rate": 1.9976788681105795e-05, "loss": 2.47, "step": 510 }, { "epoch": 0.05, "learning_rate": 1.9976567181172427e-05, "loss": 2.4968, "step": 511 }, { "epoch": 0.05, "learning_rate": 1.9976344630631714e-05, "loss": 2.4267, "step": 512 }, { "epoch": 0.05, "learning_rate": 1.9976121029507088e-05, "loss": 2.6084, "step": 513 }, { "epoch": 0.05, "learning_rate": 1.99758963778221e-05, "loss": 2.6059, "step": 514 }, { "epoch": 0.05, "learning_rate": 1.997567067560041e-05, "loss": 2.4494, "step": 515 }, { "epoch": 0.05, "learning_rate": 1.9975443922865784e-05, "loss": 2.5164, "step": 516 }, { "epoch": 0.05, "learning_rate": 1.99752161196421e-05, "loss": 2.5004, "step": 517 }, { "epoch": 0.05, "learning_rate": 1.997498726595335e-05, "loss": 2.4915, "step": 518 }, { "epoch": 0.05, "learning_rate": 1.9974757361823628e-05, "loss": 2.5856, "step": 519 }, { "epoch": 0.05, "learning_rate": 1.997452640727715e-05, "loss": 2.6151, "step": 520 }, { "epoch": 0.05, "learning_rate": 1.9974294402338237e-05, "loss": 2.6082, "step": 521 }, { "epoch": 0.05, "learning_rate": 1.997406134703132e-05, "loss": 2.4376, "step": 522 }, { "epoch": 0.05, "learning_rate": 1.997382724138094e-05, "loss": 2.6183, "step": 523 }, { "epoch": 0.05, "learning_rate": 1.997359208541175e-05, "loss": 2.4892, "step": 524 }, { "epoch": 0.05, "learning_rate": 1.9973355879148518e-05, "loss": 2.481, "step": 525 }, { "epoch": 0.05, "learning_rate": 1.997311862261611e-05, "loss": 2.5075, "step": 526 }, { "epoch": 0.05, "learning_rate": 1.9972880315839523e-05, "loss": 2.4574, "step": 527 }, { "epoch": 0.05, "learning_rate": 1.997264095884384e-05, "loss": 2.4653, "step": 528 }, { "epoch": 0.05, "learning_rate": 1.9972400551654275e-05, "loss": 2.4287, "step": 529 }, { "epoch": 0.05, "learning_rate": 1.9972159094296142e-05, "loss": 2.47, "step": 530 }, { "epoch": 0.05, "learning_rate": 1.9971916586794866e-05, "loss": 2.4869, "step": 531 }, { "epoch": 0.05, "learning_rate": 1.9971673029175992e-05, "loss": 2.4792, "step": 532 }, { "epoch": 0.05, "learning_rate": 1.997142842146516e-05, "loss": 2.5195, "step": 533 }, { "epoch": 0.05, "learning_rate": 1.9971182763688134e-05, "loss": 2.5148, "step": 534 }, { "epoch": 0.05, "learning_rate": 1.9970936055870785e-05, "loss": 2.6105, "step": 535 }, { "epoch": 0.05, "learning_rate": 1.997068829803909e-05, "loss": 2.4623, "step": 536 }, { "epoch": 0.05, "learning_rate": 1.9970439490219137e-05, "loss": 2.4341, "step": 537 }, { "epoch": 0.05, "learning_rate": 1.9970189632437134e-05, "loss": 2.4391, "step": 538 }, { "epoch": 0.05, "learning_rate": 1.9969938724719388e-05, "loss": 2.514, "step": 539 }, { "epoch": 0.05, "learning_rate": 1.9969686767092324e-05, "loss": 2.5331, "step": 540 }, { "epoch": 0.05, "learning_rate": 1.9969433759582473e-05, "loss": 2.5327, "step": 541 }, { "epoch": 0.05, "learning_rate": 1.9969179702216484e-05, "loss": 2.5317, "step": 542 }, { "epoch": 0.05, "learning_rate": 1.9968924595021103e-05, "loss": 2.5216, "step": 543 }, { "epoch": 0.05, "learning_rate": 1.9968668438023197e-05, "loss": 2.522, "step": 544 }, { "epoch": 0.05, "learning_rate": 1.9968411231249746e-05, "loss": 2.4694, "step": 545 }, { "epoch": 0.05, "learning_rate": 1.996815297472783e-05, "loss": 2.5139, "step": 546 }, { "epoch": 0.05, "learning_rate": 1.9967893668484653e-05, "loss": 2.4842, "step": 547 }, { "epoch": 0.05, "learning_rate": 1.9967633312547513e-05, "loss": 2.3592, "step": 548 }, { "epoch": 0.06, "learning_rate": 1.996737190694383e-05, "loss": 2.4599, "step": 549 }, { "epoch": 0.06, "learning_rate": 1.9967109451701138e-05, "loss": 2.4099, "step": 550 }, { "epoch": 0.06, "learning_rate": 1.9966845946847066e-05, "loss": 2.5485, "step": 551 }, { "epoch": 0.06, "learning_rate": 1.9966581392409373e-05, "loss": 2.4462, "step": 552 }, { "epoch": 0.06, "learning_rate": 1.9966315788415912e-05, "loss": 2.4479, "step": 553 }, { "epoch": 0.06, "learning_rate": 1.996604913489465e-05, "loss": 2.4504, "step": 554 }, { "epoch": 0.06, "learning_rate": 1.9965781431873676e-05, "loss": 2.5061, "step": 555 }, { "epoch": 0.06, "learning_rate": 1.996551267938118e-05, "loss": 2.4979, "step": 556 }, { "epoch": 0.06, "learning_rate": 1.9965242877445453e-05, "loss": 2.5088, "step": 557 }, { "epoch": 0.06, "learning_rate": 1.9964972026094923e-05, "loss": 2.5166, "step": 558 }, { "epoch": 0.06, "learning_rate": 1.99647001253581e-05, "loss": 2.4412, "step": 559 }, { "epoch": 0.06, "learning_rate": 1.996442717526362e-05, "loss": 2.5052, "step": 560 }, { "epoch": 0.06, "learning_rate": 1.9964153175840234e-05, "loss": 2.498, "step": 561 }, { "epoch": 0.06, "learning_rate": 1.996387812711679e-05, "loss": 2.4824, "step": 562 }, { "epoch": 0.06, "learning_rate": 1.996360202912225e-05, "loss": 2.5992, "step": 563 }, { "epoch": 0.06, "learning_rate": 1.9963324881885695e-05, "loss": 2.4954, "step": 564 }, { "epoch": 0.06, "learning_rate": 1.996304668543631e-05, "loss": 2.4934, "step": 565 }, { "epoch": 0.06, "learning_rate": 1.9962767439803387e-05, "loss": 2.5209, "step": 566 }, { "epoch": 0.06, "learning_rate": 1.9962487145016335e-05, "loss": 2.5096, "step": 567 }, { "epoch": 0.06, "learning_rate": 1.9962205801104673e-05, "loss": 2.4612, "step": 568 }, { "epoch": 0.06, "learning_rate": 1.996192340809803e-05, "loss": 2.5329, "step": 569 }, { "epoch": 0.06, "learning_rate": 1.9961639966026137e-05, "loss": 2.5204, "step": 570 }, { "epoch": 0.06, "learning_rate": 1.9961355474918846e-05, "loss": 2.4488, "step": 571 }, { "epoch": 0.06, "learning_rate": 1.996106993480612e-05, "loss": 2.4942, "step": 572 }, { "epoch": 0.06, "learning_rate": 1.9960783345718023e-05, "loss": 2.461, "step": 573 }, { "epoch": 0.06, "learning_rate": 1.9960495707684738e-05, "loss": 2.3387, "step": 574 }, { "epoch": 0.06, "learning_rate": 1.9960207020736554e-05, "loss": 2.4938, "step": 575 }, { "epoch": 0.06, "learning_rate": 1.995991728490387e-05, "loss": 2.475, "step": 576 }, { "epoch": 0.06, "learning_rate": 1.9959626500217203e-05, "loss": 2.5129, "step": 577 }, { "epoch": 0.06, "learning_rate": 1.995933466670717e-05, "loss": 2.456, "step": 578 }, { "epoch": 0.06, "learning_rate": 1.995904178440451e-05, "loss": 2.4786, "step": 579 }, { "epoch": 0.06, "learning_rate": 1.9958747853340057e-05, "loss": 2.4605, "step": 580 }, { "epoch": 0.06, "learning_rate": 1.9958452873544768e-05, "loss": 2.4717, "step": 581 }, { "epoch": 0.06, "learning_rate": 1.9958156845049705e-05, "loss": 2.538, "step": 582 }, { "epoch": 0.06, "learning_rate": 1.9957859767886045e-05, "loss": 2.5705, "step": 583 }, { "epoch": 0.06, "learning_rate": 1.995756164208507e-05, "loss": 2.5451, "step": 584 }, { "epoch": 0.06, "learning_rate": 1.995726246767818e-05, "loss": 2.4095, "step": 585 }, { "epoch": 0.06, "learning_rate": 1.9956962244696873e-05, "loss": 2.5196, "step": 586 }, { "epoch": 0.06, "learning_rate": 1.9956660973172767e-05, "loss": 2.5121, "step": 587 }, { "epoch": 0.06, "learning_rate": 1.9956358653137588e-05, "loss": 2.5874, "step": 588 }, { "epoch": 0.06, "learning_rate": 1.9956055284623176e-05, "loss": 2.5204, "step": 589 }, { "epoch": 0.06, "learning_rate": 1.9955750867661475e-05, "loss": 2.4519, "step": 590 }, { "epoch": 0.06, "learning_rate": 1.9955445402284538e-05, "loss": 2.578, "step": 591 }, { "epoch": 0.06, "learning_rate": 1.9955138888524543e-05, "loss": 2.5777, "step": 592 }, { "epoch": 0.06, "learning_rate": 1.9954831326413764e-05, "loss": 2.5298, "step": 593 }, { "epoch": 0.06, "learning_rate": 1.9954522715984584e-05, "loss": 2.4366, "step": 594 }, { "epoch": 0.06, "learning_rate": 1.995421305726951e-05, "loss": 2.5709, "step": 595 }, { "epoch": 0.06, "learning_rate": 1.9953902350301146e-05, "loss": 2.5624, "step": 596 }, { "epoch": 0.06, "learning_rate": 1.9953590595112217e-05, "loss": 2.5055, "step": 597 }, { "epoch": 0.06, "learning_rate": 1.9953277791735544e-05, "loss": 2.5771, "step": 598 }, { "epoch": 0.06, "learning_rate": 1.9952963940204077e-05, "loss": 2.4554, "step": 599 }, { "epoch": 0.06, "learning_rate": 1.9952649040550866e-05, "loss": 2.5577, "step": 600 }, { "epoch": 0.06, "learning_rate": 1.9952333092809067e-05, "loss": 2.4373, "step": 601 }, { "epoch": 0.06, "learning_rate": 1.9952016097011952e-05, "loss": 2.42, "step": 602 }, { "epoch": 0.06, "learning_rate": 1.995169805319291e-05, "loss": 2.4544, "step": 603 }, { "epoch": 0.06, "learning_rate": 1.9951378961385424e-05, "loss": 2.4869, "step": 604 }, { "epoch": 0.06, "learning_rate": 1.9951058821623102e-05, "loss": 2.489, "step": 605 }, { "epoch": 0.06, "learning_rate": 1.9950737633939658e-05, "loss": 2.4768, "step": 606 }, { "epoch": 0.06, "learning_rate": 1.9950415398368915e-05, "loss": 2.3792, "step": 607 }, { "epoch": 0.06, "learning_rate": 1.9950092114944802e-05, "loss": 2.4233, "step": 608 }, { "epoch": 0.06, "learning_rate": 1.994976778370137e-05, "loss": 2.4006, "step": 609 }, { "epoch": 0.06, "learning_rate": 1.994944240467277e-05, "loss": 2.4594, "step": 610 }, { "epoch": 0.06, "learning_rate": 1.994911597789327e-05, "loss": 2.4967, "step": 611 }, { "epoch": 0.06, "learning_rate": 1.9948788503397235e-05, "loss": 2.5595, "step": 612 }, { "epoch": 0.06, "learning_rate": 1.9948459981219166e-05, "loss": 2.5119, "step": 613 }, { "epoch": 0.06, "learning_rate": 1.994813041139365e-05, "loss": 2.4373, "step": 614 }, { "epoch": 0.06, "learning_rate": 1.994779979395539e-05, "loss": 2.5018, "step": 615 }, { "epoch": 0.06, "learning_rate": 1.994746812893921e-05, "loss": 2.4677, "step": 616 }, { "epoch": 0.06, "learning_rate": 1.994713541638003e-05, "loss": 2.5976, "step": 617 }, { "epoch": 0.06, "learning_rate": 1.994680165631289e-05, "loss": 2.4473, "step": 618 }, { "epoch": 0.06, "learning_rate": 1.9946466848772943e-05, "loss": 2.4516, "step": 619 }, { "epoch": 0.06, "learning_rate": 1.994613099379544e-05, "loss": 2.4761, "step": 620 }, { "epoch": 0.06, "learning_rate": 1.9945794091415748e-05, "loss": 2.4801, "step": 621 }, { "epoch": 0.06, "learning_rate": 1.9945456141669354e-05, "loss": 2.5862, "step": 622 }, { "epoch": 0.06, "learning_rate": 1.9945117144591834e-05, "loss": 2.4868, "step": 623 }, { "epoch": 0.06, "learning_rate": 1.9944777100218898e-05, "loss": 2.4273, "step": 624 }, { "epoch": 0.06, "learning_rate": 1.994443600858635e-05, "loss": 2.3495, "step": 625 }, { "epoch": 0.06, "learning_rate": 1.994409386973011e-05, "loss": 2.2988, "step": 626 }, { "epoch": 0.06, "learning_rate": 1.9943750683686205e-05, "loss": 2.5089, "step": 627 }, { "epoch": 0.06, "learning_rate": 1.9943406450490783e-05, "loss": 2.4375, "step": 628 }, { "epoch": 0.06, "learning_rate": 1.994306117018009e-05, "loss": 2.483, "step": 629 }, { "epoch": 0.06, "learning_rate": 1.9942714842790484e-05, "loss": 2.5405, "step": 630 }, { "epoch": 0.06, "learning_rate": 1.9942367468358436e-05, "loss": 2.4379, "step": 631 }, { "epoch": 0.06, "learning_rate": 1.9942019046920535e-05, "loss": 2.5394, "step": 632 }, { "epoch": 0.06, "learning_rate": 1.994166957851346e-05, "loss": 2.392, "step": 633 }, { "epoch": 0.06, "learning_rate": 1.994131906317402e-05, "loss": 2.552, "step": 634 }, { "epoch": 0.06, "learning_rate": 1.994096750093913e-05, "loss": 2.4712, "step": 635 }, { "epoch": 0.06, "learning_rate": 1.994061489184581e-05, "loss": 2.4824, "step": 636 }, { "epoch": 0.06, "learning_rate": 1.9940261235931188e-05, "loss": 2.4267, "step": 637 }, { "epoch": 0.06, "learning_rate": 1.9939906533232507e-05, "loss": 2.515, "step": 638 }, { "epoch": 0.06, "learning_rate": 1.9939550783787123e-05, "loss": 2.4856, "step": 639 }, { "epoch": 0.06, "learning_rate": 1.99391939876325e-05, "loss": 2.5152, "step": 640 }, { "epoch": 0.06, "learning_rate": 1.993883614480621e-05, "loss": 2.4609, "step": 641 }, { "epoch": 0.06, "learning_rate": 1.9938477255345935e-05, "loss": 2.4234, "step": 642 }, { "epoch": 0.06, "learning_rate": 1.993811731928947e-05, "loss": 2.4664, "step": 643 }, { "epoch": 0.06, "learning_rate": 1.993775633667472e-05, "loss": 2.5028, "step": 644 }, { "epoch": 0.06, "learning_rate": 1.9937394307539693e-05, "loss": 2.535, "step": 645 }, { "epoch": 0.06, "learning_rate": 1.993703123192252e-05, "loss": 2.6574, "step": 646 }, { "epoch": 0.06, "learning_rate": 1.993666710986144e-05, "loss": 2.3997, "step": 647 }, { "epoch": 0.06, "learning_rate": 1.9936301941394786e-05, "loss": 2.5471, "step": 648 }, { "epoch": 0.07, "learning_rate": 1.993593572656102e-05, "loss": 2.4903, "step": 649 }, { "epoch": 0.07, "learning_rate": 1.9935568465398707e-05, "loss": 2.5552, "step": 650 }, { "epoch": 0.07, "learning_rate": 1.993520015794652e-05, "loss": 2.5171, "step": 651 }, { "epoch": 0.07, "learning_rate": 1.9934830804243245e-05, "loss": 2.4222, "step": 652 }, { "epoch": 0.07, "learning_rate": 1.993446040432778e-05, "loss": 2.3696, "step": 653 }, { "epoch": 0.07, "learning_rate": 1.9934088958239127e-05, "loss": 2.57, "step": 654 }, { "epoch": 0.07, "learning_rate": 1.993371646601641e-05, "loss": 2.5116, "step": 655 }, { "epoch": 0.07, "learning_rate": 1.9933342927698845e-05, "loss": 2.3706, "step": 656 }, { "epoch": 0.07, "learning_rate": 1.9932968343325774e-05, "loss": 2.467, "step": 657 }, { "epoch": 0.07, "learning_rate": 1.993259271293664e-05, "loss": 2.5279, "step": 658 }, { "epoch": 0.07, "learning_rate": 1.9932216036571006e-05, "loss": 2.4754, "step": 659 }, { "epoch": 0.07, "learning_rate": 1.9931838314268534e-05, "loss": 2.5019, "step": 660 }, { "epoch": 0.07, "learning_rate": 1.9931459546069004e-05, "loss": 2.4805, "step": 661 }, { "epoch": 0.07, "learning_rate": 1.9931079732012296e-05, "loss": 2.444, "step": 662 }, { "epoch": 0.07, "learning_rate": 1.9930698872138418e-05, "loss": 2.4675, "step": 663 }, { "epoch": 0.07, "learning_rate": 1.993031696648747e-05, "loss": 2.4565, "step": 664 }, { "epoch": 0.07, "learning_rate": 1.992993401509967e-05, "loss": 2.4008, "step": 665 }, { "epoch": 0.07, "learning_rate": 1.992955001801535e-05, "loss": 2.4534, "step": 666 }, { "epoch": 0.07, "learning_rate": 1.9929164975274942e-05, "loss": 2.5633, "step": 667 }, { "epoch": 0.07, "learning_rate": 1.9928778886918998e-05, "loss": 2.4938, "step": 668 }, { "epoch": 0.07, "learning_rate": 1.9928391752988176e-05, "loss": 2.4902, "step": 669 }, { "epoch": 0.07, "learning_rate": 1.992800357352324e-05, "loss": 2.4448, "step": 670 }, { "epoch": 0.07, "learning_rate": 1.9927614348565073e-05, "loss": 2.4471, "step": 671 }, { "epoch": 0.07, "learning_rate": 1.992722407815466e-05, "loss": 2.4865, "step": 672 }, { "epoch": 0.07, "learning_rate": 1.9926832762333103e-05, "loss": 2.4832, "step": 673 }, { "epoch": 0.07, "learning_rate": 1.9926440401141606e-05, "loss": 2.5086, "step": 674 }, { "epoch": 0.07, "learning_rate": 1.9926046994621494e-05, "loss": 2.5102, "step": 675 }, { "epoch": 0.07, "learning_rate": 1.9925652542814186e-05, "loss": 2.4231, "step": 676 }, { "epoch": 0.07, "learning_rate": 1.992525704576123e-05, "loss": 2.4154, "step": 677 }, { "epoch": 0.07, "learning_rate": 1.992486050350427e-05, "loss": 2.4144, "step": 678 }, { "epoch": 0.07, "learning_rate": 1.9924462916085067e-05, "loss": 2.3594, "step": 679 }, { "epoch": 0.07, "learning_rate": 1.9924064283545485e-05, "loss": 2.5373, "step": 680 }, { "epoch": 0.07, "learning_rate": 1.9923664605927508e-05, "loss": 2.5568, "step": 681 }, { "epoch": 0.07, "learning_rate": 1.9923263883273226e-05, "loss": 2.4461, "step": 682 }, { "epoch": 0.07, "learning_rate": 1.9922862115624837e-05, "loss": 2.5864, "step": 683 }, { "epoch": 0.07, "learning_rate": 1.9922459303024647e-05, "loss": 2.4412, "step": 684 }, { "epoch": 0.07, "learning_rate": 1.992205544551508e-05, "loss": 2.4555, "step": 685 }, { "epoch": 0.07, "learning_rate": 1.9921650543138657e-05, "loss": 2.5765, "step": 686 }, { "epoch": 0.07, "learning_rate": 1.9921244595938028e-05, "loss": 2.44, "step": 687 }, { "epoch": 0.07, "learning_rate": 1.9920837603955933e-05, "loss": 2.4603, "step": 688 }, { "epoch": 0.07, "learning_rate": 1.9920429567235236e-05, "loss": 2.4852, "step": 689 }, { "epoch": 0.07, "learning_rate": 1.992002048581891e-05, "loss": 2.5298, "step": 690 }, { "epoch": 0.07, "learning_rate": 1.9919610359750026e-05, "loss": 2.4307, "step": 691 }, { "epoch": 0.07, "learning_rate": 1.9919199189071782e-05, "loss": 2.4184, "step": 692 }, { "epoch": 0.07, "learning_rate": 1.9918786973827465e-05, "loss": 2.4742, "step": 693 }, { "epoch": 0.07, "learning_rate": 1.99183737140605e-05, "loss": 2.5088, "step": 694 }, { "epoch": 0.07, "learning_rate": 1.9917959409814394e-05, "loss": 2.4525, "step": 695 }, { "epoch": 0.07, "learning_rate": 1.9917544061132784e-05, "loss": 2.3996, "step": 696 }, { "epoch": 0.07, "learning_rate": 1.9917127668059405e-05, "loss": 2.4853, "step": 697 }, { "epoch": 0.07, "learning_rate": 1.9916710230638106e-05, "loss": 2.4421, "step": 698 }, { "epoch": 0.07, "learning_rate": 1.9916291748912847e-05, "loss": 2.4668, "step": 699 }, { "epoch": 0.07, "learning_rate": 1.99158722229277e-05, "loss": 2.3954, "step": 700 }, { "epoch": 0.07, "learning_rate": 1.9915451652726844e-05, "loss": 2.3597, "step": 701 }, { "epoch": 0.07, "learning_rate": 1.9915030038354564e-05, "loss": 2.5351, "step": 702 }, { "epoch": 0.07, "learning_rate": 1.9914607379855262e-05, "loss": 2.6089, "step": 703 }, { "epoch": 0.07, "learning_rate": 1.9914183677273447e-05, "loss": 2.3936, "step": 704 }, { "epoch": 0.07, "learning_rate": 1.9913758930653735e-05, "loss": 2.5455, "step": 705 }, { "epoch": 0.07, "learning_rate": 1.991333314004086e-05, "loss": 2.4613, "step": 706 }, { "epoch": 0.07, "learning_rate": 1.991290630547966e-05, "loss": 2.5119, "step": 707 }, { "epoch": 0.07, "learning_rate": 1.991247842701508e-05, "loss": 2.5179, "step": 708 }, { "epoch": 0.07, "learning_rate": 1.9912049504692187e-05, "loss": 2.4332, "step": 709 }, { "epoch": 0.07, "learning_rate": 1.9911619538556138e-05, "loss": 2.4755, "step": 710 }, { "epoch": 0.07, "learning_rate": 1.991118852865222e-05, "loss": 2.5133, "step": 711 }, { "epoch": 0.07, "learning_rate": 1.991075647502582e-05, "loss": 2.4888, "step": 712 }, { "epoch": 0.07, "learning_rate": 1.9910323377722435e-05, "loss": 2.4646, "step": 713 }, { "epoch": 0.07, "learning_rate": 1.9909889236787675e-05, "loss": 2.4977, "step": 714 }, { "epoch": 0.07, "learning_rate": 1.990945405226726e-05, "loss": 2.4874, "step": 715 }, { "epoch": 0.07, "learning_rate": 1.990901782420701e-05, "loss": 2.426, "step": 716 }, { "epoch": 0.07, "learning_rate": 1.9908580552652874e-05, "loss": 2.5031, "step": 717 }, { "epoch": 0.07, "learning_rate": 1.990814223765089e-05, "loss": 2.483, "step": 718 }, { "epoch": 0.07, "learning_rate": 1.9907702879247224e-05, "loss": 2.5668, "step": 719 }, { "epoch": 0.07, "learning_rate": 1.990726247748814e-05, "loss": 2.4303, "step": 720 }, { "epoch": 0.07, "learning_rate": 1.9906821032420018e-05, "loss": 2.544, "step": 721 }, { "epoch": 0.07, "learning_rate": 1.990637854408934e-05, "loss": 2.5572, "step": 722 }, { "epoch": 0.07, "learning_rate": 1.990593501254271e-05, "loss": 2.4689, "step": 723 }, { "epoch": 0.07, "learning_rate": 1.990549043782683e-05, "loss": 2.4274, "step": 724 }, { "epoch": 0.07, "learning_rate": 1.990504481998852e-05, "loss": 2.5979, "step": 725 }, { "epoch": 0.07, "learning_rate": 1.9904598159074706e-05, "loss": 2.5966, "step": 726 }, { "epoch": 0.07, "learning_rate": 1.9904150455132424e-05, "loss": 2.3793, "step": 727 }, { "epoch": 0.07, "learning_rate": 1.990370170820882e-05, "loss": 2.4348, "step": 728 }, { "epoch": 0.07, "learning_rate": 1.9903251918351155e-05, "loss": 2.4944, "step": 729 }, { "epoch": 0.07, "learning_rate": 1.990280108560679e-05, "loss": 2.3645, "step": 730 }, { "epoch": 0.07, "learning_rate": 1.9902349210023203e-05, "loss": 2.4637, "step": 731 }, { "epoch": 0.07, "learning_rate": 1.990189629164798e-05, "loss": 2.3831, "step": 732 }, { "epoch": 0.07, "learning_rate": 1.9901442330528814e-05, "loss": 2.4449, "step": 733 }, { "epoch": 0.07, "learning_rate": 1.990098732671352e-05, "loss": 2.4393, "step": 734 }, { "epoch": 0.07, "learning_rate": 1.990053128025e-05, "loss": 2.4796, "step": 735 }, { "epoch": 0.07, "learning_rate": 1.990007419118629e-05, "loss": 2.4601, "step": 736 }, { "epoch": 0.07, "learning_rate": 1.9899616059570518e-05, "loss": 2.5696, "step": 737 }, { "epoch": 0.07, "learning_rate": 1.9899156885450933e-05, "loss": 2.5292, "step": 738 }, { "epoch": 0.07, "learning_rate": 1.9898696668875886e-05, "loss": 2.399, "step": 739 }, { "epoch": 0.07, "learning_rate": 1.9898235409893844e-05, "loss": 2.3939, "step": 740 }, { "epoch": 0.07, "learning_rate": 1.9897773108553378e-05, "loss": 2.39, "step": 741 }, { "epoch": 0.07, "learning_rate": 1.9897309764903174e-05, "loss": 2.4454, "step": 742 }, { "epoch": 0.07, "learning_rate": 1.9896845378992026e-05, "loss": 2.4445, "step": 743 }, { "epoch": 0.07, "learning_rate": 1.9896379950868837e-05, "loss": 2.514, "step": 744 }, { "epoch": 0.07, "learning_rate": 1.9895913480582624e-05, "loss": 2.462, "step": 745 }, { "epoch": 0.07, "learning_rate": 1.98954459681825e-05, "loss": 2.4631, "step": 746 }, { "epoch": 0.07, "learning_rate": 1.9894977413717704e-05, "loss": 2.4677, "step": 747 }, { "epoch": 0.07, "learning_rate": 1.9894507817237577e-05, "loss": 2.546, "step": 748 }, { "epoch": 0.08, "learning_rate": 1.9894037178791573e-05, "loss": 2.4689, "step": 749 }, { "epoch": 0.08, "learning_rate": 1.989356549842925e-05, "loss": 2.4342, "step": 750 }, { "epoch": 0.08, "learning_rate": 1.9893092776200284e-05, "loss": 2.3229, "step": 751 }, { "epoch": 0.08, "learning_rate": 1.9892619012154454e-05, "loss": 2.5159, "step": 752 }, { "epoch": 0.08, "learning_rate": 1.989214420634165e-05, "loss": 2.4091, "step": 753 }, { "epoch": 0.08, "learning_rate": 1.989166835881187e-05, "loss": 2.497, "step": 754 }, { "epoch": 0.08, "learning_rate": 1.989119146961523e-05, "loss": 2.3891, "step": 755 }, { "epoch": 0.08, "learning_rate": 1.9890713538801952e-05, "loss": 2.5451, "step": 756 }, { "epoch": 0.08, "learning_rate": 1.9890234566422358e-05, "loss": 2.5554, "step": 757 }, { "epoch": 0.08, "learning_rate": 1.988975455252689e-05, "loss": 2.5993, "step": 758 }, { "epoch": 0.08, "learning_rate": 1.98892734971661e-05, "loss": 2.3485, "step": 759 }, { "epoch": 0.08, "learning_rate": 1.988879140039064e-05, "loss": 2.4788, "step": 760 }, { "epoch": 0.08, "learning_rate": 1.9888308262251286e-05, "loss": 2.375, "step": 761 }, { "epoch": 0.08, "learning_rate": 1.9887824082798916e-05, "loss": 2.5171, "step": 762 }, { "epoch": 0.08, "learning_rate": 1.9887338862084512e-05, "loss": 2.4336, "step": 763 }, { "epoch": 0.08, "learning_rate": 1.9886852600159174e-05, "loss": 2.4599, "step": 764 }, { "epoch": 0.08, "learning_rate": 1.9886365297074107e-05, "loss": 2.4154, "step": 765 }, { "epoch": 0.08, "learning_rate": 1.988587695288063e-05, "loss": 2.5439, "step": 766 }, { "epoch": 0.08, "learning_rate": 1.9885387567630174e-05, "loss": 2.5763, "step": 767 }, { "epoch": 0.08, "learning_rate": 1.9884897141374266e-05, "loss": 2.4262, "step": 768 }, { "epoch": 0.08, "learning_rate": 1.9884405674164557e-05, "loss": 2.5104, "step": 769 }, { "epoch": 0.08, "learning_rate": 1.9883913166052803e-05, "loss": 2.4405, "step": 770 }, { "epoch": 0.08, "learning_rate": 1.9883419617090863e-05, "loss": 2.4546, "step": 771 }, { "epoch": 0.08, "learning_rate": 1.9882925027330718e-05, "loss": 2.4822, "step": 772 }, { "epoch": 0.08, "learning_rate": 1.9882429396824447e-05, "loss": 2.4114, "step": 773 }, { "epoch": 0.08, "learning_rate": 1.9881932725624247e-05, "loss": 2.4067, "step": 774 }, { "epoch": 0.08, "learning_rate": 1.9881435013782417e-05, "loss": 2.4351, "step": 775 }, { "epoch": 0.08, "learning_rate": 1.9880936261351375e-05, "loss": 2.4951, "step": 776 }, { "epoch": 0.08, "learning_rate": 1.988043646838364e-05, "loss": 2.4349, "step": 777 }, { "epoch": 0.08, "learning_rate": 1.9879935634931847e-05, "loss": 2.3933, "step": 778 }, { "epoch": 0.08, "learning_rate": 1.9879433761048734e-05, "loss": 2.3671, "step": 779 }, { "epoch": 0.08, "learning_rate": 1.9878930846787154e-05, "loss": 2.5079, "step": 780 }, { "epoch": 0.08, "learning_rate": 1.9878426892200068e-05, "loss": 2.4366, "step": 781 }, { "epoch": 0.08, "learning_rate": 1.9877921897340544e-05, "loss": 2.5014, "step": 782 }, { "epoch": 0.08, "learning_rate": 1.9877415862261764e-05, "loss": 2.4732, "step": 783 }, { "epoch": 0.08, "learning_rate": 1.9876908787017015e-05, "loss": 2.5147, "step": 784 }, { "epoch": 0.08, "learning_rate": 1.98764006716597e-05, "loss": 2.4848, "step": 785 }, { "epoch": 0.08, "learning_rate": 1.987589151624332e-05, "loss": 2.5249, "step": 786 }, { "epoch": 0.08, "learning_rate": 1.9875381320821502e-05, "loss": 2.4381, "step": 787 }, { "epoch": 0.08, "learning_rate": 1.987487008544797e-05, "loss": 2.6981, "step": 788 }, { "epoch": 0.08, "learning_rate": 1.9874357810176558e-05, "loss": 2.4923, "step": 789 }, { "epoch": 0.08, "learning_rate": 1.9873844495061213e-05, "loss": 2.5115, "step": 790 }, { "epoch": 0.08, "learning_rate": 1.987333014015599e-05, "loss": 2.4483, "step": 791 }, { "epoch": 0.08, "learning_rate": 1.987281474551506e-05, "loss": 2.4953, "step": 792 }, { "epoch": 0.08, "learning_rate": 1.9872298311192696e-05, "loss": 2.4601, "step": 793 }, { "epoch": 0.08, "learning_rate": 1.9871780837243276e-05, "loss": 2.4553, "step": 794 }, { "epoch": 0.08, "learning_rate": 1.9871262323721305e-05, "loss": 2.381, "step": 795 }, { "epoch": 0.08, "learning_rate": 1.9870742770681378e-05, "loss": 2.4812, "step": 796 }, { "epoch": 0.08, "learning_rate": 1.987022217817821e-05, "loss": 2.4848, "step": 797 }, { "epoch": 0.08, "learning_rate": 1.986970054626662e-05, "loss": 2.4769, "step": 798 }, { "epoch": 0.08, "learning_rate": 1.9869177875001545e-05, "loss": 2.3616, "step": 799 }, { "epoch": 0.08, "learning_rate": 1.9868654164438026e-05, "loss": 2.5009, "step": 800 }, { "epoch": 0.08, "learning_rate": 1.986812941463121e-05, "loss": 2.4694, "step": 801 }, { "epoch": 0.08, "learning_rate": 1.986760362563636e-05, "loss": 2.4819, "step": 802 }, { "epoch": 0.08, "learning_rate": 1.9867076797508848e-05, "loss": 2.3373, "step": 803 }, { "epoch": 0.08, "learning_rate": 1.9866548930304145e-05, "loss": 2.4227, "step": 804 }, { "epoch": 0.08, "learning_rate": 1.9866020024077844e-05, "loss": 2.3986, "step": 805 }, { "epoch": 0.08, "learning_rate": 1.9865490078885643e-05, "loss": 2.4474, "step": 806 }, { "epoch": 0.08, "learning_rate": 1.986495909478335e-05, "loss": 2.4272, "step": 807 }, { "epoch": 0.08, "learning_rate": 1.986442707182688e-05, "loss": 2.3572, "step": 808 }, { "epoch": 0.08, "learning_rate": 1.9863894010072257e-05, "loss": 2.5565, "step": 809 }, { "epoch": 0.08, "learning_rate": 1.9863359909575622e-05, "loss": 2.4443, "step": 810 }, { "epoch": 0.08, "learning_rate": 1.9862824770393218e-05, "loss": 2.4679, "step": 811 }, { "epoch": 0.08, "learning_rate": 1.9862288592581395e-05, "loss": 2.5257, "step": 812 }, { "epoch": 0.08, "learning_rate": 1.986175137619662e-05, "loss": 2.449, "step": 813 }, { "epoch": 0.08, "learning_rate": 1.9861213121295465e-05, "loss": 2.4766, "step": 814 }, { "epoch": 0.08, "learning_rate": 1.9860673827934615e-05, "loss": 2.5498, "step": 815 }, { "epoch": 0.08, "learning_rate": 1.9860133496170857e-05, "loss": 2.5213, "step": 816 }, { "epoch": 0.08, "learning_rate": 1.9859592126061095e-05, "loss": 2.528, "step": 817 }, { "epoch": 0.08, "learning_rate": 1.9859049717662337e-05, "loss": 2.4627, "step": 818 }, { "epoch": 0.08, "learning_rate": 1.9858506271031705e-05, "loss": 2.4724, "step": 819 }, { "epoch": 0.08, "learning_rate": 1.9857961786226426e-05, "loss": 2.4431, "step": 820 }, { "epoch": 0.08, "learning_rate": 1.9857416263303845e-05, "loss": 2.4888, "step": 821 }, { "epoch": 0.08, "learning_rate": 1.9856869702321398e-05, "loss": 2.4897, "step": 822 }, { "epoch": 0.08, "learning_rate": 1.9856322103336653e-05, "loss": 2.4868, "step": 823 }, { "epoch": 0.08, "learning_rate": 1.9855773466407268e-05, "loss": 2.5493, "step": 824 }, { "epoch": 0.08, "learning_rate": 1.9855223791591025e-05, "loss": 2.4968, "step": 825 }, { "epoch": 0.08, "learning_rate": 1.9854673078945803e-05, "loss": 2.493, "step": 826 }, { "epoch": 0.08, "learning_rate": 1.98541213285296e-05, "loss": 2.405, "step": 827 }, { "epoch": 0.08, "learning_rate": 1.985356854040052e-05, "loss": 2.4369, "step": 828 }, { "epoch": 0.08, "learning_rate": 1.985301471461677e-05, "loss": 2.4622, "step": 829 }, { "epoch": 0.08, "learning_rate": 1.985245985123668e-05, "loss": 2.5218, "step": 830 }, { "epoch": 0.08, "learning_rate": 1.9851903950318678e-05, "loss": 2.4133, "step": 831 }, { "epoch": 0.08, "learning_rate": 1.9851347011921304e-05, "loss": 2.4688, "step": 832 }, { "epoch": 0.08, "learning_rate": 1.9850789036103207e-05, "loss": 2.5139, "step": 833 }, { "epoch": 0.08, "learning_rate": 1.9850230022923148e-05, "loss": 2.4202, "step": 834 }, { "epoch": 0.08, "learning_rate": 1.984966997243999e-05, "loss": 2.4866, "step": 835 }, { "epoch": 0.08, "learning_rate": 1.984910888471272e-05, "loss": 2.5632, "step": 836 }, { "epoch": 0.08, "learning_rate": 1.9848546759800416e-05, "loss": 2.609, "step": 837 }, { "epoch": 0.08, "learning_rate": 1.984798359776228e-05, "loss": 2.5892, "step": 838 }, { "epoch": 0.08, "learning_rate": 1.9847419398657616e-05, "loss": 2.4333, "step": 839 }, { "epoch": 0.08, "learning_rate": 1.984685416254583e-05, "loss": 2.3877, "step": 840 }, { "epoch": 0.08, "learning_rate": 1.984628788948646e-05, "loss": 2.4043, "step": 841 }, { "epoch": 0.08, "learning_rate": 1.984572057953913e-05, "loss": 2.4735, "step": 842 }, { "epoch": 0.08, "learning_rate": 1.984515223276358e-05, "loss": 2.4709, "step": 843 }, { "epoch": 0.08, "learning_rate": 1.984458284921967e-05, "loss": 2.4564, "step": 844 }, { "epoch": 0.08, "learning_rate": 1.984401242896735e-05, "loss": 2.4843, "step": 845 }, { "epoch": 0.08, "learning_rate": 1.9843440972066696e-05, "loss": 2.4175, "step": 846 }, { "epoch": 0.08, "learning_rate": 1.9842868478577886e-05, "loss": 2.612, "step": 847 }, { "epoch": 0.08, "learning_rate": 1.9842294948561208e-05, "loss": 2.4113, "step": 848 }, { "epoch": 0.09, "learning_rate": 1.9841720382077055e-05, "loss": 2.4621, "step": 849 }, { "epoch": 0.09, "learning_rate": 1.9841144779185936e-05, "loss": 2.463, "step": 850 }, { "epoch": 0.09, "learning_rate": 1.984056813994847e-05, "loss": 2.4984, "step": 851 }, { "epoch": 0.09, "learning_rate": 1.9839990464425376e-05, "loss": 2.4712, "step": 852 }, { "epoch": 0.09, "learning_rate": 1.983941175267749e-05, "loss": 2.459, "step": 853 }, { "epoch": 0.09, "learning_rate": 1.9838832004765754e-05, "loss": 2.3685, "step": 854 }, { "epoch": 0.09, "learning_rate": 1.983825122075122e-05, "loss": 2.5373, "step": 855 }, { "epoch": 0.09, "learning_rate": 1.9837669400695048e-05, "loss": 2.4083, "step": 856 }, { "epoch": 0.09, "learning_rate": 1.983708654465851e-05, "loss": 2.4044, "step": 857 }, { "epoch": 0.09, "learning_rate": 1.9836502652702984e-05, "loss": 2.4533, "step": 858 }, { "epoch": 0.09, "learning_rate": 1.9835917724889957e-05, "loss": 2.5148, "step": 859 }, { "epoch": 0.09, "learning_rate": 1.983533176128103e-05, "loss": 2.4216, "step": 860 }, { "epoch": 0.09, "learning_rate": 1.9834744761937905e-05, "loss": 2.4482, "step": 861 }, { "epoch": 0.09, "learning_rate": 1.98341567269224e-05, "loss": 2.3908, "step": 862 }, { "epoch": 0.09, "learning_rate": 1.983356765629644e-05, "loss": 2.442, "step": 863 }, { "epoch": 0.09, "learning_rate": 1.9832977550122056e-05, "loss": 2.369, "step": 864 }, { "epoch": 0.09, "learning_rate": 1.9832386408461393e-05, "loss": 2.5018, "step": 865 }, { "epoch": 0.09, "learning_rate": 1.98317942313767e-05, "loss": 2.4463, "step": 866 }, { "epoch": 0.09, "learning_rate": 1.9831201018930343e-05, "loss": 2.4414, "step": 867 }, { "epoch": 0.09, "learning_rate": 1.9830606771184785e-05, "loss": 2.4237, "step": 868 }, { "epoch": 0.09, "learning_rate": 1.9830011488202606e-05, "loss": 2.4054, "step": 869 }, { "epoch": 0.09, "learning_rate": 1.9829415170046497e-05, "loss": 2.5519, "step": 870 }, { "epoch": 0.09, "learning_rate": 1.9828817816779257e-05, "loss": 2.4888, "step": 871 }, { "epoch": 0.09, "learning_rate": 1.9828219428463783e-05, "loss": 2.5177, "step": 872 }, { "epoch": 0.09, "learning_rate": 1.9827620005163097e-05, "loss": 2.4215, "step": 873 }, { "epoch": 0.09, "learning_rate": 1.982701954694032e-05, "loss": 2.4626, "step": 874 }, { "epoch": 0.09, "learning_rate": 1.9826418053858688e-05, "loss": 2.4411, "step": 875 }, { "epoch": 0.09, "learning_rate": 1.9825815525981538e-05, "loss": 2.5298, "step": 876 }, { "epoch": 0.09, "learning_rate": 1.982521196337232e-05, "loss": 2.5026, "step": 877 }, { "epoch": 0.09, "learning_rate": 1.9824607366094605e-05, "loss": 2.343, "step": 878 }, { "epoch": 0.09, "learning_rate": 1.9824001734212043e-05, "loss": 2.425, "step": 879 }, { "epoch": 0.09, "learning_rate": 1.982339506778843e-05, "loss": 2.5101, "step": 880 }, { "epoch": 0.09, "learning_rate": 1.982278736688764e-05, "loss": 2.5373, "step": 881 }, { "epoch": 0.09, "learning_rate": 1.9822178631573676e-05, "loss": 2.4891, "step": 882 }, { "epoch": 0.09, "learning_rate": 1.9821568861910633e-05, "loss": 2.4746, "step": 883 }, { "epoch": 0.09, "learning_rate": 1.9820958057962736e-05, "loss": 2.519, "step": 884 }, { "epoch": 0.09, "learning_rate": 1.98203462197943e-05, "loss": 2.5301, "step": 885 }, { "epoch": 0.09, "learning_rate": 1.9819733347469757e-05, "loss": 2.4353, "step": 886 }, { "epoch": 0.09, "learning_rate": 1.981911944105365e-05, "loss": 2.4596, "step": 887 }, { "epoch": 0.09, "learning_rate": 1.981850450061062e-05, "loss": 2.4815, "step": 888 }, { "epoch": 0.09, "learning_rate": 1.9817888526205435e-05, "loss": 2.4443, "step": 889 }, { "epoch": 0.09, "learning_rate": 1.981727151790296e-05, "loss": 2.4752, "step": 890 }, { "epoch": 0.09, "learning_rate": 1.9816653475768165e-05, "loss": 2.5356, "step": 891 }, { "epoch": 0.09, "learning_rate": 1.981603439986614e-05, "loss": 2.4629, "step": 892 }, { "epoch": 0.09, "learning_rate": 1.9815414290262072e-05, "loss": 2.4751, "step": 893 }, { "epoch": 0.09, "learning_rate": 1.9814793147021267e-05, "loss": 2.4542, "step": 894 }, { "epoch": 0.09, "learning_rate": 1.9814170970209138e-05, "loss": 2.5082, "step": 895 }, { "epoch": 0.09, "learning_rate": 1.9813547759891202e-05, "loss": 2.4382, "step": 896 }, { "epoch": 0.09, "learning_rate": 1.981292351613309e-05, "loss": 2.4424, "step": 897 }, { "epoch": 0.09, "learning_rate": 1.9812298239000535e-05, "loss": 2.3675, "step": 898 }, { "epoch": 0.09, "learning_rate": 1.981167192855939e-05, "loss": 2.4274, "step": 899 }, { "epoch": 0.09, "learning_rate": 1.9811044584875604e-05, "loss": 2.4396, "step": 900 }, { "epoch": 0.09, "learning_rate": 1.981041620801525e-05, "loss": 2.556, "step": 901 }, { "epoch": 0.09, "learning_rate": 1.9809786798044488e-05, "loss": 2.5381, "step": 902 }, { "epoch": 0.09, "learning_rate": 1.9809156355029607e-05, "loss": 2.5152, "step": 903 }, { "epoch": 0.09, "learning_rate": 1.9808524879036997e-05, "loss": 2.5125, "step": 904 }, { "epoch": 0.09, "learning_rate": 1.9807892370133156e-05, "loss": 2.4861, "step": 905 }, { "epoch": 0.09, "learning_rate": 1.9807258828384695e-05, "loss": 2.471, "step": 906 }, { "epoch": 0.09, "learning_rate": 1.9806624253858326e-05, "loss": 2.5064, "step": 907 }, { "epoch": 0.09, "learning_rate": 1.980598864662088e-05, "loss": 2.4896, "step": 908 }, { "epoch": 0.09, "learning_rate": 1.9805352006739286e-05, "loss": 2.4038, "step": 909 }, { "epoch": 0.09, "learning_rate": 1.9804714334280586e-05, "loss": 2.4535, "step": 910 }, { "epoch": 0.09, "learning_rate": 1.9804075629311938e-05, "loss": 2.4022, "step": 911 }, { "epoch": 0.09, "learning_rate": 1.9803435891900597e-05, "loss": 2.5097, "step": 912 }, { "epoch": 0.09, "learning_rate": 1.9802795122113937e-05, "loss": 2.4925, "step": 913 }, { "epoch": 0.09, "learning_rate": 1.9802153320019432e-05, "loss": 2.4692, "step": 914 }, { "epoch": 0.09, "learning_rate": 1.9801510485684668e-05, "loss": 2.501, "step": 915 }, { "epoch": 0.09, "learning_rate": 1.980086661917734e-05, "loss": 2.4398, "step": 916 }, { "epoch": 0.09, "learning_rate": 1.9800221720565258e-05, "loss": 2.4797, "step": 917 }, { "epoch": 0.09, "learning_rate": 1.979957578991633e-05, "loss": 2.4953, "step": 918 }, { "epoch": 0.09, "learning_rate": 1.9798928827298578e-05, "loss": 2.439, "step": 919 }, { "epoch": 0.09, "learning_rate": 1.979828083278013e-05, "loss": 2.3987, "step": 920 }, { "epoch": 0.09, "learning_rate": 1.9797631806429227e-05, "loss": 2.469, "step": 921 }, { "epoch": 0.09, "learning_rate": 1.9796981748314213e-05, "loss": 2.3867, "step": 922 }, { "epoch": 0.09, "learning_rate": 1.9796330658503553e-05, "loss": 2.4074, "step": 923 }, { "epoch": 0.09, "learning_rate": 1.9795678537065805e-05, "loss": 2.5085, "step": 924 }, { "epoch": 0.09, "learning_rate": 1.979502538406964e-05, "loss": 2.5, "step": 925 }, { "epoch": 0.09, "learning_rate": 1.979437119958384e-05, "loss": 2.4917, "step": 926 }, { "epoch": 0.09, "learning_rate": 1.9793715983677303e-05, "loss": 2.4405, "step": 927 }, { "epoch": 0.09, "learning_rate": 1.9793059736419023e-05, "loss": 2.4696, "step": 928 }, { "epoch": 0.09, "learning_rate": 1.9792402457878106e-05, "loss": 2.4366, "step": 929 }, { "epoch": 0.09, "learning_rate": 1.979174414812377e-05, "loss": 2.5184, "step": 930 }, { "epoch": 0.09, "learning_rate": 1.9791084807225344e-05, "loss": 2.3717, "step": 931 }, { "epoch": 0.09, "learning_rate": 1.9790424435252256e-05, "loss": 2.4147, "step": 932 }, { "epoch": 0.09, "learning_rate": 1.978976303227405e-05, "loss": 2.4834, "step": 933 }, { "epoch": 0.09, "learning_rate": 1.9789100598360374e-05, "loss": 2.4404, "step": 934 }, { "epoch": 0.09, "learning_rate": 1.9788437133580995e-05, "loss": 2.5933, "step": 935 }, { "epoch": 0.09, "learning_rate": 1.9787772638005776e-05, "loss": 2.3761, "step": 936 }, { "epoch": 0.09, "learning_rate": 1.9787107111704687e-05, "loss": 2.4452, "step": 937 }, { "epoch": 0.09, "learning_rate": 1.9786440554747827e-05, "loss": 2.5655, "step": 938 }, { "epoch": 0.09, "learning_rate": 1.9785772967205377e-05, "loss": 2.3618, "step": 939 }, { "epoch": 0.09, "learning_rate": 1.9785104349147647e-05, "loss": 2.487, "step": 940 }, { "epoch": 0.09, "learning_rate": 1.978443470064504e-05, "loss": 2.581, "step": 941 }, { "epoch": 0.09, "learning_rate": 1.978376402176808e-05, "loss": 2.6028, "step": 942 }, { "epoch": 0.09, "learning_rate": 1.9783092312587394e-05, "loss": 2.4249, "step": 943 }, { "epoch": 0.09, "learning_rate": 1.9782419573173718e-05, "loss": 2.4371, "step": 944 }, { "epoch": 0.09, "learning_rate": 1.9781745803597898e-05, "loss": 2.4586, "step": 945 }, { "epoch": 0.09, "learning_rate": 1.9781071003930883e-05, "loss": 2.5464, "step": 946 }, { "epoch": 0.09, "learning_rate": 1.9780395174243735e-05, "loss": 2.4556, "step": 947 }, { "epoch": 0.09, "learning_rate": 1.977971831460763e-05, "loss": 2.5919, "step": 948 }, { "epoch": 0.1, "learning_rate": 1.977904042509384e-05, "loss": 2.4944, "step": 949 }, { "epoch": 0.1, "learning_rate": 1.977836150577375e-05, "loss": 2.4225, "step": 950 }, { "epoch": 0.1, "learning_rate": 1.9777681556718862e-05, "loss": 2.4488, "step": 951 }, { "epoch": 0.1, "learning_rate": 1.977700057800078e-05, "loss": 2.4619, "step": 952 }, { "epoch": 0.1, "learning_rate": 1.9776318569691207e-05, "loss": 2.4552, "step": 953 }, { "epoch": 0.1, "learning_rate": 1.9775635531861976e-05, "loss": 2.5808, "step": 954 }, { "epoch": 0.1, "learning_rate": 1.9774951464585004e-05, "loss": 2.5278, "step": 955 }, { "epoch": 0.1, "learning_rate": 1.9774266367932337e-05, "loss": 2.3608, "step": 956 }, { "epoch": 0.1, "learning_rate": 1.977358024197612e-05, "loss": 2.5201, "step": 957 }, { "epoch": 0.1, "learning_rate": 1.9772893086788598e-05, "loss": 2.4137, "step": 958 }, { "epoch": 0.1, "learning_rate": 1.9772204902442147e-05, "loss": 2.5136, "step": 959 }, { "epoch": 0.1, "learning_rate": 1.977151568900923e-05, "loss": 2.429, "step": 960 }, { "epoch": 0.1, "learning_rate": 1.9770825446562426e-05, "loss": 2.4269, "step": 961 }, { "epoch": 0.1, "learning_rate": 1.9770134175174425e-05, "loss": 2.5085, "step": 962 }, { "epoch": 0.1, "learning_rate": 1.9769441874918024e-05, "loss": 2.5548, "step": 963 }, { "epoch": 0.1, "learning_rate": 1.9768748545866125e-05, "loss": 2.4423, "step": 964 }, { "epoch": 0.1, "learning_rate": 1.9768054188091742e-05, "loss": 2.522, "step": 965 }, { "epoch": 0.1, "learning_rate": 1.9767358801668e-05, "loss": 2.4583, "step": 966 }, { "epoch": 0.1, "learning_rate": 1.9766662386668116e-05, "loss": 2.4423, "step": 967 }, { "epoch": 0.1, "learning_rate": 1.9765964943165442e-05, "loss": 2.5134, "step": 968 }, { "epoch": 0.1, "learning_rate": 1.9765266471233416e-05, "loss": 2.4979, "step": 969 }, { "epoch": 0.1, "learning_rate": 1.9764566970945594e-05, "loss": 2.5036, "step": 970 }, { "epoch": 0.1, "learning_rate": 1.976386644237564e-05, "loss": 2.4452, "step": 971 }, { "epoch": 0.1, "learning_rate": 1.9763164885597326e-05, "loss": 2.3947, "step": 972 }, { "epoch": 0.1, "learning_rate": 1.9762462300684525e-05, "loss": 2.3559, "step": 973 }, { "epoch": 0.1, "learning_rate": 1.9761758687711233e-05, "loss": 2.4651, "step": 974 }, { "epoch": 0.1, "learning_rate": 1.976105404675154e-05, "loss": 2.5634, "step": 975 }, { "epoch": 0.1, "learning_rate": 1.976034837787965e-05, "loss": 2.4293, "step": 976 }, { "epoch": 0.1, "learning_rate": 1.9759641681169878e-05, "loss": 2.5847, "step": 977 }, { "epoch": 0.1, "learning_rate": 1.975893395669664e-05, "loss": 2.4579, "step": 978 }, { "epoch": 0.1, "learning_rate": 1.975822520453447e-05, "loss": 2.5722, "step": 979 }, { "epoch": 0.1, "learning_rate": 1.9757515424758003e-05, "loss": 2.3393, "step": 980 }, { "epoch": 0.1, "learning_rate": 1.975680461744198e-05, "loss": 2.5065, "step": 981 }, { "epoch": 0.1, "learning_rate": 1.9756092782661266e-05, "loss": 2.4205, "step": 982 }, { "epoch": 0.1, "learning_rate": 1.975537992049081e-05, "loss": 2.4817, "step": 983 }, { "epoch": 0.1, "learning_rate": 1.9754666031005685e-05, "loss": 2.4021, "step": 984 }, { "epoch": 0.1, "learning_rate": 1.9753951114281072e-05, "loss": 2.439, "step": 985 }, { "epoch": 0.1, "learning_rate": 1.9753235170392253e-05, "loss": 2.4722, "step": 986 }, { "epoch": 0.1, "learning_rate": 1.975251819941463e-05, "loss": 2.4749, "step": 987 }, { "epoch": 0.1, "learning_rate": 1.9751800201423696e-05, "loss": 2.5006, "step": 988 }, { "epoch": 0.1, "learning_rate": 1.9751081176495065e-05, "loss": 2.4535, "step": 989 }, { "epoch": 0.1, "learning_rate": 1.9750361124704456e-05, "loss": 2.4629, "step": 990 }, { "epoch": 0.1, "learning_rate": 1.9749640046127697e-05, "loss": 2.454, "step": 991 }, { "epoch": 0.1, "learning_rate": 1.9748917940840724e-05, "loss": 2.4939, "step": 992 }, { "epoch": 0.1, "learning_rate": 1.9748194808919577e-05, "loss": 2.3416, "step": 993 }, { "epoch": 0.1, "learning_rate": 1.9747470650440407e-05, "loss": 2.5071, "step": 994 }, { "epoch": 0.1, "learning_rate": 1.9746745465479477e-05, "loss": 2.5432, "step": 995 }, { "epoch": 0.1, "learning_rate": 1.9746019254113153e-05, "loss": 2.4846, "step": 996 }, { "epoch": 0.1, "learning_rate": 1.9745292016417908e-05, "loss": 2.4517, "step": 997 }, { "epoch": 0.1, "learning_rate": 1.9744563752470327e-05, "loss": 2.3573, "step": 998 }, { "epoch": 0.1, "learning_rate": 1.9743834462347102e-05, "loss": 2.4072, "step": 999 }, { "epoch": 0.1, "learning_rate": 1.9743104146125033e-05, "loss": 2.442, "step": 1000 }, { "epoch": 0.1, "learning_rate": 1.974237280388103e-05, "loss": 2.5488, "step": 1001 }, { "epoch": 0.1, "learning_rate": 1.97416404356921e-05, "loss": 2.4362, "step": 1002 }, { "epoch": 0.1, "learning_rate": 1.974090704163538e-05, "loss": 2.4406, "step": 1003 }, { "epoch": 0.1, "learning_rate": 1.9740172621788094e-05, "loss": 2.436, "step": 1004 }, { "epoch": 0.1, "learning_rate": 1.973943717622758e-05, "loss": 2.4657, "step": 1005 }, { "epoch": 0.1, "learning_rate": 1.973870070503129e-05, "loss": 2.5037, "step": 1006 }, { "epoch": 0.1, "learning_rate": 1.973796320827678e-05, "loss": 2.4439, "step": 1007 }, { "epoch": 0.1, "learning_rate": 1.9737224686041712e-05, "loss": 2.4881, "step": 1008 }, { "epoch": 0.1, "learning_rate": 1.9736485138403858e-05, "loss": 2.518, "step": 1009 }, { "epoch": 0.1, "learning_rate": 1.9735744565441098e-05, "loss": 2.4324, "step": 1010 }, { "epoch": 0.1, "learning_rate": 1.9735002967231424e-05, "loss": 2.4948, "step": 1011 }, { "epoch": 0.1, "learning_rate": 1.9734260343852926e-05, "loss": 2.5142, "step": 1012 }, { "epoch": 0.1, "learning_rate": 1.9733516695383808e-05, "loss": 2.5482, "step": 1013 }, { "epoch": 0.1, "learning_rate": 1.9732772021902383e-05, "loss": 2.5354, "step": 1014 }, { "epoch": 0.1, "learning_rate": 1.9732026323487078e-05, "loss": 2.4362, "step": 1015 }, { "epoch": 0.1, "learning_rate": 1.9731279600216408e-05, "loss": 2.5119, "step": 1016 }, { "epoch": 0.1, "learning_rate": 1.9730531852169018e-05, "loss": 2.4857, "step": 1017 }, { "epoch": 0.1, "learning_rate": 1.972978307942365e-05, "loss": 2.6166, "step": 1018 }, { "epoch": 0.1, "learning_rate": 1.972903328205915e-05, "loss": 2.5604, "step": 1019 }, { "epoch": 0.1, "learning_rate": 1.9728282460154484e-05, "loss": 2.4336, "step": 1020 }, { "epoch": 0.1, "learning_rate": 1.9727530613788716e-05, "loss": 2.4108, "step": 1021 }, { "epoch": 0.1, "learning_rate": 1.9726777743041018e-05, "loss": 2.3173, "step": 1022 }, { "epoch": 0.1, "learning_rate": 1.972602384799068e-05, "loss": 2.4854, "step": 1023 }, { "epoch": 0.1, "learning_rate": 1.9725268928717086e-05, "loss": 2.4914, "step": 1024 }, { "epoch": 0.1, "learning_rate": 1.9724512985299736e-05, "loss": 2.404, "step": 1025 }, { "epoch": 0.1, "learning_rate": 1.9723756017818245e-05, "loss": 2.4092, "step": 1026 }, { "epoch": 0.1, "learning_rate": 1.9722998026352315e-05, "loss": 2.5158, "step": 1027 }, { "epoch": 0.1, "learning_rate": 1.9722239010981778e-05, "loss": 2.4362, "step": 1028 }, { "epoch": 0.1, "learning_rate": 1.9721478971786556e-05, "loss": 2.4316, "step": 1029 }, { "epoch": 0.1, "learning_rate": 1.972071790884669e-05, "loss": 2.4404, "step": 1030 }, { "epoch": 0.1, "learning_rate": 1.9719955822242327e-05, "loss": 2.4665, "step": 1031 }, { "epoch": 0.1, "learning_rate": 1.9719192712053718e-05, "loss": 2.4293, "step": 1032 }, { "epoch": 0.1, "learning_rate": 1.971842857836123e-05, "loss": 2.4945, "step": 1033 }, { "epoch": 0.1, "learning_rate": 1.9717663421245326e-05, "loss": 2.4864, "step": 1034 }, { "epoch": 0.1, "learning_rate": 1.971689724078658e-05, "loss": 2.3636, "step": 1035 }, { "epoch": 0.1, "learning_rate": 1.9716130037065685e-05, "loss": 2.4073, "step": 1036 }, { "epoch": 0.1, "learning_rate": 1.9715361810163434e-05, "loss": 2.4591, "step": 1037 }, { "epoch": 0.1, "learning_rate": 1.9714592560160717e-05, "loss": 2.3701, "step": 1038 }, { "epoch": 0.1, "learning_rate": 1.971382228713855e-05, "loss": 2.3447, "step": 1039 }, { "epoch": 0.1, "learning_rate": 1.9713050991178042e-05, "loss": 2.4433, "step": 1040 }, { "epoch": 0.1, "learning_rate": 1.9712278672360423e-05, "loss": 2.5141, "step": 1041 }, { "epoch": 0.1, "learning_rate": 1.971150533076702e-05, "loss": 2.3123, "step": 1042 }, { "epoch": 0.1, "learning_rate": 1.9710730966479273e-05, "loss": 2.4467, "step": 1043 }, { "epoch": 0.1, "learning_rate": 1.970995557957873e-05, "loss": 2.5245, "step": 1044 }, { "epoch": 0.1, "learning_rate": 1.970917917014704e-05, "loss": 2.4534, "step": 1045 }, { "epoch": 0.1, "learning_rate": 1.9708401738265967e-05, "loss": 2.4331, "step": 1046 }, { "epoch": 0.1, "learning_rate": 1.9707623284017385e-05, "loss": 2.5309, "step": 1047 }, { "epoch": 0.1, "learning_rate": 1.9706843807483268e-05, "loss": 2.4667, "step": 1048 }, { "epoch": 0.11, "learning_rate": 1.9706063308745694e-05, "loss": 2.4509, "step": 1049 }, { "epoch": 0.11, "learning_rate": 1.9705281787886867e-05, "loss": 2.4917, "step": 1050 }, { "epoch": 0.11, "learning_rate": 1.970449924498908e-05, "loss": 2.4956, "step": 1051 }, { "epoch": 0.11, "learning_rate": 1.970371568013474e-05, "loss": 2.4184, "step": 1052 }, { "epoch": 0.11, "learning_rate": 1.9702931093406364e-05, "loss": 2.4254, "step": 1053 }, { "epoch": 0.11, "learning_rate": 1.970214548488658e-05, "loss": 2.4489, "step": 1054 }, { "epoch": 0.11, "learning_rate": 1.970135885465811e-05, "loss": 2.4288, "step": 1055 }, { "epoch": 0.11, "learning_rate": 1.9700571202803797e-05, "loss": 2.5244, "step": 1056 }, { "epoch": 0.11, "learning_rate": 1.9699782529406585e-05, "loss": 2.4184, "step": 1057 }, { "epoch": 0.11, "learning_rate": 1.969899283454953e-05, "loss": 2.4596, "step": 1058 }, { "epoch": 0.11, "learning_rate": 1.9698202118315784e-05, "loss": 2.5451, "step": 1059 }, { "epoch": 0.11, "learning_rate": 1.9697410380788628e-05, "loss": 2.4851, "step": 1060 }, { "epoch": 0.11, "learning_rate": 1.9696617622051432e-05, "loss": 2.3658, "step": 1061 }, { "epoch": 0.11, "learning_rate": 1.9695823842187673e-05, "loss": 2.4304, "step": 1062 }, { "epoch": 0.11, "learning_rate": 1.969502904128095e-05, "loss": 2.3976, "step": 1063 }, { "epoch": 0.11, "learning_rate": 1.9694233219414963e-05, "loss": 2.4402, "step": 1064 }, { "epoch": 0.11, "learning_rate": 1.9693436376673514e-05, "loss": 2.5219, "step": 1065 }, { "epoch": 0.11, "learning_rate": 1.9692638513140517e-05, "loss": 2.4342, "step": 1066 }, { "epoch": 0.11, "learning_rate": 1.9691839628899988e-05, "loss": 2.3862, "step": 1067 }, { "epoch": 0.11, "learning_rate": 1.9691039724036067e-05, "loss": 2.5265, "step": 1068 }, { "epoch": 0.11, "learning_rate": 1.969023879863298e-05, "loss": 2.5235, "step": 1069 }, { "epoch": 0.11, "learning_rate": 1.9689436852775075e-05, "loss": 2.4904, "step": 1070 }, { "epoch": 0.11, "learning_rate": 1.96886338865468e-05, "loss": 2.3799, "step": 1071 }, { "epoch": 0.11, "learning_rate": 1.968782990003272e-05, "loss": 2.5514, "step": 1072 }, { "epoch": 0.11, "learning_rate": 1.9687024893317493e-05, "loss": 2.3703, "step": 1073 }, { "epoch": 0.11, "learning_rate": 1.9686218866485896e-05, "loss": 2.4938, "step": 1074 }, { "epoch": 0.11, "learning_rate": 1.9685411819622805e-05, "loss": 2.4346, "step": 1075 }, { "epoch": 0.11, "learning_rate": 1.968460375281322e-05, "loss": 2.4785, "step": 1076 }, { "epoch": 0.11, "learning_rate": 1.968379466614222e-05, "loss": 2.412, "step": 1077 }, { "epoch": 0.11, "learning_rate": 1.9682984559695025e-05, "loss": 2.4635, "step": 1078 }, { "epoch": 0.11, "learning_rate": 1.968217343355693e-05, "loss": 2.4369, "step": 1079 }, { "epoch": 0.11, "learning_rate": 1.9681361287813363e-05, "loss": 2.457, "step": 1080 }, { "epoch": 0.11, "learning_rate": 1.9680548122549845e-05, "loss": 2.4897, "step": 1081 }, { "epoch": 0.11, "learning_rate": 1.9679733937852007e-05, "loss": 2.4253, "step": 1082 }, { "epoch": 0.11, "learning_rate": 1.9678918733805596e-05, "loss": 2.4053, "step": 1083 }, { "epoch": 0.11, "learning_rate": 1.967810251049645e-05, "loss": 2.5043, "step": 1084 }, { "epoch": 0.11, "learning_rate": 1.9677285268010523e-05, "loss": 2.3831, "step": 1085 }, { "epoch": 0.11, "learning_rate": 1.9676467006433886e-05, "loss": 2.506, "step": 1086 }, { "epoch": 0.11, "learning_rate": 1.9675647725852704e-05, "loss": 2.4206, "step": 1087 }, { "epoch": 0.11, "learning_rate": 1.967482742635325e-05, "loss": 2.5057, "step": 1088 }, { "epoch": 0.11, "learning_rate": 1.967400610802191e-05, "loss": 2.4662, "step": 1089 }, { "epoch": 0.11, "learning_rate": 1.9673183770945177e-05, "loss": 2.4922, "step": 1090 }, { "epoch": 0.11, "learning_rate": 1.9672360415209647e-05, "loss": 2.5259, "step": 1091 }, { "epoch": 0.11, "learning_rate": 1.9671536040902023e-05, "loss": 2.4089, "step": 1092 }, { "epoch": 0.11, "learning_rate": 1.967071064810912e-05, "loss": 2.5044, "step": 1093 }, { "epoch": 0.11, "learning_rate": 1.9669884236917866e-05, "loss": 2.4373, "step": 1094 }, { "epoch": 0.11, "learning_rate": 1.9669056807415276e-05, "loss": 2.4901, "step": 1095 }, { "epoch": 0.11, "learning_rate": 1.9668228359688488e-05, "loss": 2.4525, "step": 1096 }, { "epoch": 0.11, "learning_rate": 1.966739889382475e-05, "loss": 2.423, "step": 1097 }, { "epoch": 0.11, "learning_rate": 1.96665684099114e-05, "loss": 2.4926, "step": 1098 }, { "epoch": 0.11, "learning_rate": 1.9665736908035907e-05, "loss": 2.4273, "step": 1099 }, { "epoch": 0.11, "learning_rate": 1.9664904388285825e-05, "loss": 2.4384, "step": 1100 }, { "epoch": 0.11, "learning_rate": 1.9664070850748825e-05, "loss": 2.4028, "step": 1101 }, { "epoch": 0.11, "learning_rate": 1.9663236295512692e-05, "loss": 2.4759, "step": 1102 }, { "epoch": 0.11, "learning_rate": 1.9662400722665302e-05, "loss": 2.3845, "step": 1103 }, { "epoch": 0.11, "learning_rate": 1.9661564132294654e-05, "loss": 2.382, "step": 1104 }, { "epoch": 0.11, "learning_rate": 1.9660726524488843e-05, "loss": 2.4535, "step": 1105 }, { "epoch": 0.11, "learning_rate": 1.9659887899336075e-05, "loss": 2.5064, "step": 1106 }, { "epoch": 0.11, "learning_rate": 1.965904825692467e-05, "loss": 2.3997, "step": 1107 }, { "epoch": 0.11, "learning_rate": 1.965820759734304e-05, "loss": 2.4248, "step": 1108 }, { "epoch": 0.11, "learning_rate": 1.9657365920679718e-05, "loss": 2.4506, "step": 1109 }, { "epoch": 0.11, "learning_rate": 1.965652322702334e-05, "loss": 2.3654, "step": 1110 }, { "epoch": 0.11, "learning_rate": 1.9655679516462644e-05, "loss": 2.4951, "step": 1111 }, { "epoch": 0.11, "learning_rate": 1.9654834789086478e-05, "loss": 2.4771, "step": 1112 }, { "epoch": 0.11, "learning_rate": 1.9653989044983804e-05, "loss": 2.3956, "step": 1113 }, { "epoch": 0.11, "learning_rate": 1.965314228424368e-05, "loss": 2.3612, "step": 1114 }, { "epoch": 0.11, "learning_rate": 1.9652294506955275e-05, "loss": 2.4481, "step": 1115 }, { "epoch": 0.11, "learning_rate": 1.9651445713207877e-05, "loss": 2.5497, "step": 1116 }, { "epoch": 0.11, "learning_rate": 1.965059590309086e-05, "loss": 2.4646, "step": 1117 }, { "epoch": 0.11, "learning_rate": 1.9649745076693716e-05, "loss": 2.4375, "step": 1118 }, { "epoch": 0.11, "learning_rate": 1.9648893234106044e-05, "loss": 2.4967, "step": 1119 }, { "epoch": 0.11, "learning_rate": 1.9648040375417557e-05, "loss": 2.4216, "step": 1120 }, { "epoch": 0.11, "learning_rate": 1.9647186500718057e-05, "loss": 2.4709, "step": 1121 }, { "epoch": 0.11, "learning_rate": 1.9646331610097473e-05, "loss": 2.3939, "step": 1122 }, { "epoch": 0.11, "learning_rate": 1.964547570364582e-05, "loss": 2.3923, "step": 1123 }, { "epoch": 0.11, "learning_rate": 1.964461878145324e-05, "loss": 2.4231, "step": 1124 }, { "epoch": 0.11, "learning_rate": 1.9643760843609972e-05, "loss": 2.4012, "step": 1125 }, { "epoch": 0.11, "learning_rate": 1.9642901890206363e-05, "loss": 2.5561, "step": 1126 }, { "epoch": 0.11, "learning_rate": 1.9642041921332863e-05, "loss": 2.4366, "step": 1127 }, { "epoch": 0.11, "learning_rate": 1.964118093708004e-05, "loss": 2.5733, "step": 1128 }, { "epoch": 0.11, "learning_rate": 1.9640318937538558e-05, "loss": 2.4791, "step": 1129 }, { "epoch": 0.11, "learning_rate": 1.9639455922799195e-05, "loss": 2.5335, "step": 1130 }, { "epoch": 0.11, "learning_rate": 1.9638591892952827e-05, "loss": 2.3568, "step": 1131 }, { "epoch": 0.11, "learning_rate": 1.9637726848090445e-05, "loss": 2.2835, "step": 1132 }, { "epoch": 0.11, "learning_rate": 1.9636860788303148e-05, "loss": 2.4744, "step": 1133 }, { "epoch": 0.11, "learning_rate": 1.963599371368214e-05, "loss": 2.5088, "step": 1134 }, { "epoch": 0.11, "learning_rate": 1.9635125624318725e-05, "loss": 2.4973, "step": 1135 }, { "epoch": 0.11, "learning_rate": 1.963425652030432e-05, "loss": 2.4829, "step": 1136 }, { "epoch": 0.11, "learning_rate": 1.9633386401730453e-05, "loss": 2.4408, "step": 1137 }, { "epoch": 0.11, "learning_rate": 1.9632515268688747e-05, "loss": 2.448, "step": 1138 }, { "epoch": 0.11, "learning_rate": 1.9631643121270945e-05, "loss": 2.4859, "step": 1139 }, { "epoch": 0.11, "learning_rate": 1.9630769959568888e-05, "loss": 2.3148, "step": 1140 }, { "epoch": 0.11, "learning_rate": 1.9629895783674527e-05, "loss": 2.4532, "step": 1141 }, { "epoch": 0.11, "learning_rate": 1.9629020593679917e-05, "loss": 2.4665, "step": 1142 }, { "epoch": 0.11, "learning_rate": 1.9628144389677226e-05, "loss": 2.354, "step": 1143 }, { "epoch": 0.11, "learning_rate": 1.9627267171758723e-05, "loss": 2.4573, "step": 1144 }, { "epoch": 0.11, "learning_rate": 1.9626388940016788e-05, "loss": 2.4113, "step": 1145 }, { "epoch": 0.11, "learning_rate": 1.96255096945439e-05, "loss": 2.361, "step": 1146 }, { "epoch": 0.11, "learning_rate": 1.9624629435432653e-05, "loss": 2.4468, "step": 1147 }, { "epoch": 0.12, "learning_rate": 1.9623748162775746e-05, "loss": 2.4271, "step": 1148 }, { "epoch": 0.12, "learning_rate": 1.962286587666598e-05, "loss": 2.3976, "step": 1149 }, { "epoch": 0.12, "learning_rate": 1.9621982577196274e-05, "loss": 2.4438, "step": 1150 }, { "epoch": 0.12, "learning_rate": 1.9621098264459636e-05, "loss": 2.5087, "step": 1151 }, { "epoch": 0.12, "learning_rate": 1.96202129385492e-05, "loss": 2.4252, "step": 1152 }, { "epoch": 0.12, "learning_rate": 1.9619326599558192e-05, "loss": 2.5471, "step": 1153 }, { "epoch": 0.12, "learning_rate": 1.961843924757995e-05, "loss": 2.4747, "step": 1154 }, { "epoch": 0.12, "learning_rate": 1.961755088270792e-05, "loss": 2.5854, "step": 1155 }, { "epoch": 0.12, "learning_rate": 1.9616661505035654e-05, "loss": 2.4684, "step": 1156 }, { "epoch": 0.12, "learning_rate": 1.9615771114656813e-05, "loss": 2.4948, "step": 1157 }, { "epoch": 0.12, "learning_rate": 1.9614879711665156e-05, "loss": 2.4797, "step": 1158 }, { "epoch": 0.12, "learning_rate": 1.9613987296154557e-05, "loss": 2.4612, "step": 1159 }, { "epoch": 0.12, "learning_rate": 1.9613093868218994e-05, "loss": 2.4759, "step": 1160 }, { "epoch": 0.12, "learning_rate": 1.9612199427952554e-05, "loss": 2.4328, "step": 1161 }, { "epoch": 0.12, "learning_rate": 1.961130397544942e-05, "loss": 2.4697, "step": 1162 }, { "epoch": 0.12, "learning_rate": 1.96104075108039e-05, "loss": 2.4874, "step": 1163 }, { "epoch": 0.12, "learning_rate": 1.9609510034110396e-05, "loss": 2.3976, "step": 1164 }, { "epoch": 0.12, "learning_rate": 1.9608611545463415e-05, "loss": 2.36, "step": 1165 }, { "epoch": 0.12, "learning_rate": 1.960771204495758e-05, "loss": 2.4723, "step": 1166 }, { "epoch": 0.12, "learning_rate": 1.960681153268761e-05, "loss": 2.4779, "step": 1167 }, { "epoch": 0.12, "learning_rate": 1.9605910008748338e-05, "loss": 2.3911, "step": 1168 }, { "epoch": 0.12, "learning_rate": 1.96050074732347e-05, "loss": 2.4525, "step": 1169 }, { "epoch": 0.12, "learning_rate": 1.9604103926241738e-05, "loss": 2.4501, "step": 1170 }, { "epoch": 0.12, "learning_rate": 1.9603199367864613e-05, "loss": 2.4809, "step": 1171 }, { "epoch": 0.12, "learning_rate": 1.9602293798198565e-05, "loss": 2.5545, "step": 1172 }, { "epoch": 0.12, "learning_rate": 1.9601387217338974e-05, "loss": 2.4395, "step": 1173 }, { "epoch": 0.12, "learning_rate": 1.9600479625381297e-05, "loss": 2.4756, "step": 1174 }, { "epoch": 0.12, "learning_rate": 1.9599571022421116e-05, "loss": 2.5044, "step": 1175 }, { "epoch": 0.12, "learning_rate": 1.9598661408554114e-05, "loss": 2.462, "step": 1176 }, { "epoch": 0.12, "learning_rate": 1.9597750783876077e-05, "loss": 2.5223, "step": 1177 }, { "epoch": 0.12, "learning_rate": 1.9596839148482906e-05, "loss": 2.4166, "step": 1178 }, { "epoch": 0.12, "learning_rate": 1.9595926502470598e-05, "loss": 2.492, "step": 1179 }, { "epoch": 0.12, "learning_rate": 1.959501284593526e-05, "loss": 2.4646, "step": 1180 }, { "epoch": 0.12, "learning_rate": 1.9594098178973112e-05, "loss": 2.4127, "step": 1181 }, { "epoch": 0.12, "learning_rate": 1.9593182501680476e-05, "loss": 2.391, "step": 1182 }, { "epoch": 0.12, "learning_rate": 1.9592265814153774e-05, "loss": 2.4557, "step": 1183 }, { "epoch": 0.12, "learning_rate": 1.9591348116489546e-05, "loss": 2.3394, "step": 1184 }, { "epoch": 0.12, "learning_rate": 1.9590429408784427e-05, "loss": 2.4483, "step": 1185 }, { "epoch": 0.12, "learning_rate": 1.9589509691135165e-05, "loss": 2.4582, "step": 1186 }, { "epoch": 0.12, "learning_rate": 1.9588588963638618e-05, "loss": 2.5286, "step": 1187 }, { "epoch": 0.12, "learning_rate": 1.958766722639174e-05, "loss": 2.3345, "step": 1188 }, { "epoch": 0.12, "learning_rate": 1.95867444794916e-05, "loss": 2.5839, "step": 1189 }, { "epoch": 0.12, "learning_rate": 1.958582072303537e-05, "loss": 2.4548, "step": 1190 }, { "epoch": 0.12, "learning_rate": 1.9584895957120324e-05, "loss": 2.4054, "step": 1191 }, { "epoch": 0.12, "learning_rate": 1.958397018184385e-05, "loss": 2.4216, "step": 1192 }, { "epoch": 0.12, "learning_rate": 1.9583043397303443e-05, "loss": 2.4738, "step": 1193 }, { "epoch": 0.12, "learning_rate": 1.9582115603596696e-05, "loss": 2.4992, "step": 1194 }, { "epoch": 0.12, "learning_rate": 1.958118680082131e-05, "loss": 2.4637, "step": 1195 }, { "epoch": 0.12, "learning_rate": 1.9580256989075103e-05, "loss": 2.3953, "step": 1196 }, { "epoch": 0.12, "learning_rate": 1.9579326168455983e-05, "loss": 2.4206, "step": 1197 }, { "epoch": 0.12, "learning_rate": 1.9578394339061975e-05, "loss": 2.4231, "step": 1198 }, { "epoch": 0.12, "learning_rate": 1.957746150099121e-05, "loss": 2.444, "step": 1199 }, { "epoch": 0.12, "learning_rate": 1.9576527654341922e-05, "loss": 2.5367, "step": 1200 }, { "epoch": 0.12, "learning_rate": 1.9575592799212453e-05, "loss": 2.4815, "step": 1201 }, { "epoch": 0.12, "learning_rate": 1.9574656935701248e-05, "loss": 2.4011, "step": 1202 }, { "epoch": 0.12, "learning_rate": 1.9573720063906857e-05, "loss": 2.502, "step": 1203 }, { "epoch": 0.12, "learning_rate": 1.9572782183927947e-05, "loss": 2.4092, "step": 1204 }, { "epoch": 0.12, "learning_rate": 1.9571843295863278e-05, "loss": 2.5165, "step": 1205 }, { "epoch": 0.12, "learning_rate": 1.9570903399811725e-05, "loss": 2.4127, "step": 1206 }, { "epoch": 0.12, "learning_rate": 1.9569962495872268e-05, "loss": 2.464, "step": 1207 }, { "epoch": 0.12, "learning_rate": 1.9569020584143987e-05, "loss": 2.4292, "step": 1208 }, { "epoch": 0.12, "learning_rate": 1.9568077664726073e-05, "loss": 2.3881, "step": 1209 }, { "epoch": 0.12, "learning_rate": 1.9567133737717824e-05, "loss": 2.415, "step": 1210 }, { "epoch": 0.12, "learning_rate": 1.9566188803218643e-05, "loss": 2.4629, "step": 1211 }, { "epoch": 0.12, "learning_rate": 1.9565242861328036e-05, "loss": 2.5124, "step": 1212 }, { "epoch": 0.12, "learning_rate": 1.9564295912145625e-05, "loss": 2.4519, "step": 1213 }, { "epoch": 0.12, "learning_rate": 1.956334795577112e-05, "loss": 2.4463, "step": 1214 }, { "epoch": 0.12, "learning_rate": 1.9562398992304358e-05, "loss": 2.5046, "step": 1215 }, { "epoch": 0.12, "learning_rate": 1.9561449021845264e-05, "loss": 2.502, "step": 1216 }, { "epoch": 0.12, "learning_rate": 1.956049804449388e-05, "loss": 2.4946, "step": 1217 }, { "epoch": 0.12, "learning_rate": 1.9559546060350353e-05, "loss": 2.5372, "step": 1218 }, { "epoch": 0.12, "learning_rate": 1.955859306951493e-05, "loss": 2.3516, "step": 1219 }, { "epoch": 0.12, "learning_rate": 1.9557639072087973e-05, "loss": 2.4498, "step": 1220 }, { "epoch": 0.12, "learning_rate": 1.9556684068169945e-05, "loss": 2.4426, "step": 1221 }, { "epoch": 0.12, "learning_rate": 1.955572805786141e-05, "loss": 2.4574, "step": 1222 }, { "epoch": 0.12, "learning_rate": 1.9554771041263046e-05, "loss": 2.4375, "step": 1223 }, { "epoch": 0.12, "learning_rate": 1.9553813018475633e-05, "loss": 2.3872, "step": 1224 }, { "epoch": 0.12, "learning_rate": 1.955285398960006e-05, "loss": 2.4691, "step": 1225 }, { "epoch": 0.12, "learning_rate": 1.955189395473732e-05, "loss": 2.427, "step": 1226 }, { "epoch": 0.12, "learning_rate": 1.9550932913988507e-05, "loss": 2.4945, "step": 1227 }, { "epoch": 0.12, "learning_rate": 1.954997086745483e-05, "loss": 2.4289, "step": 1228 }, { "epoch": 0.12, "learning_rate": 1.95490078152376e-05, "loss": 2.5135, "step": 1229 }, { "epoch": 0.12, "learning_rate": 1.9548043757438235e-05, "loss": 2.5014, "step": 1230 }, { "epoch": 0.12, "learning_rate": 1.9547078694158253e-05, "loss": 2.58, "step": 1231 }, { "epoch": 0.12, "learning_rate": 1.9546112625499285e-05, "loss": 2.4797, "step": 1232 }, { "epoch": 0.12, "learning_rate": 1.9545145551563064e-05, "loss": 2.4899, "step": 1233 }, { "epoch": 0.12, "learning_rate": 1.9544177472451436e-05, "loss": 2.3244, "step": 1234 }, { "epoch": 0.12, "learning_rate": 1.954320838826634e-05, "loss": 2.4437, "step": 1235 }, { "epoch": 0.12, "learning_rate": 1.9542238299109825e-05, "loss": 2.4641, "step": 1236 }, { "epoch": 0.12, "learning_rate": 1.9541267205084056e-05, "loss": 2.4423, "step": 1237 }, { "epoch": 0.12, "learning_rate": 1.9540295106291294e-05, "loss": 2.3742, "step": 1238 }, { "epoch": 0.12, "learning_rate": 1.9539322002833913e-05, "loss": 2.3938, "step": 1239 }, { "epoch": 0.12, "learning_rate": 1.9538347894814378e-05, "loss": 2.4418, "step": 1240 }, { "epoch": 0.12, "learning_rate": 1.9537372782335277e-05, "loss": 2.446, "step": 1241 }, { "epoch": 0.12, "learning_rate": 1.9536396665499296e-05, "loss": 2.4794, "step": 1242 }, { "epoch": 0.12, "learning_rate": 1.9535419544409225e-05, "loss": 2.4725, "step": 1243 }, { "epoch": 0.12, "learning_rate": 1.9534441419167965e-05, "loss": 2.3718, "step": 1244 }, { "epoch": 0.12, "learning_rate": 1.9533462289878518e-05, "loss": 2.4558, "step": 1245 }, { "epoch": 0.12, "learning_rate": 1.9532482156643992e-05, "loss": 2.5281, "step": 1246 }, { "epoch": 0.12, "learning_rate": 1.9531501019567607e-05, "loss": 2.4572, "step": 1247 }, { "epoch": 0.13, "learning_rate": 1.953051887875268e-05, "loss": 2.4582, "step": 1248 }, { "epoch": 0.13, "learning_rate": 1.952953573430264e-05, "loss": 2.3716, "step": 1249 }, { "epoch": 0.13, "learning_rate": 1.9528551586321018e-05, "loss": 2.5259, "step": 1250 }, { "epoch": 0.13, "learning_rate": 1.9527566434911458e-05, "loss": 2.4886, "step": 1251 }, { "epoch": 0.13, "learning_rate": 1.9526580280177695e-05, "loss": 2.4373, "step": 1252 }, { "epoch": 0.13, "learning_rate": 1.9525593122223584e-05, "loss": 2.4895, "step": 1253 }, { "epoch": 0.13, "learning_rate": 1.9524604961153077e-05, "loss": 2.4232, "step": 1254 }, { "epoch": 0.13, "learning_rate": 1.9523615797070236e-05, "loss": 2.4244, "step": 1255 }, { "epoch": 0.13, "learning_rate": 1.9522625630079227e-05, "loss": 2.4027, "step": 1256 }, { "epoch": 0.13, "learning_rate": 1.9521634460284323e-05, "loss": 2.4466, "step": 1257 }, { "epoch": 0.13, "learning_rate": 1.9520642287789902e-05, "loss": 2.5268, "step": 1258 }, { "epoch": 0.13, "learning_rate": 1.9519649112700447e-05, "loss": 2.4129, "step": 1259 }, { "epoch": 0.13, "learning_rate": 1.9518654935120546e-05, "loss": 2.3729, "step": 1260 }, { "epoch": 0.13, "learning_rate": 1.9517659755154893e-05, "loss": 2.4589, "step": 1261 }, { "epoch": 0.13, "learning_rate": 1.951666357290829e-05, "loss": 2.5174, "step": 1262 }, { "epoch": 0.13, "learning_rate": 1.951566638848564e-05, "loss": 2.4165, "step": 1263 }, { "epoch": 0.13, "learning_rate": 1.9514668201991958e-05, "loss": 2.4652, "step": 1264 }, { "epoch": 0.13, "learning_rate": 1.9513669013532355e-05, "loss": 2.2985, "step": 1265 }, { "epoch": 0.13, "learning_rate": 1.9512668823212056e-05, "loss": 2.4231, "step": 1266 }, { "epoch": 0.13, "learning_rate": 1.9511667631136387e-05, "loss": 2.4421, "step": 1267 }, { "epoch": 0.13, "learning_rate": 1.9510665437410782e-05, "loss": 2.4464, "step": 1268 }, { "epoch": 0.13, "learning_rate": 1.950966224214078e-05, "loss": 2.3625, "step": 1269 }, { "epoch": 0.13, "learning_rate": 1.950865804543203e-05, "loss": 2.4188, "step": 1270 }, { "epoch": 0.13, "learning_rate": 1.9507652847390268e-05, "loss": 2.3153, "step": 1271 }, { "epoch": 0.13, "learning_rate": 1.9506646648121357e-05, "loss": 2.3621, "step": 1272 }, { "epoch": 0.13, "learning_rate": 1.9505639447731264e-05, "loss": 2.452, "step": 1273 }, { "epoch": 0.13, "learning_rate": 1.9504631246326045e-05, "loss": 2.5185, "step": 1274 }, { "epoch": 0.13, "learning_rate": 1.9503622044011874e-05, "loss": 2.4048, "step": 1275 }, { "epoch": 0.13, "learning_rate": 1.9502611840895027e-05, "loss": 2.5023, "step": 1276 }, { "epoch": 0.13, "learning_rate": 1.950160063708189e-05, "loss": 2.3908, "step": 1277 }, { "epoch": 0.13, "learning_rate": 1.9500588432678946e-05, "loss": 2.439, "step": 1278 }, { "epoch": 0.13, "learning_rate": 1.9499575227792788e-05, "loss": 2.4674, "step": 1279 }, { "epoch": 0.13, "learning_rate": 1.9498561022530114e-05, "loss": 2.3716, "step": 1280 }, { "epoch": 0.13, "learning_rate": 1.949754581699773e-05, "loss": 2.4137, "step": 1281 }, { "epoch": 0.13, "learning_rate": 1.949652961130254e-05, "loss": 2.484, "step": 1282 }, { "epoch": 0.13, "learning_rate": 1.9495512405551565e-05, "loss": 2.3733, "step": 1283 }, { "epoch": 0.13, "learning_rate": 1.949449419985192e-05, "loss": 2.4478, "step": 1284 }, { "epoch": 0.13, "learning_rate": 1.949347499431083e-05, "loss": 2.5017, "step": 1285 }, { "epoch": 0.13, "learning_rate": 1.9492454789035623e-05, "loss": 2.4698, "step": 1286 }, { "epoch": 0.13, "learning_rate": 1.9491433584133736e-05, "loss": 2.4553, "step": 1287 }, { "epoch": 0.13, "learning_rate": 1.9490411379712716e-05, "loss": 2.4838, "step": 1288 }, { "epoch": 0.13, "learning_rate": 1.94893881758802e-05, "loss": 2.39, "step": 1289 }, { "epoch": 0.13, "learning_rate": 1.948836397274394e-05, "loss": 2.5133, "step": 1290 }, { "epoch": 0.13, "learning_rate": 1.9487338770411793e-05, "loss": 2.4534, "step": 1291 }, { "epoch": 0.13, "learning_rate": 1.9486312568991726e-05, "loss": 2.3925, "step": 1292 }, { "epoch": 0.13, "learning_rate": 1.9485285368591798e-05, "loss": 2.469, "step": 1293 }, { "epoch": 0.13, "learning_rate": 1.9484257169320187e-05, "loss": 2.4201, "step": 1294 }, { "epoch": 0.13, "learning_rate": 1.9483227971285166e-05, "loss": 2.5294, "step": 1295 }, { "epoch": 0.13, "learning_rate": 1.948219777459512e-05, "loss": 2.4762, "step": 1296 }, { "epoch": 0.13, "learning_rate": 1.948116657935853e-05, "loss": 2.3756, "step": 1297 }, { "epoch": 0.13, "learning_rate": 1.9480134385684e-05, "loss": 2.3903, "step": 1298 }, { "epoch": 0.13, "learning_rate": 1.947910119368022e-05, "loss": 2.5251, "step": 1299 }, { "epoch": 0.13, "learning_rate": 1.947806700345599e-05, "loss": 2.3751, "step": 1300 }, { "epoch": 0.13, "learning_rate": 1.9477031815120227e-05, "loss": 2.4256, "step": 1301 }, { "epoch": 0.13, "learning_rate": 1.947599562878194e-05, "loss": 2.4844, "step": 1302 }, { "epoch": 0.13, "learning_rate": 1.9474958444550244e-05, "loss": 2.292, "step": 1303 }, { "epoch": 0.13, "learning_rate": 1.9473920262534363e-05, "loss": 2.4474, "step": 1304 }, { "epoch": 0.13, "learning_rate": 1.947288108284363e-05, "loss": 2.4948, "step": 1305 }, { "epoch": 0.13, "learning_rate": 1.9471840905587476e-05, "loss": 2.422, "step": 1306 }, { "epoch": 0.13, "learning_rate": 1.9470799730875437e-05, "loss": 2.3683, "step": 1307 }, { "epoch": 0.13, "learning_rate": 1.9469757558817163e-05, "loss": 2.3711, "step": 1308 }, { "epoch": 0.13, "learning_rate": 1.9468714389522392e-05, "loss": 2.4087, "step": 1309 }, { "epoch": 0.13, "learning_rate": 1.946767022310099e-05, "loss": 2.432, "step": 1310 }, { "epoch": 0.13, "learning_rate": 1.9466625059662903e-05, "loss": 2.4318, "step": 1311 }, { "epoch": 0.13, "learning_rate": 1.9465578899318203e-05, "loss": 2.5427, "step": 1312 }, { "epoch": 0.13, "learning_rate": 1.9464531742177056e-05, "loss": 2.4546, "step": 1313 }, { "epoch": 0.13, "learning_rate": 1.9463483588349737e-05, "loss": 2.4897, "step": 1314 }, { "epoch": 0.13, "learning_rate": 1.9462434437946623e-05, "loss": 2.5227, "step": 1315 }, { "epoch": 0.13, "learning_rate": 1.9461384291078196e-05, "loss": 2.4133, "step": 1316 }, { "epoch": 0.13, "learning_rate": 1.946033314785505e-05, "loss": 2.3905, "step": 1317 }, { "epoch": 0.13, "learning_rate": 1.9459281008387872e-05, "loss": 2.5517, "step": 1318 }, { "epoch": 0.13, "learning_rate": 1.9458227872787462e-05, "loss": 2.3821, "step": 1319 }, { "epoch": 0.13, "learning_rate": 1.9457173741164722e-05, "loss": 2.4483, "step": 1320 }, { "epoch": 0.13, "learning_rate": 1.9456118613630665e-05, "loss": 2.4131, "step": 1321 }, { "epoch": 0.13, "learning_rate": 1.9455062490296398e-05, "loss": 2.3504, "step": 1322 }, { "epoch": 0.13, "learning_rate": 1.9454005371273142e-05, "loss": 2.4491, "step": 1323 }, { "epoch": 0.13, "learning_rate": 1.9452947256672216e-05, "loss": 2.4081, "step": 1324 }, { "epoch": 0.13, "learning_rate": 1.9451888146605055e-05, "loss": 2.3493, "step": 1325 }, { "epoch": 0.13, "learning_rate": 1.945082804118318e-05, "loss": 2.4942, "step": 1326 }, { "epoch": 0.13, "learning_rate": 1.9449766940518237e-05, "loss": 2.4248, "step": 1327 }, { "epoch": 0.13, "learning_rate": 1.9448704844721967e-05, "loss": 2.569, "step": 1328 }, { "epoch": 0.13, "learning_rate": 1.9447641753906214e-05, "loss": 2.4629, "step": 1329 }, { "epoch": 0.13, "learning_rate": 1.9446577668182928e-05, "loss": 2.412, "step": 1330 }, { "epoch": 0.13, "learning_rate": 1.944551258766417e-05, "loss": 2.45, "step": 1331 }, { "epoch": 0.13, "learning_rate": 1.9444446512462098e-05, "loss": 2.5064, "step": 1332 }, { "epoch": 0.13, "learning_rate": 1.944337944268898e-05, "loss": 2.3869, "step": 1333 }, { "epoch": 0.13, "learning_rate": 1.944231137845718e-05, "loss": 2.4126, "step": 1334 }, { "epoch": 0.13, "learning_rate": 1.944124231987918e-05, "loss": 2.4617, "step": 1335 }, { "epoch": 0.13, "learning_rate": 1.9440172267067558e-05, "loss": 2.4455, "step": 1336 }, { "epoch": 0.13, "learning_rate": 1.9439101220134997e-05, "loss": 2.4585, "step": 1337 }, { "epoch": 0.13, "learning_rate": 1.9438029179194287e-05, "loss": 2.3753, "step": 1338 }, { "epoch": 0.13, "learning_rate": 1.9436956144358324e-05, "loss": 2.5243, "step": 1339 }, { "epoch": 0.13, "learning_rate": 1.943588211574011e-05, "loss": 2.4974, "step": 1340 }, { "epoch": 0.13, "learning_rate": 1.9434807093452733e-05, "loss": 2.6153, "step": 1341 }, { "epoch": 0.13, "learning_rate": 1.943373107760942e-05, "loss": 2.5346, "step": 1342 }, { "epoch": 0.13, "learning_rate": 1.9432654068323472e-05, "loss": 2.4565, "step": 1343 }, { "epoch": 0.13, "learning_rate": 1.9431576065708306e-05, "loss": 2.4327, "step": 1344 }, { "epoch": 0.13, "learning_rate": 1.9430497069877448e-05, "loss": 2.4874, "step": 1345 }, { "epoch": 0.13, "learning_rate": 1.9429417080944526e-05, "loss": 2.4227, "step": 1346 }, { "epoch": 0.13, "learning_rate": 1.9428336099023264e-05, "loss": 2.5079, "step": 1347 }, { "epoch": 0.14, "learning_rate": 1.9427254124227506e-05, "loss": 2.5671, "step": 1348 }, { "epoch": 0.14, "learning_rate": 1.9426171156671183e-05, "loss": 2.3589, "step": 1349 }, { "epoch": 0.14, "learning_rate": 1.9425087196468346e-05, "loss": 2.4978, "step": 1350 }, { "epoch": 0.14, "learning_rate": 1.9424002243733142e-05, "loss": 2.536, "step": 1351 }, { "epoch": 0.14, "learning_rate": 1.9422916298579826e-05, "loss": 2.4745, "step": 1352 }, { "epoch": 0.14, "learning_rate": 1.9421829361122753e-05, "loss": 2.4297, "step": 1353 }, { "epoch": 0.14, "learning_rate": 1.9420741431476392e-05, "loss": 2.3748, "step": 1354 }, { "epoch": 0.14, "learning_rate": 1.94196525097553e-05, "loss": 2.4249, "step": 1355 }, { "epoch": 0.14, "learning_rate": 1.9418562596074158e-05, "loss": 2.3385, "step": 1356 }, { "epoch": 0.14, "learning_rate": 1.941747169054774e-05, "loss": 2.4146, "step": 1357 }, { "epoch": 0.14, "learning_rate": 1.941637979329092e-05, "loss": 2.4146, "step": 1358 }, { "epoch": 0.14, "learning_rate": 1.9415286904418696e-05, "loss": 2.4619, "step": 1359 }, { "epoch": 0.14, "learning_rate": 1.9414193024046143e-05, "loss": 2.5162, "step": 1360 }, { "epoch": 0.14, "learning_rate": 1.9413098152288464e-05, "loss": 2.4816, "step": 1361 }, { "epoch": 0.14, "learning_rate": 1.9412002289260954e-05, "loss": 2.5671, "step": 1362 }, { "epoch": 0.14, "learning_rate": 1.9410905435079017e-05, "loss": 2.2701, "step": 1363 }, { "epoch": 0.14, "learning_rate": 1.9409807589858157e-05, "loss": 2.4425, "step": 1364 }, { "epoch": 0.14, "learning_rate": 1.9408708753713987e-05, "loss": 2.4151, "step": 1365 }, { "epoch": 0.14, "learning_rate": 1.9407608926762226e-05, "loss": 2.4965, "step": 1366 }, { "epoch": 0.14, "learning_rate": 1.940650810911869e-05, "loss": 2.4212, "step": 1367 }, { "epoch": 0.14, "learning_rate": 1.9405406300899305e-05, "loss": 2.4982, "step": 1368 }, { "epoch": 0.14, "learning_rate": 1.94043035022201e-05, "loss": 2.4125, "step": 1369 }, { "epoch": 0.14, "learning_rate": 1.9403199713197203e-05, "loss": 2.5004, "step": 1370 }, { "epoch": 0.14, "learning_rate": 1.9402094933946858e-05, "loss": 2.306, "step": 1371 }, { "epoch": 0.14, "learning_rate": 1.9400989164585403e-05, "loss": 2.4442, "step": 1372 }, { "epoch": 0.14, "learning_rate": 1.9399882405229288e-05, "loss": 2.3791, "step": 1373 }, { "epoch": 0.14, "learning_rate": 1.9398774655995058e-05, "loss": 2.429, "step": 1374 }, { "epoch": 0.14, "learning_rate": 1.939766591699937e-05, "loss": 2.4058, "step": 1375 }, { "epoch": 0.14, "learning_rate": 1.939655618835898e-05, "loss": 2.4762, "step": 1376 }, { "epoch": 0.14, "learning_rate": 1.939544547019075e-05, "loss": 2.4178, "step": 1377 }, { "epoch": 0.14, "learning_rate": 1.9394333762611652e-05, "loss": 2.4465, "step": 1378 }, { "epoch": 0.14, "learning_rate": 1.9393221065738756e-05, "loss": 2.5346, "step": 1379 }, { "epoch": 0.14, "learning_rate": 1.9392107379689237e-05, "loss": 2.4143, "step": 1380 }, { "epoch": 0.14, "learning_rate": 1.939099270458037e-05, "loss": 2.5296, "step": 1381 }, { "epoch": 0.14, "learning_rate": 1.938987704052954e-05, "loss": 2.4663, "step": 1382 }, { "epoch": 0.14, "learning_rate": 1.938876038765424e-05, "loss": 2.4775, "step": 1383 }, { "epoch": 0.14, "learning_rate": 1.938764274607206e-05, "loss": 2.4213, "step": 1384 }, { "epoch": 0.14, "learning_rate": 1.938652411590069e-05, "loss": 2.4046, "step": 1385 }, { "epoch": 0.14, "learning_rate": 1.938540449725794e-05, "loss": 2.4842, "step": 1386 }, { "epoch": 0.14, "learning_rate": 1.9384283890261704e-05, "loss": 2.5001, "step": 1387 }, { "epoch": 0.14, "learning_rate": 1.9383162295030002e-05, "loss": 2.478, "step": 1388 }, { "epoch": 0.14, "learning_rate": 1.9382039711680936e-05, "loss": 2.3678, "step": 1389 }, { "epoch": 0.14, "learning_rate": 1.938091614033273e-05, "loss": 2.4531, "step": 1390 }, { "epoch": 0.14, "learning_rate": 1.9379791581103693e-05, "loss": 2.423, "step": 1391 }, { "epoch": 0.14, "learning_rate": 1.937866603411226e-05, "loss": 2.5304, "step": 1392 }, { "epoch": 0.14, "learning_rate": 1.937753949947696e-05, "loss": 2.4271, "step": 1393 }, { "epoch": 0.14, "learning_rate": 1.937641197731642e-05, "loss": 2.4135, "step": 1394 }, { "epoch": 0.14, "learning_rate": 1.9375283467749382e-05, "loss": 2.3935, "step": 1395 }, { "epoch": 0.14, "learning_rate": 1.9374153970894683e-05, "loss": 2.478, "step": 1396 }, { "epoch": 0.14, "learning_rate": 1.9373023486871264e-05, "loss": 2.3914, "step": 1397 }, { "epoch": 0.14, "learning_rate": 1.937189201579818e-05, "loss": 2.4724, "step": 1398 }, { "epoch": 0.14, "learning_rate": 1.937075955779458e-05, "loss": 2.3722, "step": 1399 }, { "epoch": 0.14, "learning_rate": 1.936962611297972e-05, "loss": 2.4136, "step": 1400 }, { "epoch": 0.14, "learning_rate": 1.9368491681472963e-05, "loss": 2.4832, "step": 1401 }, { "epoch": 0.14, "learning_rate": 1.9367356263393772e-05, "loss": 2.4454, "step": 1402 }, { "epoch": 0.14, "learning_rate": 1.936621985886171e-05, "loss": 2.4482, "step": 1403 }, { "epoch": 0.14, "learning_rate": 1.936508246799646e-05, "loss": 2.5189, "step": 1404 }, { "epoch": 0.14, "learning_rate": 1.936394409091779e-05, "loss": 2.6204, "step": 1405 }, { "epoch": 0.14, "learning_rate": 1.9362804727745576e-05, "loss": 2.4336, "step": 1406 }, { "epoch": 0.14, "learning_rate": 1.936166437859981e-05, "loss": 2.4185, "step": 1407 }, { "epoch": 0.14, "learning_rate": 1.9360523043600575e-05, "loss": 2.4344, "step": 1408 }, { "epoch": 0.14, "learning_rate": 1.9359380722868063e-05, "loss": 2.3658, "step": 1409 }, { "epoch": 0.14, "learning_rate": 1.9358237416522568e-05, "loss": 2.4998, "step": 1410 }, { "epoch": 0.14, "learning_rate": 1.935709312468449e-05, "loss": 2.3744, "step": 1411 }, { "epoch": 0.14, "learning_rate": 1.935594784747433e-05, "loss": 2.4152, "step": 1412 }, { "epoch": 0.14, "learning_rate": 1.9354801585012696e-05, "loss": 2.4609, "step": 1413 }, { "epoch": 0.14, "learning_rate": 1.93536543374203e-05, "loss": 2.5328, "step": 1414 }, { "epoch": 0.14, "learning_rate": 1.935250610481795e-05, "loss": 2.4698, "step": 1415 }, { "epoch": 0.14, "learning_rate": 1.9351356887326568e-05, "loss": 2.5174, "step": 1416 }, { "epoch": 0.14, "learning_rate": 1.935020668506717e-05, "loss": 2.4095, "step": 1417 }, { "epoch": 0.14, "learning_rate": 1.9349055498160887e-05, "loss": 2.3661, "step": 1418 }, { "epoch": 0.14, "learning_rate": 1.9347903326728946e-05, "loss": 2.4492, "step": 1419 }, { "epoch": 0.14, "learning_rate": 1.9346750170892677e-05, "loss": 2.4923, "step": 1420 }, { "epoch": 0.14, "learning_rate": 1.934559603077352e-05, "loss": 2.4688, "step": 1421 }, { "epoch": 0.14, "learning_rate": 1.934444090649301e-05, "loss": 2.4573, "step": 1422 }, { "epoch": 0.14, "learning_rate": 1.9343284798172798e-05, "loss": 2.5252, "step": 1423 }, { "epoch": 0.14, "learning_rate": 1.9342127705934615e-05, "loss": 2.4096, "step": 1424 }, { "epoch": 0.14, "learning_rate": 1.934096962990033e-05, "loss": 2.45, "step": 1425 }, { "epoch": 0.14, "learning_rate": 1.933981057019189e-05, "loss": 2.5102, "step": 1426 }, { "epoch": 0.14, "learning_rate": 1.9338650526931348e-05, "loss": 2.5056, "step": 1427 }, { "epoch": 0.14, "learning_rate": 1.9337489500240866e-05, "loss": 2.4208, "step": 1428 }, { "epoch": 0.14, "learning_rate": 1.9336327490242714e-05, "loss": 2.4539, "step": 1429 }, { "epoch": 0.14, "learning_rate": 1.933516449705926e-05, "loss": 2.4413, "step": 1430 }, { "epoch": 0.14, "learning_rate": 1.9334000520812975e-05, "loss": 2.4167, "step": 1431 }, { "epoch": 0.14, "learning_rate": 1.9332835561626427e-05, "loss": 2.4169, "step": 1432 }, { "epoch": 0.14, "learning_rate": 1.933166961962231e-05, "loss": 2.5061, "step": 1433 }, { "epoch": 0.14, "learning_rate": 1.933050269492339e-05, "loss": 2.4098, "step": 1434 }, { "epoch": 0.14, "learning_rate": 1.9329334787652564e-05, "loss": 2.4323, "step": 1435 }, { "epoch": 0.14, "learning_rate": 1.9328165897932817e-05, "loss": 2.5054, "step": 1436 }, { "epoch": 0.14, "learning_rate": 1.9326996025887243e-05, "loss": 2.391, "step": 1437 }, { "epoch": 0.14, "learning_rate": 1.932582517163904e-05, "loss": 2.4793, "step": 1438 }, { "epoch": 0.14, "learning_rate": 1.9324653335311504e-05, "loss": 2.5221, "step": 1439 }, { "epoch": 0.14, "learning_rate": 1.932348051702804e-05, "loss": 2.4173, "step": 1440 }, { "epoch": 0.14, "learning_rate": 1.9322306716912155e-05, "loss": 2.4168, "step": 1441 }, { "epoch": 0.14, "learning_rate": 1.9321131935087462e-05, "loss": 2.424, "step": 1442 }, { "epoch": 0.14, "learning_rate": 1.9319956171677665e-05, "loss": 2.4499, "step": 1443 }, { "epoch": 0.14, "learning_rate": 1.931877942680659e-05, "loss": 2.4275, "step": 1444 }, { "epoch": 0.14, "learning_rate": 1.9317601700598154e-05, "loss": 2.4932, "step": 1445 }, { "epoch": 0.14, "learning_rate": 1.931642299317638e-05, "loss": 2.4371, "step": 1446 }, { "epoch": 0.14, "learning_rate": 1.9315243304665393e-05, "loss": 2.5484, "step": 1447 }, { "epoch": 0.15, "learning_rate": 1.9314062635189426e-05, "loss": 2.4396, "step": 1448 }, { "epoch": 0.15, "learning_rate": 1.931288098487281e-05, "loss": 2.4903, "step": 1449 }, { "epoch": 0.15, "learning_rate": 1.9311698353839985e-05, "loss": 2.3733, "step": 1450 }, { "epoch": 0.15, "learning_rate": 1.931051474221549e-05, "loss": 2.4018, "step": 1451 }, { "epoch": 0.15, "learning_rate": 1.9309330150123963e-05, "loss": 2.4255, "step": 1452 }, { "epoch": 0.15, "learning_rate": 1.9308144577690154e-05, "loss": 2.4514, "step": 1453 }, { "epoch": 0.15, "learning_rate": 1.930695802503892e-05, "loss": 2.4932, "step": 1454 }, { "epoch": 0.15, "learning_rate": 1.93057704922952e-05, "loss": 2.4361, "step": 1455 }, { "epoch": 0.15, "learning_rate": 1.9304581979584062e-05, "loss": 2.329, "step": 1456 }, { "epoch": 0.15, "learning_rate": 1.9303392487030653e-05, "loss": 2.4493, "step": 1457 }, { "epoch": 0.15, "learning_rate": 1.930220201476025e-05, "loss": 2.3281, "step": 1458 }, { "epoch": 0.15, "learning_rate": 1.930101056289821e-05, "loss": 2.3846, "step": 1459 }, { "epoch": 0.15, "learning_rate": 1.929981813157e-05, "loss": 2.3887, "step": 1460 }, { "epoch": 0.15, "learning_rate": 1.92986247209012e-05, "loss": 2.4066, "step": 1461 }, { "epoch": 0.15, "learning_rate": 1.929743033101748e-05, "loss": 2.4554, "step": 1462 }, { "epoch": 0.15, "learning_rate": 1.9296234962044612e-05, "loss": 2.5204, "step": 1463 }, { "epoch": 0.15, "learning_rate": 1.929503861410849e-05, "loss": 2.4865, "step": 1464 }, { "epoch": 0.15, "learning_rate": 1.929384128733509e-05, "loss": 2.4719, "step": 1465 }, { "epoch": 0.15, "learning_rate": 1.9292642981850503e-05, "loss": 2.3992, "step": 1466 }, { "epoch": 0.15, "learning_rate": 1.9291443697780918e-05, "loss": 2.4836, "step": 1467 }, { "epoch": 0.15, "learning_rate": 1.929024343525263e-05, "loss": 2.4138, "step": 1468 }, { "epoch": 0.15, "learning_rate": 1.9289042194392035e-05, "loss": 2.4367, "step": 1469 }, { "epoch": 0.15, "learning_rate": 1.928783997532563e-05, "loss": 2.4874, "step": 1470 }, { "epoch": 0.15, "learning_rate": 1.9286636778180022e-05, "loss": 2.476, "step": 1471 }, { "epoch": 0.15, "learning_rate": 1.928543260308191e-05, "loss": 2.4274, "step": 1472 }, { "epoch": 0.15, "learning_rate": 1.9284227450158114e-05, "loss": 2.4164, "step": 1473 }, { "epoch": 0.15, "learning_rate": 1.9283021319535535e-05, "loss": 2.4387, "step": 1474 }, { "epoch": 0.15, "learning_rate": 1.9281814211341192e-05, "loss": 2.4854, "step": 1475 }, { "epoch": 0.15, "learning_rate": 1.9280606125702203e-05, "loss": 2.4941, "step": 1476 }, { "epoch": 0.15, "learning_rate": 1.9279397062745787e-05, "loss": 2.3646, "step": 1477 }, { "epoch": 0.15, "learning_rate": 1.9278187022599265e-05, "loss": 2.4642, "step": 1478 }, { "epoch": 0.15, "learning_rate": 1.9276976005390073e-05, "loss": 2.5066, "step": 1479 }, { "epoch": 0.15, "learning_rate": 1.927576401124573e-05, "loss": 2.4832, "step": 1480 }, { "epoch": 0.15, "learning_rate": 1.927455104029387e-05, "loss": 2.4543, "step": 1481 }, { "epoch": 0.15, "learning_rate": 1.927333709266223e-05, "loss": 2.3746, "step": 1482 }, { "epoch": 0.15, "learning_rate": 1.927212216847865e-05, "loss": 2.481, "step": 1483 }, { "epoch": 0.15, "learning_rate": 1.9270906267871065e-05, "loss": 2.4906, "step": 1484 }, { "epoch": 0.15, "learning_rate": 1.9269689390967524e-05, "loss": 2.4888, "step": 1485 }, { "epoch": 0.15, "learning_rate": 1.9268471537896168e-05, "loss": 2.4216, "step": 1486 }, { "epoch": 0.15, "learning_rate": 1.926725270878525e-05, "loss": 2.3652, "step": 1487 }, { "epoch": 0.15, "learning_rate": 1.926603290376312e-05, "loss": 2.3469, "step": 1488 }, { "epoch": 0.15, "learning_rate": 1.9264812122958235e-05, "loss": 2.4322, "step": 1489 }, { "epoch": 0.15, "learning_rate": 1.9263590366499148e-05, "loss": 2.3966, "step": 1490 }, { "epoch": 0.15, "learning_rate": 1.9262367634514522e-05, "loss": 2.3743, "step": 1491 }, { "epoch": 0.15, "learning_rate": 1.9261143927133118e-05, "loss": 2.4755, "step": 1492 }, { "epoch": 0.15, "learning_rate": 1.925991924448381e-05, "loss": 2.4513, "step": 1493 }, { "epoch": 0.15, "learning_rate": 1.925869358669555e-05, "loss": 2.5018, "step": 1494 }, { "epoch": 0.15, "learning_rate": 1.9257466953897426e-05, "loss": 2.4792, "step": 1495 }, { "epoch": 0.15, "learning_rate": 1.92562393462186e-05, "loss": 2.3069, "step": 1496 }, { "epoch": 0.15, "learning_rate": 1.9255010763788354e-05, "loss": 2.3735, "step": 1497 }, { "epoch": 0.15, "learning_rate": 1.9253781206736063e-05, "loss": 2.4273, "step": 1498 }, { "epoch": 0.15, "learning_rate": 1.9252550675191212e-05, "loss": 2.4324, "step": 1499 }, { "epoch": 0.15, "learning_rate": 1.9251319169283382e-05, "loss": 2.3619, "step": 1500 }, { "epoch": 0.15, "learning_rate": 1.9250086689142264e-05, "loss": 2.3993, "step": 1501 }, { "epoch": 0.15, "learning_rate": 1.9248853234897645e-05, "loss": 2.3815, "step": 1502 }, { "epoch": 0.15, "learning_rate": 1.9247618806679418e-05, "loss": 2.4922, "step": 1503 }, { "epoch": 0.15, "learning_rate": 1.9246383404617576e-05, "loss": 2.4143, "step": 1504 }, { "epoch": 0.15, "learning_rate": 1.9245147028842216e-05, "loss": 2.4619, "step": 1505 }, { "epoch": 0.15, "learning_rate": 1.924390967948354e-05, "loss": 2.4666, "step": 1506 }, { "epoch": 0.15, "learning_rate": 1.9242671356671847e-05, "loss": 2.3947, "step": 1507 }, { "epoch": 0.15, "learning_rate": 1.9241432060537542e-05, "loss": 2.4614, "step": 1508 }, { "epoch": 0.15, "learning_rate": 1.9240191791211136e-05, "loss": 2.5123, "step": 1509 }, { "epoch": 0.15, "learning_rate": 1.9238950548823234e-05, "loss": 2.3706, "step": 1510 }, { "epoch": 0.15, "learning_rate": 1.923770833350455e-05, "loss": 2.5126, "step": 1511 }, { "epoch": 0.15, "learning_rate": 1.9236465145385903e-05, "loss": 2.3594, "step": 1512 }, { "epoch": 0.15, "learning_rate": 1.9235220984598203e-05, "loss": 2.4721, "step": 1513 }, { "epoch": 0.15, "learning_rate": 1.923397585127247e-05, "loss": 2.4404, "step": 1514 }, { "epoch": 0.15, "learning_rate": 1.9232729745539832e-05, "loss": 2.3406, "step": 1515 }, { "epoch": 0.15, "learning_rate": 1.923148266753151e-05, "loss": 2.553, "step": 1516 }, { "epoch": 0.15, "learning_rate": 1.9230234617378826e-05, "loss": 2.3678, "step": 1517 }, { "epoch": 0.15, "learning_rate": 1.9228985595213214e-05, "loss": 2.4187, "step": 1518 }, { "epoch": 0.15, "learning_rate": 1.9227735601166206e-05, "loss": 2.4497, "step": 1519 }, { "epoch": 0.15, "learning_rate": 1.9226484635369435e-05, "loss": 2.3558, "step": 1520 }, { "epoch": 0.15, "learning_rate": 1.9225232697954635e-05, "loss": 2.4807, "step": 1521 }, { "epoch": 0.15, "learning_rate": 1.9223979789053647e-05, "loss": 2.5239, "step": 1522 }, { "epoch": 0.15, "learning_rate": 1.922272590879841e-05, "loss": 2.4425, "step": 1523 }, { "epoch": 0.15, "learning_rate": 1.922147105732097e-05, "loss": 2.5259, "step": 1524 }, { "epoch": 0.15, "learning_rate": 1.9220215234753464e-05, "loss": 2.4919, "step": 1525 }, { "epoch": 0.15, "learning_rate": 1.921895844122815e-05, "loss": 2.5031, "step": 1526 }, { "epoch": 0.15, "learning_rate": 1.921770067687737e-05, "loss": 2.4446, "step": 1527 }, { "epoch": 0.15, "learning_rate": 1.9216441941833583e-05, "loss": 2.4694, "step": 1528 }, { "epoch": 0.15, "learning_rate": 1.9215182236229336e-05, "loss": 2.4059, "step": 1529 }, { "epoch": 0.15, "learning_rate": 1.921392156019729e-05, "loss": 2.5019, "step": 1530 }, { "epoch": 0.15, "learning_rate": 1.92126599138702e-05, "loss": 2.4705, "step": 1531 }, { "epoch": 0.15, "learning_rate": 1.9211397297380934e-05, "loss": 2.4331, "step": 1532 }, { "epoch": 0.15, "learning_rate": 1.9210133710862448e-05, "loss": 2.5117, "step": 1533 }, { "epoch": 0.15, "learning_rate": 1.9208869154447808e-05, "loss": 2.4504, "step": 1534 }, { "epoch": 0.15, "learning_rate": 1.9207603628270185e-05, "loss": 2.459, "step": 1535 }, { "epoch": 0.15, "learning_rate": 1.9206337132462845e-05, "loss": 2.3384, "step": 1536 }, { "epoch": 0.15, "learning_rate": 1.920506966715916e-05, "loss": 2.4133, "step": 1537 }, { "epoch": 0.15, "learning_rate": 1.9203801232492604e-05, "loss": 2.3286, "step": 1538 }, { "epoch": 0.15, "learning_rate": 1.9202531828596756e-05, "loss": 2.4188, "step": 1539 }, { "epoch": 0.15, "learning_rate": 1.920126145560529e-05, "loss": 2.4483, "step": 1540 }, { "epoch": 0.15, "learning_rate": 1.9199990113651982e-05, "loss": 2.3709, "step": 1541 }, { "epoch": 0.15, "learning_rate": 1.9198717802870722e-05, "loss": 2.5394, "step": 1542 }, { "epoch": 0.15, "learning_rate": 1.919744452339549e-05, "loss": 2.4809, "step": 1543 }, { "epoch": 0.15, "learning_rate": 1.9196170275360368e-05, "loss": 2.3849, "step": 1544 }, { "epoch": 0.15, "learning_rate": 1.9194895058899555e-05, "loss": 2.4997, "step": 1545 }, { "epoch": 0.15, "learning_rate": 1.9193618874147327e-05, "loss": 2.3728, "step": 1546 }, { "epoch": 0.15, "learning_rate": 1.9192341721238087e-05, "loss": 2.4638, "step": 1547 }, { "epoch": 0.16, "learning_rate": 1.9191063600306323e-05, "loss": 2.3845, "step": 1548 }, { "epoch": 0.16, "learning_rate": 1.9189784511486632e-05, "loss": 2.4049, "step": 1549 }, { "epoch": 0.16, "learning_rate": 1.918850445491371e-05, "loss": 2.4627, "step": 1550 }, { "epoch": 0.16, "learning_rate": 1.918722343072236e-05, "loss": 2.4434, "step": 1551 }, { "epoch": 0.16, "learning_rate": 1.918594143904748e-05, "loss": 2.4135, "step": 1552 }, { "epoch": 0.16, "learning_rate": 1.9184658480024076e-05, "loss": 2.4184, "step": 1553 }, { "epoch": 0.16, "learning_rate": 1.9183374553787253e-05, "loss": 2.532, "step": 1554 }, { "epoch": 0.16, "learning_rate": 1.9182089660472217e-05, "loss": 2.5064, "step": 1555 }, { "epoch": 0.16, "learning_rate": 1.9180803800214274e-05, "loss": 2.396, "step": 1556 }, { "epoch": 0.16, "learning_rate": 1.9179516973148844e-05, "loss": 2.4145, "step": 1557 }, { "epoch": 0.16, "learning_rate": 1.917822917941143e-05, "loss": 2.4457, "step": 1558 }, { "epoch": 0.16, "learning_rate": 1.917694041913765e-05, "loss": 2.4456, "step": 1559 }, { "epoch": 0.16, "learning_rate": 1.917565069246322e-05, "loss": 2.4696, "step": 1560 }, { "epoch": 0.16, "learning_rate": 1.917435999952396e-05, "loss": 2.4053, "step": 1561 }, { "epoch": 0.16, "learning_rate": 1.9173068340455786e-05, "loss": 2.4201, "step": 1562 }, { "epoch": 0.16, "learning_rate": 1.917177571539472e-05, "loss": 2.5288, "step": 1563 }, { "epoch": 0.16, "learning_rate": 1.9170482124476885e-05, "loss": 2.4737, "step": 1564 }, { "epoch": 0.16, "learning_rate": 1.9169187567838508e-05, "loss": 2.4935, "step": 1565 }, { "epoch": 0.16, "learning_rate": 1.9167892045615914e-05, "loss": 2.49, "step": 1566 }, { "epoch": 0.16, "learning_rate": 1.9166595557945532e-05, "loss": 2.4005, "step": 1567 }, { "epoch": 0.16, "learning_rate": 1.9165298104963895e-05, "loss": 2.404, "step": 1568 }, { "epoch": 0.16, "learning_rate": 1.9163999686807624e-05, "loss": 2.413, "step": 1569 }, { "epoch": 0.16, "learning_rate": 1.9162700303613463e-05, "loss": 2.359, "step": 1570 }, { "epoch": 0.16, "learning_rate": 1.9161399955518244e-05, "loss": 2.4287, "step": 1571 }, { "epoch": 0.16, "learning_rate": 1.91600986426589e-05, "loss": 2.4264, "step": 1572 }, { "epoch": 0.16, "learning_rate": 1.9158796365172474e-05, "loss": 2.3426, "step": 1573 }, { "epoch": 0.16, "learning_rate": 1.91574931231961e-05, "loss": 2.3553, "step": 1574 }, { "epoch": 0.16, "learning_rate": 1.915618891686702e-05, "loss": 2.4273, "step": 1575 }, { "epoch": 0.16, "learning_rate": 1.9154883746322585e-05, "loss": 2.3828, "step": 1576 }, { "epoch": 0.16, "learning_rate": 1.9153577611700228e-05, "loss": 2.379, "step": 1577 }, { "epoch": 0.16, "learning_rate": 1.9152270513137507e-05, "loss": 2.4628, "step": 1578 }, { "epoch": 0.16, "learning_rate": 1.9150962450772055e-05, "loss": 2.4972, "step": 1579 }, { "epoch": 0.16, "learning_rate": 1.9149653424741628e-05, "loss": 2.4865, "step": 1580 }, { "epoch": 0.16, "learning_rate": 1.9148343435184077e-05, "loss": 2.4303, "step": 1581 }, { "epoch": 0.16, "learning_rate": 1.9147032482237354e-05, "loss": 2.3784, "step": 1582 }, { "epoch": 0.16, "learning_rate": 1.914572056603951e-05, "loss": 2.3558, "step": 1583 }, { "epoch": 0.16, "learning_rate": 1.9144407686728704e-05, "loss": 2.3888, "step": 1584 }, { "epoch": 0.16, "learning_rate": 1.9143093844443182e-05, "loss": 2.4502, "step": 1585 }, { "epoch": 0.16, "learning_rate": 1.9141779039321312e-05, "loss": 2.4858, "step": 1586 }, { "epoch": 0.16, "learning_rate": 1.914046327150155e-05, "loss": 2.4207, "step": 1587 }, { "epoch": 0.16, "learning_rate": 1.9139146541122455e-05, "loss": 2.4718, "step": 1588 }, { "epoch": 0.16, "learning_rate": 1.913782884832269e-05, "loss": 2.5083, "step": 1589 }, { "epoch": 0.16, "learning_rate": 1.9136510193241012e-05, "loss": 2.4906, "step": 1590 }, { "epoch": 0.16, "learning_rate": 1.9135190576016294e-05, "loss": 2.3876, "step": 1591 }, { "epoch": 0.16, "learning_rate": 1.9133869996787493e-05, "loss": 2.3844, "step": 1592 }, { "epoch": 0.16, "learning_rate": 1.9132548455693685e-05, "loss": 2.4311, "step": 1593 }, { "epoch": 0.16, "learning_rate": 1.913122595287403e-05, "loss": 2.4823, "step": 1594 }, { "epoch": 0.16, "learning_rate": 1.9129902488467804e-05, "loss": 2.5619, "step": 1595 }, { "epoch": 0.16, "learning_rate": 1.9128578062614375e-05, "loss": 2.4615, "step": 1596 }, { "epoch": 0.16, "learning_rate": 1.912725267545321e-05, "loss": 2.4802, "step": 1597 }, { "epoch": 0.16, "learning_rate": 1.9125926327123894e-05, "loss": 2.4058, "step": 1598 }, { "epoch": 0.16, "learning_rate": 1.912459901776609e-05, "loss": 2.3761, "step": 1599 }, { "epoch": 0.16, "learning_rate": 1.912327074751958e-05, "loss": 2.489, "step": 1600 }, { "epoch": 0.16, "learning_rate": 1.9121941516524235e-05, "loss": 2.4185, "step": 1601 }, { "epoch": 0.16, "learning_rate": 1.912061132492004e-05, "loss": 2.3356, "step": 1602 }, { "epoch": 0.16, "learning_rate": 1.911928017284707e-05, "loss": 2.3656, "step": 1603 }, { "epoch": 0.16, "learning_rate": 1.911794806044551e-05, "loss": 2.4615, "step": 1604 }, { "epoch": 0.16, "learning_rate": 1.9116614987855638e-05, "loss": 2.3658, "step": 1605 }, { "epoch": 0.16, "learning_rate": 1.9115280955217833e-05, "loss": 2.6181, "step": 1606 }, { "epoch": 0.16, "learning_rate": 1.911394596267258e-05, "loss": 2.5073, "step": 1607 }, { "epoch": 0.16, "learning_rate": 1.9112610010360468e-05, "loss": 2.3605, "step": 1608 }, { "epoch": 0.16, "learning_rate": 1.911127309842218e-05, "loss": 2.4181, "step": 1609 }, { "epoch": 0.16, "learning_rate": 1.9109935226998505e-05, "loss": 2.308, "step": 1610 }, { "epoch": 0.16, "learning_rate": 1.9108596396230328e-05, "loss": 2.4504, "step": 1611 }, { "epoch": 0.16, "learning_rate": 1.9107256606258637e-05, "loss": 2.4032, "step": 1612 }, { "epoch": 0.16, "learning_rate": 1.9105915857224526e-05, "loss": 2.3446, "step": 1613 }, { "epoch": 0.16, "learning_rate": 1.9104574149269183e-05, "loss": 2.4893, "step": 1614 }, { "epoch": 0.16, "learning_rate": 1.9103231482533903e-05, "loss": 2.4437, "step": 1615 }, { "epoch": 0.16, "learning_rate": 1.910188785716008e-05, "loss": 2.3964, "step": 1616 }, { "epoch": 0.16, "learning_rate": 1.9100543273289196e-05, "loss": 2.431, "step": 1617 }, { "epoch": 0.16, "learning_rate": 1.9099197731062858e-05, "loss": 2.3865, "step": 1618 }, { "epoch": 0.16, "learning_rate": 1.909785123062276e-05, "loss": 2.4247, "step": 1619 }, { "epoch": 0.16, "learning_rate": 1.9096503772110692e-05, "loss": 2.3946, "step": 1620 }, { "epoch": 0.16, "learning_rate": 1.9095155355668562e-05, "loss": 2.4816, "step": 1621 }, { "epoch": 0.16, "learning_rate": 1.909380598143836e-05, "loss": 2.4268, "step": 1622 }, { "epoch": 0.16, "learning_rate": 1.909245564956219e-05, "loss": 2.5004, "step": 1623 }, { "epoch": 0.16, "learning_rate": 1.9091104360182243e-05, "loss": 2.5218, "step": 1624 }, { "epoch": 0.16, "learning_rate": 1.9089752113440832e-05, "loss": 2.4586, "step": 1625 }, { "epoch": 0.16, "learning_rate": 1.9088398909480353e-05, "loss": 2.5042, "step": 1626 }, { "epoch": 0.16, "learning_rate": 1.908704474844331e-05, "loss": 2.4406, "step": 1627 }, { "epoch": 0.16, "learning_rate": 1.90856896304723e-05, "loss": 2.4438, "step": 1628 }, { "epoch": 0.16, "learning_rate": 1.9084333555710036e-05, "loss": 2.4074, "step": 1629 }, { "epoch": 0.16, "learning_rate": 1.908297652429932e-05, "loss": 2.3791, "step": 1630 }, { "epoch": 0.16, "learning_rate": 1.9081618536383058e-05, "loss": 2.3643, "step": 1631 }, { "epoch": 0.16, "learning_rate": 1.9080259592104252e-05, "loss": 2.4731, "step": 1632 }, { "epoch": 0.16, "learning_rate": 1.907889969160601e-05, "loss": 2.5004, "step": 1633 }, { "epoch": 0.16, "learning_rate": 1.907753883503155e-05, "loss": 2.5587, "step": 1634 }, { "epoch": 0.16, "learning_rate": 1.9076177022524164e-05, "loss": 2.4191, "step": 1635 }, { "epoch": 0.16, "learning_rate": 1.9074814254227273e-05, "loss": 2.4259, "step": 1636 }, { "epoch": 0.16, "learning_rate": 1.9073450530284383e-05, "loss": 2.4694, "step": 1637 }, { "epoch": 0.16, "learning_rate": 1.9072085850839102e-05, "loss": 2.4268, "step": 1638 }, { "epoch": 0.16, "learning_rate": 1.9070720216035145e-05, "loss": 2.406, "step": 1639 }, { "epoch": 0.16, "learning_rate": 1.9069353626016324e-05, "loss": 2.435, "step": 1640 }, { "epoch": 0.16, "learning_rate": 1.9067986080926547e-05, "loss": 2.3947, "step": 1641 }, { "epoch": 0.16, "learning_rate": 1.906661758090983e-05, "loss": 2.4758, "step": 1642 }, { "epoch": 0.16, "learning_rate": 1.9065248126110287e-05, "loss": 2.509, "step": 1643 }, { "epoch": 0.16, "learning_rate": 1.9063877716672126e-05, "loss": 2.3851, "step": 1644 }, { "epoch": 0.16, "learning_rate": 1.9062506352739663e-05, "loss": 2.3918, "step": 1645 }, { "epoch": 0.16, "learning_rate": 1.9061134034457323e-05, "loss": 2.4098, "step": 1646 }, { "epoch": 0.17, "learning_rate": 1.9059760761969607e-05, "loss": 2.4507, "step": 1647 }, { "epoch": 0.17, "learning_rate": 1.9058386535421143e-05, "loss": 2.441, "step": 1648 }, { "epoch": 0.17, "learning_rate": 1.9057011354956638e-05, "loss": 2.3421, "step": 1649 }, { "epoch": 0.17, "learning_rate": 1.9055635220720916e-05, "loss": 2.4105, "step": 1650 }, { "epoch": 0.17, "learning_rate": 1.905425813285889e-05, "loss": 2.4983, "step": 1651 }, { "epoch": 0.17, "learning_rate": 1.905288009151558e-05, "loss": 2.4828, "step": 1652 }, { "epoch": 0.17, "learning_rate": 1.9051501096836098e-05, "loss": 2.4436, "step": 1653 }, { "epoch": 0.17, "learning_rate": 1.9050121148965672e-05, "loss": 2.4313, "step": 1654 }, { "epoch": 0.17, "learning_rate": 1.9048740248049616e-05, "loss": 2.3279, "step": 1655 }, { "epoch": 0.17, "learning_rate": 1.9047358394233347e-05, "loss": 2.3785, "step": 1656 }, { "epoch": 0.17, "learning_rate": 1.9045975587662387e-05, "loss": 2.4961, "step": 1657 }, { "epoch": 0.17, "learning_rate": 1.904459182848236e-05, "loss": 2.4825, "step": 1658 }, { "epoch": 0.17, "learning_rate": 1.9043207116838976e-05, "loss": 2.4491, "step": 1659 }, { "epoch": 0.17, "learning_rate": 1.9041821452878066e-05, "loss": 2.4004, "step": 1660 }, { "epoch": 0.17, "learning_rate": 1.9040434836745544e-05, "loss": 2.4575, "step": 1661 }, { "epoch": 0.17, "learning_rate": 1.903904726858744e-05, "loss": 2.4459, "step": 1662 }, { "epoch": 0.17, "learning_rate": 1.903765874854986e-05, "loss": 2.5409, "step": 1663 }, { "epoch": 0.17, "learning_rate": 1.903626927677904e-05, "loss": 2.5259, "step": 1664 }, { "epoch": 0.17, "learning_rate": 1.9034878853421293e-05, "loss": 2.4184, "step": 1665 }, { "epoch": 0.17, "learning_rate": 1.9033487478623046e-05, "loss": 2.5051, "step": 1666 }, { "epoch": 0.17, "learning_rate": 1.903209515253082e-05, "loss": 2.5018, "step": 1667 }, { "epoch": 0.17, "learning_rate": 1.9030701875291237e-05, "loss": 2.3643, "step": 1668 }, { "epoch": 0.17, "learning_rate": 1.9029307647051016e-05, "loss": 2.4509, "step": 1669 }, { "epoch": 0.17, "learning_rate": 1.9027912467956983e-05, "loss": 2.4959, "step": 1670 }, { "epoch": 0.17, "learning_rate": 1.9026516338156066e-05, "loss": 2.3932, "step": 1671 }, { "epoch": 0.17, "learning_rate": 1.9025119257795278e-05, "loss": 2.4754, "step": 1672 }, { "epoch": 0.17, "learning_rate": 1.902372122702175e-05, "loss": 2.4311, "step": 1673 }, { "epoch": 0.17, "learning_rate": 1.90223222459827e-05, "loss": 2.3683, "step": 1674 }, { "epoch": 0.17, "learning_rate": 1.9020922314825453e-05, "loss": 2.4338, "step": 1675 }, { "epoch": 0.17, "learning_rate": 1.9019521433697434e-05, "loss": 2.3405, "step": 1676 }, { "epoch": 0.17, "learning_rate": 1.9018119602746164e-05, "loss": 2.3084, "step": 1677 }, { "epoch": 0.17, "learning_rate": 1.9016716822119266e-05, "loss": 2.3801, "step": 1678 }, { "epoch": 0.17, "learning_rate": 1.9015313091964467e-05, "loss": 2.4195, "step": 1679 }, { "epoch": 0.17, "learning_rate": 1.9013908412429584e-05, "loss": 2.362, "step": 1680 }, { "epoch": 0.17, "learning_rate": 1.9012502783662547e-05, "loss": 2.4336, "step": 1681 }, { "epoch": 0.17, "learning_rate": 1.901109620581138e-05, "loss": 2.5038, "step": 1682 }, { "epoch": 0.17, "learning_rate": 1.900968867902419e-05, "loss": 2.314, "step": 1683 }, { "epoch": 0.17, "learning_rate": 1.9008280203449224e-05, "loss": 2.3403, "step": 1684 }, { "epoch": 0.17, "learning_rate": 1.900687077923479e-05, "loss": 2.4452, "step": 1685 }, { "epoch": 0.17, "learning_rate": 1.9005460406529313e-05, "loss": 2.4741, "step": 1686 }, { "epoch": 0.17, "learning_rate": 1.900404908548132e-05, "loss": 2.389, "step": 1687 }, { "epoch": 0.17, "learning_rate": 1.9002636816239425e-05, "loss": 2.4795, "step": 1688 }, { "epoch": 0.17, "learning_rate": 1.9001223598952362e-05, "loss": 2.4137, "step": 1689 }, { "epoch": 0.17, "learning_rate": 1.899980943376895e-05, "loss": 2.4784, "step": 1690 }, { "epoch": 0.17, "learning_rate": 1.8998394320838104e-05, "loss": 2.4727, "step": 1691 }, { "epoch": 0.17, "learning_rate": 1.8996978260308855e-05, "loss": 2.4235, "step": 1692 }, { "epoch": 0.17, "learning_rate": 1.8995561252330317e-05, "loss": 2.457, "step": 1693 }, { "epoch": 0.17, "learning_rate": 1.899414329705172e-05, "loss": 2.4309, "step": 1694 }, { "epoch": 0.17, "learning_rate": 1.8992724394622378e-05, "loss": 2.3741, "step": 1695 }, { "epoch": 0.17, "learning_rate": 1.8991304545191713e-05, "loss": 2.3663, "step": 1696 }, { "epoch": 0.17, "learning_rate": 1.8989883748909252e-05, "loss": 2.474, "step": 1697 }, { "epoch": 0.17, "learning_rate": 1.8988462005924608e-05, "loss": 2.4612, "step": 1698 }, { "epoch": 0.17, "learning_rate": 1.8987039316387507e-05, "loss": 2.4448, "step": 1699 }, { "epoch": 0.17, "learning_rate": 1.898561568044776e-05, "loss": 2.3579, "step": 1700 }, { "epoch": 0.17, "learning_rate": 1.89841910982553e-05, "loss": 2.406, "step": 1701 }, { "epoch": 0.17, "learning_rate": 1.8982765569960137e-05, "loss": 2.4399, "step": 1702 }, { "epoch": 0.17, "learning_rate": 1.898133909571239e-05, "loss": 2.3756, "step": 1703 }, { "epoch": 0.17, "learning_rate": 1.8979911675662283e-05, "loss": 2.4475, "step": 1704 }, { "epoch": 0.17, "learning_rate": 1.8978483309960128e-05, "loss": 2.4669, "step": 1705 }, { "epoch": 0.17, "learning_rate": 1.897705399875634e-05, "loss": 2.4621, "step": 1706 }, { "epoch": 0.17, "learning_rate": 1.897562374220145e-05, "loss": 2.4589, "step": 1707 }, { "epoch": 0.17, "learning_rate": 1.8974192540446062e-05, "loss": 2.4674, "step": 1708 }, { "epoch": 0.17, "learning_rate": 1.8972760393640893e-05, "loss": 2.3614, "step": 1709 }, { "epoch": 0.17, "learning_rate": 1.8971327301936766e-05, "loss": 2.3888, "step": 1710 }, { "epoch": 0.17, "learning_rate": 1.896989326548459e-05, "loss": 2.3639, "step": 1711 }, { "epoch": 0.17, "learning_rate": 1.8968458284435386e-05, "loss": 2.425, "step": 1712 }, { "epoch": 0.17, "learning_rate": 1.896702235894026e-05, "loss": 2.4107, "step": 1713 }, { "epoch": 0.17, "learning_rate": 1.896558548915043e-05, "loss": 2.4456, "step": 1714 }, { "epoch": 0.17, "learning_rate": 1.8964147675217212e-05, "loss": 2.4296, "step": 1715 }, { "epoch": 0.17, "learning_rate": 1.8962708917292012e-05, "loss": 2.4286, "step": 1716 }, { "epoch": 0.17, "learning_rate": 1.896126921552635e-05, "loss": 2.5279, "step": 1717 }, { "epoch": 0.17, "learning_rate": 1.895982857007183e-05, "loss": 2.5279, "step": 1718 }, { "epoch": 0.17, "learning_rate": 1.8958386981080166e-05, "loss": 2.4763, "step": 1719 }, { "epoch": 0.17, "learning_rate": 1.895694444870317e-05, "loss": 2.4184, "step": 1720 }, { "epoch": 0.17, "learning_rate": 1.895550097309275e-05, "loss": 2.4731, "step": 1721 }, { "epoch": 0.17, "learning_rate": 1.895405655440091e-05, "loss": 2.482, "step": 1722 }, { "epoch": 0.17, "learning_rate": 1.8952611192779768e-05, "loss": 2.4745, "step": 1723 }, { "epoch": 0.17, "learning_rate": 1.8951164888381522e-05, "loss": 2.4266, "step": 1724 }, { "epoch": 0.17, "learning_rate": 1.8949717641358486e-05, "loss": 2.3483, "step": 1725 }, { "epoch": 0.17, "learning_rate": 1.894826945186306e-05, "loss": 2.4104, "step": 1726 }, { "epoch": 0.17, "learning_rate": 1.894682032004775e-05, "loss": 2.4037, "step": 1727 }, { "epoch": 0.17, "learning_rate": 1.8945370246065166e-05, "loss": 2.443, "step": 1728 }, { "epoch": 0.17, "learning_rate": 1.8943919230068008e-05, "loss": 2.3443, "step": 1729 }, { "epoch": 0.17, "learning_rate": 1.8942467272209074e-05, "loss": 2.4703, "step": 1730 }, { "epoch": 0.17, "learning_rate": 1.8941014372641275e-05, "loss": 2.4041, "step": 1731 }, { "epoch": 0.17, "learning_rate": 1.8939560531517607e-05, "loss": 2.3888, "step": 1732 }, { "epoch": 0.17, "learning_rate": 1.8938105748991172e-05, "loss": 2.3819, "step": 1733 }, { "epoch": 0.17, "learning_rate": 1.8936650025215166e-05, "loss": 2.4109, "step": 1734 }, { "epoch": 0.17, "learning_rate": 1.893519336034289e-05, "loss": 2.4015, "step": 1735 }, { "epoch": 0.17, "learning_rate": 1.8933735754527748e-05, "loss": 2.4913, "step": 1736 }, { "epoch": 0.17, "learning_rate": 1.893227720792323e-05, "loss": 2.3133, "step": 1737 }, { "epoch": 0.17, "learning_rate": 1.8930817720682928e-05, "loss": 2.3462, "step": 1738 }, { "epoch": 0.17, "learning_rate": 1.8929357292960546e-05, "loss": 2.5119, "step": 1739 }, { "epoch": 0.17, "learning_rate": 1.8927895924909873e-05, "loss": 2.3989, "step": 1740 }, { "epoch": 0.17, "learning_rate": 1.89264336166848e-05, "loss": 2.4147, "step": 1741 }, { "epoch": 0.17, "learning_rate": 1.8924970368439326e-05, "loss": 2.5147, "step": 1742 }, { "epoch": 0.17, "learning_rate": 1.8923506180327537e-05, "loss": 2.4732, "step": 1743 }, { "epoch": 0.17, "learning_rate": 1.8922041052503623e-05, "loss": 2.4347, "step": 1744 }, { "epoch": 0.17, "learning_rate": 1.8920574985121874e-05, "loss": 2.4049, "step": 1745 }, { "epoch": 0.17, "learning_rate": 1.891910797833668e-05, "loss": 2.4835, "step": 1746 }, { "epoch": 0.18, "learning_rate": 1.8917640032302522e-05, "loss": 2.3457, "step": 1747 }, { "epoch": 0.18, "learning_rate": 1.891617114717399e-05, "loss": 2.5503, "step": 1748 }, { "epoch": 0.18, "learning_rate": 1.891470132310577e-05, "loss": 2.4038, "step": 1749 }, { "epoch": 0.18, "learning_rate": 1.8913230560252646e-05, "loss": 2.4228, "step": 1750 }, { "epoch": 0.18, "learning_rate": 1.8911758858769493e-05, "loss": 2.4396, "step": 1751 }, { "epoch": 0.18, "learning_rate": 1.8910286218811296e-05, "loss": 2.3767, "step": 1752 }, { "epoch": 0.18, "learning_rate": 1.890881264053314e-05, "loss": 2.3927, "step": 1753 }, { "epoch": 0.18, "learning_rate": 1.8907338124090196e-05, "loss": 2.3655, "step": 1754 }, { "epoch": 0.18, "learning_rate": 1.890586266963775e-05, "loss": 2.3843, "step": 1755 }, { "epoch": 0.18, "learning_rate": 1.8904386277331174e-05, "loss": 2.3798, "step": 1756 }, { "epoch": 0.18, "learning_rate": 1.890290894732594e-05, "loss": 2.44, "step": 1757 }, { "epoch": 0.18, "learning_rate": 1.8901430679777625e-05, "loss": 2.4684, "step": 1758 }, { "epoch": 0.18, "learning_rate": 1.88999514748419e-05, "loss": 2.5021, "step": 1759 }, { "epoch": 0.18, "learning_rate": 1.8898471332674544e-05, "loss": 2.5017, "step": 1760 }, { "epoch": 0.18, "learning_rate": 1.889699025343142e-05, "loss": 2.474, "step": 1761 }, { "epoch": 0.18, "learning_rate": 1.8895508237268495e-05, "loss": 2.464, "step": 1762 }, { "epoch": 0.18, "learning_rate": 1.8894025284341843e-05, "loss": 2.5239, "step": 1763 }, { "epoch": 0.18, "learning_rate": 1.889254139480762e-05, "loss": 2.4716, "step": 1764 }, { "epoch": 0.18, "learning_rate": 1.8891056568822105e-05, "loss": 2.4612, "step": 1765 }, { "epoch": 0.18, "learning_rate": 1.888957080654165e-05, "loss": 2.4436, "step": 1766 }, { "epoch": 0.18, "learning_rate": 1.8888084108122715e-05, "loss": 2.436, "step": 1767 }, { "epoch": 0.18, "learning_rate": 1.8886596473721874e-05, "loss": 2.3637, "step": 1768 }, { "epoch": 0.18, "learning_rate": 1.8885107903495773e-05, "loss": 2.5061, "step": 1769 }, { "epoch": 0.18, "learning_rate": 1.8883618397601174e-05, "loss": 2.3796, "step": 1770 }, { "epoch": 0.18, "learning_rate": 1.888212795619494e-05, "loss": 2.4423, "step": 1771 }, { "epoch": 0.18, "learning_rate": 1.888063657943401e-05, "loss": 2.4475, "step": 1772 }, { "epoch": 0.18, "learning_rate": 1.8879144267475455e-05, "loss": 2.4174, "step": 1773 }, { "epoch": 0.18, "learning_rate": 1.887765102047641e-05, "loss": 2.5537, "step": 1774 }, { "epoch": 0.18, "learning_rate": 1.887615683859414e-05, "loss": 2.4414, "step": 1775 }, { "epoch": 0.18, "learning_rate": 1.8874661721985986e-05, "loss": 2.5469, "step": 1776 }, { "epoch": 0.18, "learning_rate": 1.887316567080939e-05, "loss": 2.4448, "step": 1777 }, { "epoch": 0.18, "learning_rate": 1.887166868522191e-05, "loss": 2.4896, "step": 1778 }, { "epoch": 0.18, "learning_rate": 1.887017076538118e-05, "loss": 2.426, "step": 1779 }, { "epoch": 0.18, "learning_rate": 1.8868671911444946e-05, "loss": 2.3108, "step": 1780 }, { "epoch": 0.18, "learning_rate": 1.8867172123571046e-05, "loss": 2.4228, "step": 1781 }, { "epoch": 0.18, "learning_rate": 1.8865671401917423e-05, "loss": 2.3977, "step": 1782 }, { "epoch": 0.18, "learning_rate": 1.8864169746642108e-05, "loss": 2.396, "step": 1783 }, { "epoch": 0.18, "learning_rate": 1.8862667157903246e-05, "loss": 2.4295, "step": 1784 }, { "epoch": 0.18, "learning_rate": 1.886116363585906e-05, "loss": 2.4568, "step": 1785 }, { "epoch": 0.18, "learning_rate": 1.8859659180667892e-05, "loss": 2.3852, "step": 1786 }, { "epoch": 0.18, "learning_rate": 1.8858153792488162e-05, "loss": 2.4048, "step": 1787 }, { "epoch": 0.18, "learning_rate": 1.885664747147841e-05, "loss": 2.3729, "step": 1788 }, { "epoch": 0.18, "learning_rate": 1.8855140217797254e-05, "loss": 2.3105, "step": 1789 }, { "epoch": 0.18, "learning_rate": 1.8853632031603425e-05, "loss": 2.4009, "step": 1790 }, { "epoch": 0.18, "learning_rate": 1.8852122913055742e-05, "loss": 2.4834, "step": 1791 }, { "epoch": 0.18, "learning_rate": 1.885061286231313e-05, "loss": 2.457, "step": 1792 }, { "epoch": 0.18, "learning_rate": 1.8849101879534606e-05, "loss": 2.3384, "step": 1793 }, { "epoch": 0.18, "learning_rate": 1.8847589964879288e-05, "loss": 2.4396, "step": 1794 }, { "epoch": 0.18, "learning_rate": 1.8846077118506397e-05, "loss": 2.4117, "step": 1795 }, { "epoch": 0.18, "learning_rate": 1.884456334057524e-05, "loss": 2.5053, "step": 1796 }, { "epoch": 0.18, "learning_rate": 1.884304863124523e-05, "loss": 2.4371, "step": 1797 }, { "epoch": 0.18, "learning_rate": 1.884153299067588e-05, "loss": 2.4308, "step": 1798 }, { "epoch": 0.18, "learning_rate": 1.8840016419026802e-05, "loss": 2.561, "step": 1799 }, { "epoch": 0.18, "learning_rate": 1.8838498916457693e-05, "loss": 2.4189, "step": 1800 }, { "epoch": 0.18, "learning_rate": 1.8836980483128363e-05, "loss": 2.4191, "step": 1801 }, { "epoch": 0.18, "learning_rate": 1.8835461119198718e-05, "loss": 2.4646, "step": 1802 }, { "epoch": 0.18, "learning_rate": 1.883394082482875e-05, "loss": 2.4484, "step": 1803 }, { "epoch": 0.18, "learning_rate": 1.8832419600178562e-05, "loss": 2.3067, "step": 1804 }, { "epoch": 0.18, "learning_rate": 1.883089744540835e-05, "loss": 2.3853, "step": 1805 }, { "epoch": 0.18, "learning_rate": 1.8829374360678408e-05, "loss": 2.4505, "step": 1806 }, { "epoch": 0.18, "learning_rate": 1.882785034614913e-05, "loss": 2.4402, "step": 1807 }, { "epoch": 0.18, "learning_rate": 1.8826325401981008e-05, "loss": 2.385, "step": 1808 }, { "epoch": 0.18, "learning_rate": 1.882479952833462e-05, "loss": 2.4622, "step": 1809 }, { "epoch": 0.18, "learning_rate": 1.8823272725370664e-05, "loss": 2.4134, "step": 1810 }, { "epoch": 0.18, "learning_rate": 1.8821744993249913e-05, "loss": 2.4141, "step": 1811 }, { "epoch": 0.18, "learning_rate": 1.8820216332133257e-05, "loss": 2.467, "step": 1812 }, { "epoch": 0.18, "learning_rate": 1.8818686742181674e-05, "loss": 2.4619, "step": 1813 }, { "epoch": 0.18, "learning_rate": 1.881715622355624e-05, "loss": 2.5041, "step": 1814 }, { "epoch": 0.18, "learning_rate": 1.8815624776418127e-05, "loss": 2.3606, "step": 1815 }, { "epoch": 0.18, "learning_rate": 1.8814092400928614e-05, "loss": 2.5231, "step": 1816 }, { "epoch": 0.18, "learning_rate": 1.8812559097249067e-05, "loss": 2.516, "step": 1817 }, { "epoch": 0.18, "learning_rate": 1.8811024865540958e-05, "loss": 2.4158, "step": 1818 }, { "epoch": 0.18, "learning_rate": 1.8809489705965847e-05, "loss": 2.5241, "step": 1819 }, { "epoch": 0.18, "learning_rate": 1.8807953618685402e-05, "loss": 2.3558, "step": 1820 }, { "epoch": 0.18, "learning_rate": 1.8806416603861386e-05, "loss": 2.4414, "step": 1821 }, { "epoch": 0.18, "learning_rate": 1.880487866165566e-05, "loss": 2.3573, "step": 1822 }, { "epoch": 0.18, "learning_rate": 1.8803339792230173e-05, "loss": 2.4303, "step": 1823 }, { "epoch": 0.18, "learning_rate": 1.8801799995746983e-05, "loss": 2.4288, "step": 1824 }, { "epoch": 0.18, "learning_rate": 1.8800259272368247e-05, "loss": 2.4001, "step": 1825 }, { "epoch": 0.18, "learning_rate": 1.8798717622256207e-05, "loss": 2.4559, "step": 1826 }, { "epoch": 0.18, "learning_rate": 1.8797175045573214e-05, "loss": 2.4204, "step": 1827 }, { "epoch": 0.18, "learning_rate": 1.8795631542481717e-05, "loss": 2.3629, "step": 1828 }, { "epoch": 0.18, "learning_rate": 1.879408711314425e-05, "loss": 2.4632, "step": 1829 }, { "epoch": 0.18, "learning_rate": 1.879254175772346e-05, "loss": 2.3843, "step": 1830 }, { "epoch": 0.18, "learning_rate": 1.879099547638208e-05, "loss": 2.375, "step": 1831 }, { "epoch": 0.18, "learning_rate": 1.878944826928295e-05, "loss": 2.5341, "step": 1832 }, { "epoch": 0.18, "learning_rate": 1.8787900136588996e-05, "loss": 2.4223, "step": 1833 }, { "epoch": 0.18, "learning_rate": 1.8786351078463253e-05, "loss": 2.5019, "step": 1834 }, { "epoch": 0.18, "learning_rate": 1.8784801095068846e-05, "loss": 2.4657, "step": 1835 }, { "epoch": 0.18, "learning_rate": 1.8783250186569e-05, "loss": 2.4727, "step": 1836 }, { "epoch": 0.18, "learning_rate": 1.8781698353127038e-05, "loss": 2.4139, "step": 1837 }, { "epoch": 0.18, "learning_rate": 1.8780145594906384e-05, "loss": 2.4393, "step": 1838 }, { "epoch": 0.18, "learning_rate": 1.8778591912070545e-05, "loss": 2.3578, "step": 1839 }, { "epoch": 0.18, "learning_rate": 1.8777037304783144e-05, "loss": 2.4398, "step": 1840 }, { "epoch": 0.18, "learning_rate": 1.8775481773207888e-05, "loss": 2.4173, "step": 1841 }, { "epoch": 0.18, "learning_rate": 1.877392531750859e-05, "loss": 2.4234, "step": 1842 }, { "epoch": 0.18, "learning_rate": 1.8772367937849157e-05, "loss": 2.3445, "step": 1843 }, { "epoch": 0.18, "learning_rate": 1.8770809634393587e-05, "loss": 2.4703, "step": 1844 }, { "epoch": 0.18, "learning_rate": 1.8769250407305984e-05, "loss": 2.4371, "step": 1845 }, { "epoch": 0.18, "learning_rate": 1.876769025675055e-05, "loss": 2.3492, "step": 1846 }, { "epoch": 0.19, "learning_rate": 1.8766129182891573e-05, "loss": 2.3111, "step": 1847 }, { "epoch": 0.19, "learning_rate": 1.8764567185893455e-05, "loss": 2.4435, "step": 1848 }, { "epoch": 0.19, "learning_rate": 1.8763004265920675e-05, "loss": 2.4128, "step": 1849 }, { "epoch": 0.19, "learning_rate": 1.8761440423137832e-05, "loss": 2.4395, "step": 1850 }, { "epoch": 0.19, "learning_rate": 1.8759875657709603e-05, "loss": 2.4108, "step": 1851 }, { "epoch": 0.19, "learning_rate": 1.875830996980077e-05, "loss": 2.4104, "step": 1852 }, { "epoch": 0.19, "learning_rate": 1.8756743359576213e-05, "loss": 2.5289, "step": 1853 }, { "epoch": 0.19, "learning_rate": 1.875517582720091e-05, "loss": 2.4733, "step": 1854 }, { "epoch": 0.19, "learning_rate": 1.8753607372839928e-05, "loss": 2.4213, "step": 1855 }, { "epoch": 0.19, "learning_rate": 1.8752037996658445e-05, "loss": 2.3996, "step": 1856 }, { "epoch": 0.19, "learning_rate": 1.8750467698821717e-05, "loss": 2.3678, "step": 1857 }, { "epoch": 0.19, "learning_rate": 1.874889647949512e-05, "loss": 2.3301, "step": 1858 }, { "epoch": 0.19, "learning_rate": 1.8747324338844107e-05, "loss": 2.4277, "step": 1859 }, { "epoch": 0.19, "learning_rate": 1.874575127703424e-05, "loss": 2.4375, "step": 1860 }, { "epoch": 0.19, "learning_rate": 1.8744177294231175e-05, "loss": 2.4402, "step": 1861 }, { "epoch": 0.19, "learning_rate": 1.8742602390600663e-05, "loss": 2.372, "step": 1862 }, { "epoch": 0.19, "learning_rate": 1.874102656630855e-05, "loss": 2.3335, "step": 1863 }, { "epoch": 0.19, "learning_rate": 1.873944982152079e-05, "loss": 2.3824, "step": 1864 }, { "epoch": 0.19, "learning_rate": 1.8737872156403413e-05, "loss": 2.3621, "step": 1865 }, { "epoch": 0.19, "learning_rate": 1.8736293571122573e-05, "loss": 2.4854, "step": 1866 }, { "epoch": 0.19, "learning_rate": 1.8734714065844496e-05, "loss": 2.5154, "step": 1867 }, { "epoch": 0.19, "learning_rate": 1.8733133640735527e-05, "loss": 2.4652, "step": 1868 }, { "epoch": 0.19, "learning_rate": 1.8731552295962084e-05, "loss": 2.4705, "step": 1869 }, { "epoch": 0.19, "learning_rate": 1.8729970031690704e-05, "loss": 2.3672, "step": 1870 }, { "epoch": 0.19, "learning_rate": 1.8728386848088008e-05, "loss": 2.3995, "step": 1871 }, { "epoch": 0.19, "learning_rate": 1.8726802745320713e-05, "loss": 2.3434, "step": 1872 }, { "epoch": 0.19, "learning_rate": 1.8725217723555643e-05, "loss": 2.4279, "step": 1873 }, { "epoch": 0.19, "learning_rate": 1.8723631782959716e-05, "loss": 2.3381, "step": 1874 }, { "epoch": 0.19, "learning_rate": 1.872204492369993e-05, "loss": 2.4334, "step": 1875 }, { "epoch": 0.19, "learning_rate": 1.8720457145943405e-05, "loss": 2.3874, "step": 1876 }, { "epoch": 0.19, "learning_rate": 1.8718868449857342e-05, "loss": 2.3665, "step": 1877 }, { "epoch": 0.19, "learning_rate": 1.8717278835609042e-05, "loss": 2.4818, "step": 1878 }, { "epoch": 0.19, "learning_rate": 1.8715688303365905e-05, "loss": 2.3736, "step": 1879 }, { "epoch": 0.19, "learning_rate": 1.8714096853295424e-05, "loss": 2.4773, "step": 1880 }, { "epoch": 0.19, "learning_rate": 1.871250448556519e-05, "loss": 2.3786, "step": 1881 }, { "epoch": 0.19, "learning_rate": 1.8710911200342897e-05, "loss": 2.478, "step": 1882 }, { "epoch": 0.19, "learning_rate": 1.8709316997796322e-05, "loss": 2.5123, "step": 1883 }, { "epoch": 0.19, "learning_rate": 1.8707721878093352e-05, "loss": 2.4149, "step": 1884 }, { "epoch": 0.19, "learning_rate": 1.8706125841401962e-05, "loss": 2.4775, "step": 1885 }, { "epoch": 0.19, "learning_rate": 1.8704528887890232e-05, "loss": 2.4421, "step": 1886 }, { "epoch": 0.19, "learning_rate": 1.8702931017726324e-05, "loss": 2.3801, "step": 1887 }, { "epoch": 0.19, "learning_rate": 1.8701332231078514e-05, "loss": 2.3903, "step": 1888 }, { "epoch": 0.19, "learning_rate": 1.8699732528115164e-05, "loss": 2.418, "step": 1889 }, { "epoch": 0.19, "learning_rate": 1.869813190900473e-05, "loss": 2.4445, "step": 1890 }, { "epoch": 0.19, "learning_rate": 1.8696530373915774e-05, "loss": 2.3958, "step": 1891 }, { "epoch": 0.19, "learning_rate": 1.869492792301695e-05, "loss": 2.4716, "step": 1892 }, { "epoch": 0.19, "learning_rate": 1.8693324556477006e-05, "loss": 2.367, "step": 1893 }, { "epoch": 0.19, "learning_rate": 1.8691720274464788e-05, "loss": 2.3937, "step": 1894 }, { "epoch": 0.19, "learning_rate": 1.869011507714924e-05, "loss": 2.4408, "step": 1895 }, { "epoch": 0.19, "learning_rate": 1.8688508964699404e-05, "loss": 2.4545, "step": 1896 }, { "epoch": 0.19, "learning_rate": 1.868690193728441e-05, "loss": 2.4978, "step": 1897 }, { "epoch": 0.19, "learning_rate": 1.8685293995073496e-05, "loss": 2.4157, "step": 1898 }, { "epoch": 0.19, "learning_rate": 1.8683685138235988e-05, "loss": 2.3688, "step": 1899 }, { "epoch": 0.19, "learning_rate": 1.868207536694131e-05, "loss": 2.4123, "step": 1900 }, { "epoch": 0.19, "learning_rate": 1.868046468135898e-05, "loss": 2.4161, "step": 1901 }, { "epoch": 0.19, "learning_rate": 1.867885308165862e-05, "loss": 2.4268, "step": 1902 }, { "epoch": 0.19, "learning_rate": 1.8677240568009944e-05, "loss": 2.3897, "step": 1903 }, { "epoch": 0.19, "learning_rate": 1.8675627140582758e-05, "loss": 2.3802, "step": 1904 }, { "epoch": 0.19, "learning_rate": 1.8674012799546973e-05, "loss": 2.4366, "step": 1905 }, { "epoch": 0.19, "learning_rate": 1.8672397545072586e-05, "loss": 2.4747, "step": 1906 }, { "epoch": 0.19, "learning_rate": 1.8670781377329697e-05, "loss": 2.4042, "step": 1907 }, { "epoch": 0.19, "learning_rate": 1.8669164296488503e-05, "loss": 2.4332, "step": 1908 }, { "epoch": 0.19, "learning_rate": 1.866754630271929e-05, "loss": 2.3717, "step": 1909 }, { "epoch": 0.19, "learning_rate": 1.866592739619245e-05, "loss": 2.456, "step": 1910 }, { "epoch": 0.19, "learning_rate": 1.866430757707846e-05, "loss": 2.4477, "step": 1911 }, { "epoch": 0.19, "learning_rate": 1.8662686845547907e-05, "loss": 2.398, "step": 1912 }, { "epoch": 0.19, "learning_rate": 1.866106520177146e-05, "loss": 2.4449, "step": 1913 }, { "epoch": 0.19, "learning_rate": 1.8659442645919893e-05, "loss": 2.4177, "step": 1914 }, { "epoch": 0.19, "learning_rate": 1.865781917816407e-05, "loss": 2.4108, "step": 1915 }, { "epoch": 0.19, "learning_rate": 1.865619479867496e-05, "loss": 2.514, "step": 1916 }, { "epoch": 0.19, "learning_rate": 1.8654569507623618e-05, "loss": 2.4688, "step": 1917 }, { "epoch": 0.19, "learning_rate": 1.86529433051812e-05, "loss": 2.4667, "step": 1918 }, { "epoch": 0.19, "learning_rate": 1.8651316191518956e-05, "loss": 2.5058, "step": 1919 }, { "epoch": 0.19, "learning_rate": 1.864968816680824e-05, "loss": 2.4891, "step": 1920 }, { "epoch": 0.19, "learning_rate": 1.864805923122049e-05, "loss": 2.4215, "step": 1921 }, { "epoch": 0.19, "learning_rate": 1.864642938492724e-05, "loss": 2.4521, "step": 1922 }, { "epoch": 0.19, "learning_rate": 1.8644798628100137e-05, "loss": 2.3452, "step": 1923 }, { "epoch": 0.19, "learning_rate": 1.8643166960910898e-05, "loss": 2.431, "step": 1924 }, { "epoch": 0.19, "learning_rate": 1.8641534383531362e-05, "loss": 2.4498, "step": 1925 }, { "epoch": 0.19, "learning_rate": 1.8639900896133446e-05, "loss": 2.3692, "step": 1926 }, { "epoch": 0.19, "learning_rate": 1.863826649888917e-05, "loss": 2.3669, "step": 1927 }, { "epoch": 0.19, "learning_rate": 1.8636631191970648e-05, "loss": 2.4435, "step": 1928 }, { "epoch": 0.19, "learning_rate": 1.863499497555009e-05, "loss": 2.3856, "step": 1929 }, { "epoch": 0.19, "learning_rate": 1.86333578497998e-05, "loss": 2.3965, "step": 1930 }, { "epoch": 0.19, "learning_rate": 1.8631719814892182e-05, "loss": 2.5371, "step": 1931 }, { "epoch": 0.19, "learning_rate": 1.8630080870999733e-05, "loss": 2.5377, "step": 1932 }, { "epoch": 0.19, "learning_rate": 1.8628441018295046e-05, "loss": 2.3979, "step": 1933 }, { "epoch": 0.19, "learning_rate": 1.8626800256950805e-05, "loss": 2.5603, "step": 1934 }, { "epoch": 0.19, "learning_rate": 1.86251585871398e-05, "loss": 2.3189, "step": 1935 }, { "epoch": 0.19, "learning_rate": 1.8623516009034913e-05, "loss": 2.4404, "step": 1936 }, { "epoch": 0.19, "learning_rate": 1.862187252280912e-05, "loss": 2.4607, "step": 1937 }, { "epoch": 0.19, "learning_rate": 1.8620228128635484e-05, "loss": 2.3836, "step": 1938 }, { "epoch": 0.19, "learning_rate": 1.8618582826687178e-05, "loss": 2.3981, "step": 1939 }, { "epoch": 0.19, "learning_rate": 1.8616936617137465e-05, "loss": 2.3627, "step": 1940 }, { "epoch": 0.19, "learning_rate": 1.8615289500159702e-05, "loss": 2.4513, "step": 1941 }, { "epoch": 0.19, "learning_rate": 1.861364147592734e-05, "loss": 2.4017, "step": 1942 }, { "epoch": 0.19, "learning_rate": 1.8611992544613934e-05, "loss": 2.4285, "step": 1943 }, { "epoch": 0.19, "learning_rate": 1.861034270639313e-05, "loss": 2.3516, "step": 1944 }, { "epoch": 0.19, "learning_rate": 1.8608691961438657e-05, "loss": 2.4854, "step": 1945 }, { "epoch": 0.19, "learning_rate": 1.8607040309924364e-05, "loss": 2.4193, "step": 1946 }, { "epoch": 0.2, "learning_rate": 1.8605387752024173e-05, "loss": 2.5058, "step": 1947 }, { "epoch": 0.2, "learning_rate": 1.8603734287912115e-05, "loss": 2.5023, "step": 1948 }, { "epoch": 0.2, "learning_rate": 1.860207991776231e-05, "loss": 2.4078, "step": 1949 }, { "epoch": 0.2, "learning_rate": 1.860042464174898e-05, "loss": 2.3911, "step": 1950 }, { "epoch": 0.2, "learning_rate": 1.859876846004643e-05, "loss": 2.4722, "step": 1951 }, { "epoch": 0.2, "learning_rate": 1.8597111372829082e-05, "loss": 2.3953, "step": 1952 }, { "epoch": 0.2, "learning_rate": 1.8595453380271423e-05, "loss": 2.4653, "step": 1953 }, { "epoch": 0.2, "learning_rate": 1.8593794482548065e-05, "loss": 2.453, "step": 1954 }, { "epoch": 0.2, "learning_rate": 1.8592134679833696e-05, "loss": 2.4434, "step": 1955 }, { "epoch": 0.2, "learning_rate": 1.8590473972303103e-05, "loss": 2.4627, "step": 1956 }, { "epoch": 0.2, "learning_rate": 1.8588812360131182e-05, "loss": 2.4089, "step": 1957 }, { "epoch": 0.2, "learning_rate": 1.8587149843492903e-05, "loss": 2.4541, "step": 1958 }, { "epoch": 0.2, "learning_rate": 1.8585486422563343e-05, "loss": 2.445, "step": 1959 }, { "epoch": 0.2, "learning_rate": 1.858382209751768e-05, "loss": 2.5008, "step": 1960 }, { "epoch": 0.2, "learning_rate": 1.8582156868531168e-05, "loss": 2.3845, "step": 1961 }, { "epoch": 0.2, "learning_rate": 1.8580490735779176e-05, "loss": 2.4422, "step": 1962 }, { "epoch": 0.2, "learning_rate": 1.8578823699437163e-05, "loss": 2.2985, "step": 1963 }, { "epoch": 0.2, "learning_rate": 1.8577155759680675e-05, "loss": 2.4032, "step": 1964 }, { "epoch": 0.2, "learning_rate": 1.8575486916685355e-05, "loss": 2.4438, "step": 1965 }, { "epoch": 0.2, "learning_rate": 1.8573817170626952e-05, "loss": 2.4658, "step": 1966 }, { "epoch": 0.2, "learning_rate": 1.85721465216813e-05, "loss": 2.535, "step": 1967 }, { "epoch": 0.2, "learning_rate": 1.8570474970024334e-05, "loss": 2.5403, "step": 1968 }, { "epoch": 0.2, "learning_rate": 1.8568802515832077e-05, "loss": 2.3704, "step": 1969 }, { "epoch": 0.2, "learning_rate": 1.856712915928065e-05, "loss": 2.379, "step": 1970 }, { "epoch": 0.2, "learning_rate": 1.856545490054627e-05, "loss": 2.4783, "step": 1971 }, { "epoch": 0.2, "learning_rate": 1.8563779739805253e-05, "loss": 2.4448, "step": 1972 }, { "epoch": 0.2, "learning_rate": 1.8562103677234007e-05, "loss": 2.4757, "step": 1973 }, { "epoch": 0.2, "learning_rate": 1.856042671300903e-05, "loss": 2.3384, "step": 1974 }, { "epoch": 0.2, "learning_rate": 1.855874884730692e-05, "loss": 2.3681, "step": 1975 }, { "epoch": 0.2, "learning_rate": 1.8557070080304365e-05, "loss": 2.506, "step": 1976 }, { "epoch": 0.2, "learning_rate": 1.855539041217816e-05, "loss": 2.4836, "step": 1977 }, { "epoch": 0.2, "learning_rate": 1.8553709843105177e-05, "loss": 2.2907, "step": 1978 }, { "epoch": 0.2, "learning_rate": 1.85520283732624e-05, "loss": 2.4494, "step": 1979 }, { "epoch": 0.2, "learning_rate": 1.8550346002826898e-05, "loss": 2.1928, "step": 1980 }, { "epoch": 0.2, "learning_rate": 1.8548662731975837e-05, "loss": 2.4886, "step": 1981 }, { "epoch": 0.2, "learning_rate": 1.8546978560886478e-05, "loss": 2.4552, "step": 1982 }, { "epoch": 0.2, "learning_rate": 1.854529348973618e-05, "loss": 2.3891, "step": 1983 }, { "epoch": 0.2, "learning_rate": 1.854360751870239e-05, "loss": 2.4576, "step": 1984 }, { "epoch": 0.2, "learning_rate": 1.854192064796265e-05, "loss": 2.407, "step": 1985 }, { "epoch": 0.2, "learning_rate": 1.854023287769461e-05, "loss": 2.448, "step": 1986 }, { "epoch": 0.2, "learning_rate": 1.8538544208075997e-05, "loss": 2.523, "step": 1987 }, { "epoch": 0.2, "learning_rate": 1.8536854639284642e-05, "loss": 2.4596, "step": 1988 }, { "epoch": 0.2, "learning_rate": 1.8535164171498466e-05, "loss": 2.3195, "step": 1989 }, { "epoch": 0.2, "learning_rate": 1.85334728048955e-05, "loss": 2.4388, "step": 1990 }, { "epoch": 0.2, "learning_rate": 1.8531780539653845e-05, "loss": 2.3964, "step": 1991 }, { "epoch": 0.2, "learning_rate": 1.8530087375951713e-05, "loss": 2.4234, "step": 1992 }, { "epoch": 0.2, "learning_rate": 1.8528393313967407e-05, "loss": 2.3513, "step": 1993 }, { "epoch": 0.2, "learning_rate": 1.8526698353879328e-05, "loss": 2.4938, "step": 1994 }, { "epoch": 0.2, "learning_rate": 1.8525002495865964e-05, "loss": 2.4963, "step": 1995 }, { "epoch": 0.2, "learning_rate": 1.8523305740105903e-05, "loss": 2.5195, "step": 1996 }, { "epoch": 0.2, "learning_rate": 1.852160808677783e-05, "loss": 2.4744, "step": 1997 }, { "epoch": 0.2, "learning_rate": 1.8519909536060508e-05, "loss": 2.5281, "step": 1998 }, { "epoch": 0.2, "learning_rate": 1.851821008813282e-05, "loss": 2.4829, "step": 1999 }, { "epoch": 0.2, "learning_rate": 1.8516509743173724e-05, "loss": 2.6168, "step": 2000 }, { "epoch": 0.2, "learning_rate": 1.851480850136228e-05, "loss": 2.5243, "step": 2001 }, { "epoch": 0.2, "learning_rate": 1.8513106362877646e-05, "loss": 2.4842, "step": 2002 }, { "epoch": 0.2, "learning_rate": 1.8511403327899063e-05, "loss": 2.468, "step": 2003 }, { "epoch": 0.2, "learning_rate": 1.8509699396605882e-05, "loss": 2.3894, "step": 2004 }, { "epoch": 0.2, "learning_rate": 1.850799456917753e-05, "loss": 2.4821, "step": 2005 }, { "epoch": 0.2, "learning_rate": 1.8506288845793545e-05, "loss": 2.4537, "step": 2006 }, { "epoch": 0.2, "learning_rate": 1.850458222663355e-05, "loss": 2.4287, "step": 2007 }, { "epoch": 0.2, "learning_rate": 1.8502874711877264e-05, "loss": 2.4149, "step": 2008 }, { "epoch": 0.2, "learning_rate": 1.8501166301704505e-05, "loss": 2.4135, "step": 2009 }, { "epoch": 0.2, "learning_rate": 1.8499456996295177e-05, "loss": 2.4853, "step": 2010 }, { "epoch": 0.2, "learning_rate": 1.8497746795829284e-05, "loss": 2.3177, "step": 2011 }, { "epoch": 0.2, "learning_rate": 1.8496035700486926e-05, "loss": 2.395, "step": 2012 }, { "epoch": 0.2, "learning_rate": 1.8494323710448284e-05, "loss": 2.4167, "step": 2013 }, { "epoch": 0.2, "learning_rate": 1.8492610825893658e-05, "loss": 2.4052, "step": 2014 }, { "epoch": 0.2, "learning_rate": 1.8490897047003418e-05, "loss": 2.5494, "step": 2015 }, { "epoch": 0.2, "learning_rate": 1.848918237395804e-05, "loss": 2.4267, "step": 2016 }, { "epoch": 0.2, "learning_rate": 1.8487466806938093e-05, "loss": 2.4507, "step": 2017 }, { "epoch": 0.2, "learning_rate": 1.8485750346124237e-05, "loss": 2.4253, "step": 2018 }, { "epoch": 0.2, "learning_rate": 1.848403299169723e-05, "loss": 2.5075, "step": 2019 }, { "epoch": 0.2, "learning_rate": 1.848231474383792e-05, "loss": 2.4997, "step": 2020 }, { "epoch": 0.2, "learning_rate": 1.8480595602727253e-05, "loss": 2.4229, "step": 2021 }, { "epoch": 0.2, "learning_rate": 1.847887556854627e-05, "loss": 2.3543, "step": 2022 }, { "epoch": 0.2, "learning_rate": 1.8477154641476097e-05, "loss": 2.3951, "step": 2023 }, { "epoch": 0.2, "learning_rate": 1.847543282169797e-05, "loss": 2.4874, "step": 2024 }, { "epoch": 0.2, "learning_rate": 1.84737101093932e-05, "loss": 2.5191, "step": 2025 }, { "epoch": 0.2, "learning_rate": 1.8471986504743203e-05, "loss": 2.4046, "step": 2026 }, { "epoch": 0.2, "learning_rate": 1.8470262007929497e-05, "loss": 2.4398, "step": 2027 }, { "epoch": 0.2, "learning_rate": 1.8468536619133674e-05, "loss": 2.4585, "step": 2028 }, { "epoch": 0.2, "learning_rate": 1.8466810338537434e-05, "loss": 2.4039, "step": 2029 }, { "epoch": 0.2, "learning_rate": 1.8465083166322567e-05, "loss": 2.417, "step": 2030 }, { "epoch": 0.2, "learning_rate": 1.8463355102670958e-05, "loss": 2.4189, "step": 2031 }, { "epoch": 0.2, "learning_rate": 1.8461626147764583e-05, "loss": 2.4271, "step": 2032 }, { "epoch": 0.2, "learning_rate": 1.8459896301785515e-05, "loss": 2.4747, "step": 2033 }, { "epoch": 0.2, "learning_rate": 1.8458165564915925e-05, "loss": 2.4785, "step": 2034 }, { "epoch": 0.2, "learning_rate": 1.8456433937338062e-05, "loss": 2.4407, "step": 2035 }, { "epoch": 0.2, "learning_rate": 1.845470141923429e-05, "loss": 2.3607, "step": 2036 }, { "epoch": 0.2, "learning_rate": 1.8452968010787046e-05, "loss": 2.4756, "step": 2037 }, { "epoch": 0.2, "learning_rate": 1.845123371217888e-05, "loss": 2.4444, "step": 2038 }, { "epoch": 0.2, "learning_rate": 1.8449498523592418e-05, "loss": 2.4906, "step": 2039 }, { "epoch": 0.2, "learning_rate": 1.8447762445210396e-05, "loss": 2.3546, "step": 2040 }, { "epoch": 0.2, "learning_rate": 1.8446025477215636e-05, "loss": 2.4518, "step": 2041 }, { "epoch": 0.2, "learning_rate": 1.8444287619791046e-05, "loss": 2.3452, "step": 2042 }, { "epoch": 0.2, "learning_rate": 1.8442548873119644e-05, "loss": 2.4843, "step": 2043 }, { "epoch": 0.2, "learning_rate": 1.844080923738453e-05, "loss": 2.4802, "step": 2044 }, { "epoch": 0.2, "learning_rate": 1.8439068712768898e-05, "loss": 2.5112, "step": 2045 }, { "epoch": 0.2, "learning_rate": 1.8437327299456038e-05, "loss": 2.4425, "step": 2046 }, { "epoch": 0.21, "learning_rate": 1.843558499762934e-05, "loss": 2.5832, "step": 2047 }, { "epoch": 0.21, "learning_rate": 1.8433841807472275e-05, "loss": 2.3656, "step": 2048 }, { "epoch": 0.21, "learning_rate": 1.8432097729168422e-05, "loss": 2.4173, "step": 2049 }, { "epoch": 0.21, "learning_rate": 1.8430352762901435e-05, "loss": 2.3957, "step": 2050 }, { "epoch": 0.21, "learning_rate": 1.842860690885508e-05, "loss": 2.4227, "step": 2051 }, { "epoch": 0.21, "learning_rate": 1.8426860167213206e-05, "loss": 2.3648, "step": 2052 }, { "epoch": 0.21, "learning_rate": 1.8425112538159754e-05, "loss": 2.3791, "step": 2053 }, { "epoch": 0.21, "learning_rate": 1.8423364021878768e-05, "loss": 2.409, "step": 2054 }, { "epoch": 0.21, "learning_rate": 1.842161461855438e-05, "loss": 2.4206, "step": 2055 }, { "epoch": 0.21, "learning_rate": 1.8419864328370812e-05, "loss": 2.4645, "step": 2056 }, { "epoch": 0.21, "learning_rate": 1.8418113151512386e-05, "loss": 2.436, "step": 2057 }, { "epoch": 0.21, "learning_rate": 1.841636108816351e-05, "loss": 2.4176, "step": 2058 }, { "epoch": 0.21, "learning_rate": 1.8414608138508694e-05, "loss": 2.3586, "step": 2059 }, { "epoch": 0.21, "learning_rate": 1.8412854302732532e-05, "loss": 2.408, "step": 2060 }, { "epoch": 0.21, "learning_rate": 1.841109958101972e-05, "loss": 2.3393, "step": 2061 }, { "epoch": 0.21, "learning_rate": 1.840934397355504e-05, "loss": 2.4738, "step": 2062 }, { "epoch": 0.21, "learning_rate": 1.840758748052337e-05, "loss": 2.4195, "step": 2063 }, { "epoch": 0.21, "learning_rate": 1.840583010210969e-05, "loss": 2.4028, "step": 2064 }, { "epoch": 0.21, "learning_rate": 1.840407183849906e-05, "loss": 2.5159, "step": 2065 }, { "epoch": 0.21, "learning_rate": 1.840231268987663e-05, "loss": 2.3706, "step": 2066 }, { "epoch": 0.21, "learning_rate": 1.8400552656427668e-05, "loss": 2.3859, "step": 2067 }, { "epoch": 0.21, "learning_rate": 1.8398791738337505e-05, "loss": 2.4998, "step": 2068 }, { "epoch": 0.21, "learning_rate": 1.8397029935791585e-05, "loss": 2.4718, "step": 2069 }, { "epoch": 0.21, "learning_rate": 1.8395267248975438e-05, "loss": 2.4721, "step": 2070 }, { "epoch": 0.21, "learning_rate": 1.8393503678074686e-05, "loss": 2.5032, "step": 2071 }, { "epoch": 0.21, "learning_rate": 1.839173922327505e-05, "loss": 2.454, "step": 2072 }, { "epoch": 0.21, "learning_rate": 1.838997388476234e-05, "loss": 2.4069, "step": 2073 }, { "epoch": 0.21, "learning_rate": 1.8388207662722454e-05, "loss": 2.3927, "step": 2074 }, { "epoch": 0.21, "learning_rate": 1.8386440557341398e-05, "loss": 2.3668, "step": 2075 }, { "epoch": 0.21, "learning_rate": 1.8384672568805254e-05, "loss": 2.3589, "step": 2076 }, { "epoch": 0.21, "learning_rate": 1.8382903697300204e-05, "loss": 2.3097, "step": 2077 }, { "epoch": 0.21, "learning_rate": 1.8381133943012527e-05, "loss": 2.3355, "step": 2078 }, { "epoch": 0.21, "learning_rate": 1.837936330612859e-05, "loss": 2.4164, "step": 2079 }, { "epoch": 0.21, "learning_rate": 1.8377591786834855e-05, "loss": 2.5103, "step": 2080 }, { "epoch": 0.21, "learning_rate": 1.8375819385317876e-05, "loss": 2.3466, "step": 2081 }, { "epoch": 0.21, "learning_rate": 1.8374046101764296e-05, "loss": 2.3387, "step": 2082 }, { "epoch": 0.21, "learning_rate": 1.8372271936360867e-05, "loss": 2.4275, "step": 2083 }, { "epoch": 0.21, "learning_rate": 1.8370496889294408e-05, "loss": 2.3973, "step": 2084 }, { "epoch": 0.21, "learning_rate": 1.8368720960751854e-05, "loss": 2.4289, "step": 2085 }, { "epoch": 0.21, "learning_rate": 1.836694415092022e-05, "loss": 2.4134, "step": 2086 }, { "epoch": 0.21, "learning_rate": 1.836516645998661e-05, "loss": 2.4889, "step": 2087 }, { "epoch": 0.21, "learning_rate": 1.8363387888138245e-05, "loss": 2.4159, "step": 2088 }, { "epoch": 0.21, "learning_rate": 1.836160843556241e-05, "loss": 2.4776, "step": 2089 }, { "epoch": 0.21, "learning_rate": 1.8359828102446497e-05, "loss": 2.431, "step": 2090 }, { "epoch": 0.21, "learning_rate": 1.835804688897799e-05, "loss": 2.4022, "step": 2091 }, { "epoch": 0.21, "learning_rate": 1.835626479534446e-05, "loss": 2.4324, "step": 2092 }, { "epoch": 0.21, "learning_rate": 1.835448182173358e-05, "loss": 2.4382, "step": 2093 }, { "epoch": 0.21, "learning_rate": 1.835269796833311e-05, "loss": 2.4019, "step": 2094 }, { "epoch": 0.21, "learning_rate": 1.83509132353309e-05, "loss": 2.3336, "step": 2095 }, { "epoch": 0.21, "learning_rate": 1.8349127622914898e-05, "loss": 2.4657, "step": 2096 }, { "epoch": 0.21, "learning_rate": 1.834734113127314e-05, "loss": 2.3579, "step": 2097 }, { "epoch": 0.21, "learning_rate": 1.834555376059376e-05, "loss": 2.3837, "step": 2098 }, { "epoch": 0.21, "learning_rate": 1.8343765511064982e-05, "loss": 2.4154, "step": 2099 }, { "epoch": 0.21, "learning_rate": 1.8341976382875117e-05, "loss": 2.3623, "step": 2100 }, { "epoch": 0.21, "learning_rate": 1.834018637621258e-05, "loss": 2.4305, "step": 2101 }, { "epoch": 0.21, "learning_rate": 1.8338395491265865e-05, "loss": 2.3165, "step": 2102 }, { "epoch": 0.21, "learning_rate": 1.833660372822357e-05, "loss": 2.462, "step": 2103 }, { "epoch": 0.21, "learning_rate": 1.8334811087274388e-05, "loss": 2.3853, "step": 2104 }, { "epoch": 0.21, "learning_rate": 1.833301756860708e-05, "loss": 2.3917, "step": 2105 }, { "epoch": 0.21, "learning_rate": 1.8331223172410535e-05, "loss": 2.4943, "step": 2106 }, { "epoch": 0.21, "learning_rate": 1.8329427898873706e-05, "loss": 2.3105, "step": 2107 }, { "epoch": 0.21, "learning_rate": 1.832763174818565e-05, "loss": 2.4474, "step": 2108 }, { "epoch": 0.21, "learning_rate": 1.8325834720535522e-05, "loss": 2.3747, "step": 2109 }, { "epoch": 0.21, "learning_rate": 1.832403681611255e-05, "loss": 2.5426, "step": 2110 }, { "epoch": 0.21, "learning_rate": 1.8322238035106076e-05, "loss": 2.4161, "step": 2111 }, { "epoch": 0.21, "learning_rate": 1.8320438377705522e-05, "loss": 2.4107, "step": 2112 }, { "epoch": 0.21, "learning_rate": 1.831863784410041e-05, "loss": 2.3932, "step": 2113 }, { "epoch": 0.21, "learning_rate": 1.8316836434480345e-05, "loss": 2.3904, "step": 2114 }, { "epoch": 0.21, "learning_rate": 1.831503414903503e-05, "loss": 2.4283, "step": 2115 }, { "epoch": 0.21, "learning_rate": 1.8313230987954257e-05, "loss": 2.4673, "step": 2116 }, { "epoch": 0.21, "learning_rate": 1.8311426951427918e-05, "loss": 2.4659, "step": 2117 }, { "epoch": 0.21, "learning_rate": 1.8309622039645982e-05, "loss": 2.3882, "step": 2118 }, { "epoch": 0.21, "learning_rate": 1.8307816252798533e-05, "loss": 2.3498, "step": 2119 }, { "epoch": 0.21, "learning_rate": 1.8306009591075723e-05, "loss": 2.4302, "step": 2120 }, { "epoch": 0.21, "learning_rate": 1.830420205466781e-05, "loss": 2.3731, "step": 2121 }, { "epoch": 0.21, "learning_rate": 1.8302393643765145e-05, "loss": 2.4598, "step": 2122 }, { "epoch": 0.21, "learning_rate": 1.8300584358558162e-05, "loss": 2.3772, "step": 2123 }, { "epoch": 0.21, "learning_rate": 1.8298774199237396e-05, "loss": 2.411, "step": 2124 }, { "epoch": 0.21, "learning_rate": 1.8296963165993467e-05, "loss": 2.4233, "step": 2125 }, { "epoch": 0.21, "learning_rate": 1.8295151259017095e-05, "loss": 2.3426, "step": 2126 }, { "epoch": 0.21, "learning_rate": 1.8293338478499084e-05, "loss": 2.5293, "step": 2127 }, { "epoch": 0.21, "learning_rate": 1.829152482463033e-05, "loss": 2.3955, "step": 2128 }, { "epoch": 0.21, "learning_rate": 1.828971029760183e-05, "loss": 2.3917, "step": 2129 }, { "epoch": 0.21, "learning_rate": 1.828789489760467e-05, "loss": 2.4279, "step": 2130 }, { "epoch": 0.21, "learning_rate": 1.8286078624830016e-05, "loss": 2.3497, "step": 2131 }, { "epoch": 0.21, "learning_rate": 1.8284261479469143e-05, "loss": 2.3964, "step": 2132 }, { "epoch": 0.21, "learning_rate": 1.8282443461713405e-05, "loss": 2.4438, "step": 2133 }, { "epoch": 0.21, "learning_rate": 1.8280624571754258e-05, "loss": 2.4814, "step": 2134 }, { "epoch": 0.21, "learning_rate": 1.827880480978324e-05, "loss": 2.46, "step": 2135 }, { "epoch": 0.21, "learning_rate": 1.8276984175991984e-05, "loss": 2.3785, "step": 2136 }, { "epoch": 0.21, "learning_rate": 1.8275162670572224e-05, "loss": 2.4696, "step": 2137 }, { "epoch": 0.21, "learning_rate": 1.8273340293715772e-05, "loss": 2.3809, "step": 2138 }, { "epoch": 0.21, "learning_rate": 1.827151704561454e-05, "loss": 2.3728, "step": 2139 }, { "epoch": 0.21, "learning_rate": 1.8269692926460528e-05, "loss": 2.3561, "step": 2140 }, { "epoch": 0.21, "learning_rate": 1.8267867936445835e-05, "loss": 2.437, "step": 2141 }, { "epoch": 0.21, "learning_rate": 1.826604207576264e-05, "loss": 2.4651, "step": 2142 }, { "epoch": 0.21, "learning_rate": 1.8264215344603223e-05, "loss": 2.3626, "step": 2143 }, { "epoch": 0.21, "learning_rate": 1.826238774315995e-05, "loss": 2.4165, "step": 2144 }, { "epoch": 0.21, "learning_rate": 1.8260559271625286e-05, "loss": 2.5295, "step": 2145 }, { "epoch": 0.22, "learning_rate": 1.8258729930191773e-05, "loss": 2.3787, "step": 2146 }, { "epoch": 0.22, "learning_rate": 1.8256899719052065e-05, "loss": 2.4106, "step": 2147 }, { "epoch": 0.22, "learning_rate": 1.8255068638398893e-05, "loss": 2.4984, "step": 2148 }, { "epoch": 0.22, "learning_rate": 1.825323668842508e-05, "loss": 2.4014, "step": 2149 }, { "epoch": 0.22, "learning_rate": 1.825140386932355e-05, "loss": 2.4614, "step": 2150 }, { "epoch": 0.22, "learning_rate": 1.8249570181287308e-05, "loss": 2.406, "step": 2151 }, { "epoch": 0.22, "learning_rate": 1.824773562450946e-05, "loss": 2.3927, "step": 2152 }, { "epoch": 0.22, "learning_rate": 1.8245900199183193e-05, "loss": 2.4555, "step": 2153 }, { "epoch": 0.22, "learning_rate": 1.824406390550179e-05, "loss": 2.3943, "step": 2154 }, { "epoch": 0.22, "learning_rate": 1.8242226743658638e-05, "loss": 2.3995, "step": 2155 }, { "epoch": 0.22, "learning_rate": 1.824038871384719e-05, "loss": 2.4531, "step": 2156 }, { "epoch": 0.22, "learning_rate": 1.8238549816261012e-05, "loss": 2.3754, "step": 2157 }, { "epoch": 0.22, "learning_rate": 1.8236710051093754e-05, "loss": 2.476, "step": 2158 }, { "epoch": 0.22, "learning_rate": 1.8234869418539155e-05, "loss": 2.3128, "step": 2159 }, { "epoch": 0.22, "learning_rate": 1.8233027918791048e-05, "loss": 2.454, "step": 2160 }, { "epoch": 0.22, "learning_rate": 1.823118555204335e-05, "loss": 2.3717, "step": 2161 }, { "epoch": 0.22, "learning_rate": 1.8229342318490087e-05, "loss": 2.4315, "step": 2162 }, { "epoch": 0.22, "learning_rate": 1.822749821832536e-05, "loss": 2.4309, "step": 2163 }, { "epoch": 0.22, "learning_rate": 1.8225653251743368e-05, "loss": 2.4139, "step": 2164 }, { "epoch": 0.22, "learning_rate": 1.82238074189384e-05, "loss": 2.47, "step": 2165 }, { "epoch": 0.22, "learning_rate": 1.8221960720104833e-05, "loss": 2.3656, "step": 2166 }, { "epoch": 0.22, "learning_rate": 1.8220113155437143e-05, "loss": 2.385, "step": 2167 }, { "epoch": 0.22, "learning_rate": 1.8218264725129886e-05, "loss": 2.3045, "step": 2168 }, { "epoch": 0.22, "learning_rate": 1.821641542937772e-05, "loss": 2.4303, "step": 2169 }, { "epoch": 0.22, "learning_rate": 1.821456526837539e-05, "loss": 2.4046, "step": 2170 }, { "epoch": 0.22, "learning_rate": 1.8212714242317733e-05, "loss": 2.4513, "step": 2171 }, { "epoch": 0.22, "learning_rate": 1.821086235139967e-05, "loss": 2.4077, "step": 2172 }, { "epoch": 0.22, "learning_rate": 1.8209009595816222e-05, "loss": 2.3321, "step": 2173 }, { "epoch": 0.22, "learning_rate": 1.82071559757625e-05, "loss": 2.4769, "step": 2174 }, { "epoch": 0.22, "learning_rate": 1.8205301491433706e-05, "loss": 2.3653, "step": 2175 }, { "epoch": 0.22, "learning_rate": 1.8203446143025127e-05, "loss": 2.5163, "step": 2176 }, { "epoch": 0.22, "learning_rate": 1.8201589930732144e-05, "loss": 2.4466, "step": 2177 }, { "epoch": 0.22, "learning_rate": 1.8199732854750233e-05, "loss": 2.6296, "step": 2178 }, { "epoch": 0.22, "learning_rate": 1.8197874915274956e-05, "loss": 2.4077, "step": 2179 }, { "epoch": 0.22, "learning_rate": 1.8196016112501975e-05, "loss": 2.3293, "step": 2180 }, { "epoch": 0.22, "learning_rate": 1.819415644662702e-05, "loss": 2.424, "step": 2181 }, { "epoch": 0.22, "learning_rate": 1.8192295917845947e-05, "loss": 2.4128, "step": 2182 }, { "epoch": 0.22, "learning_rate": 1.8190434526354667e-05, "loss": 2.4181, "step": 2183 }, { "epoch": 0.22, "learning_rate": 1.818857227234921e-05, "loss": 2.529, "step": 2184 }, { "epoch": 0.22, "learning_rate": 1.8186709156025683e-05, "loss": 2.49, "step": 2185 }, { "epoch": 0.22, "learning_rate": 1.818484517758028e-05, "loss": 2.4208, "step": 2186 }, { "epoch": 0.22, "learning_rate": 1.81829803372093e-05, "loss": 2.3942, "step": 2187 }, { "epoch": 0.22, "learning_rate": 1.8181114635109118e-05, "loss": 2.4265, "step": 2188 }, { "epoch": 0.22, "learning_rate": 1.8179248071476213e-05, "loss": 2.4752, "step": 2189 }, { "epoch": 0.22, "learning_rate": 1.817738064650714e-05, "loss": 2.511, "step": 2190 }, { "epoch": 0.22, "learning_rate": 1.8175512360398562e-05, "loss": 2.3616, "step": 2191 }, { "epoch": 0.22, "learning_rate": 1.8173643213347216e-05, "loss": 2.4696, "step": 2192 }, { "epoch": 0.22, "learning_rate": 1.817177320554994e-05, "loss": 2.5444, "step": 2193 }, { "epoch": 0.22, "learning_rate": 1.816990233720366e-05, "loss": 2.4107, "step": 2194 }, { "epoch": 0.22, "learning_rate": 1.816803060850539e-05, "loss": 2.5938, "step": 2195 }, { "epoch": 0.22, "learning_rate": 1.8166158019652246e-05, "loss": 2.4492, "step": 2196 }, { "epoch": 0.22, "learning_rate": 1.8164284570841417e-05, "loss": 2.4132, "step": 2197 }, { "epoch": 0.22, "learning_rate": 1.8162410262270188e-05, "loss": 2.3714, "step": 2198 }, { "epoch": 0.22, "learning_rate": 1.8160535094135948e-05, "loss": 2.3738, "step": 2199 }, { "epoch": 0.22, "learning_rate": 1.815865906663616e-05, "loss": 2.4554, "step": 2200 }, { "epoch": 0.22, "learning_rate": 1.8156782179968385e-05, "loss": 2.3171, "step": 2201 }, { "epoch": 0.22, "learning_rate": 1.8154904434330274e-05, "loss": 2.3451, "step": 2202 }, { "epoch": 0.22, "learning_rate": 1.8153025829919567e-05, "loss": 2.4311, "step": 2203 }, { "epoch": 0.22, "learning_rate": 1.8151146366934096e-05, "loss": 2.4203, "step": 2204 }, { "epoch": 0.22, "learning_rate": 1.814926604557178e-05, "loss": 2.4336, "step": 2205 }, { "epoch": 0.22, "learning_rate": 1.8147384866030634e-05, "loss": 2.3847, "step": 2206 }, { "epoch": 0.22, "learning_rate": 1.814550282850876e-05, "loss": 2.4493, "step": 2207 }, { "epoch": 0.22, "learning_rate": 1.814361993320435e-05, "loss": 2.4083, "step": 2208 }, { "epoch": 0.22, "learning_rate": 1.8141736180315684e-05, "loss": 2.4006, "step": 2209 }, { "epoch": 0.22, "learning_rate": 1.8139851570041137e-05, "loss": 2.3993, "step": 2210 }, { "epoch": 0.22, "learning_rate": 1.8137966102579178e-05, "loss": 2.4049, "step": 2211 }, { "epoch": 0.22, "learning_rate": 1.8136079778128352e-05, "loss": 2.3954, "step": 2212 }, { "epoch": 0.22, "learning_rate": 1.8134192596887307e-05, "loss": 2.3729, "step": 2213 }, { "epoch": 0.22, "learning_rate": 1.8132304559054783e-05, "loss": 2.2648, "step": 2214 }, { "epoch": 0.22, "learning_rate": 1.8130415664829594e-05, "loss": 2.4159, "step": 2215 }, { "epoch": 0.22, "learning_rate": 1.8128525914410664e-05, "loss": 2.3871, "step": 2216 }, { "epoch": 0.22, "learning_rate": 1.8126635307996995e-05, "loss": 2.4088, "step": 2217 }, { "epoch": 0.22, "learning_rate": 1.812474384578768e-05, "loss": 2.354, "step": 2218 }, { "epoch": 0.22, "learning_rate": 1.8122851527981902e-05, "loss": 2.4455, "step": 2219 }, { "epoch": 0.22, "learning_rate": 1.8120958354778943e-05, "loss": 2.3759, "step": 2220 }, { "epoch": 0.22, "learning_rate": 1.811906432637816e-05, "loss": 2.3954, "step": 2221 }, { "epoch": 0.22, "learning_rate": 1.811716944297902e-05, "loss": 2.4481, "step": 2222 }, { "epoch": 0.22, "learning_rate": 1.8115273704781057e-05, "loss": 2.3788, "step": 2223 }, { "epoch": 0.22, "learning_rate": 1.8113377111983914e-05, "loss": 2.384, "step": 2224 }, { "epoch": 0.22, "learning_rate": 1.811147966478731e-05, "loss": 2.3088, "step": 2225 }, { "epoch": 0.22, "learning_rate": 1.8109581363391068e-05, "loss": 2.4295, "step": 2226 }, { "epoch": 0.22, "learning_rate": 1.8107682207995086e-05, "loss": 2.4003, "step": 2227 }, { "epoch": 0.22, "learning_rate": 1.8105782198799367e-05, "loss": 2.2559, "step": 2228 }, { "epoch": 0.22, "learning_rate": 1.8103881336003987e-05, "loss": 2.4327, "step": 2229 }, { "epoch": 0.22, "learning_rate": 1.810197961980913e-05, "loss": 2.3787, "step": 2230 }, { "epoch": 0.22, "learning_rate": 1.8100077050415056e-05, "loss": 2.4127, "step": 2231 }, { "epoch": 0.22, "learning_rate": 1.8098173628022118e-05, "loss": 2.4532, "step": 2232 }, { "epoch": 0.22, "learning_rate": 1.8096269352830764e-05, "loss": 2.3711, "step": 2233 }, { "epoch": 0.22, "learning_rate": 1.809436422504153e-05, "loss": 2.5322, "step": 2234 }, { "epoch": 0.22, "learning_rate": 1.8092458244855035e-05, "loss": 2.4645, "step": 2235 }, { "epoch": 0.22, "learning_rate": 1.8090551412472e-05, "loss": 2.4967, "step": 2236 }, { "epoch": 0.22, "learning_rate": 1.8088643728093224e-05, "loss": 2.3849, "step": 2237 }, { "epoch": 0.22, "learning_rate": 1.80867351919196e-05, "loss": 2.4621, "step": 2238 }, { "epoch": 0.22, "learning_rate": 1.8084825804152113e-05, "loss": 2.4697, "step": 2239 }, { "epoch": 0.22, "learning_rate": 1.8082915564991833e-05, "loss": 2.4168, "step": 2240 }, { "epoch": 0.22, "learning_rate": 1.808100447463993e-05, "loss": 2.4151, "step": 2241 }, { "epoch": 0.22, "learning_rate": 1.807909253329765e-05, "loss": 2.4431, "step": 2242 }, { "epoch": 0.22, "learning_rate": 1.807717974116633e-05, "loss": 2.4529, "step": 2243 }, { "epoch": 0.22, "learning_rate": 1.8075266098447414e-05, "loss": 2.5069, "step": 2244 }, { "epoch": 0.22, "learning_rate": 1.8073351605342414e-05, "loss": 2.4688, "step": 2245 }, { "epoch": 0.23, "learning_rate": 1.807143626205294e-05, "loss": 2.5166, "step": 2246 }, { "epoch": 0.23, "learning_rate": 1.8069520068780697e-05, "loss": 2.389, "step": 2247 }, { "epoch": 0.23, "learning_rate": 1.806760302572747e-05, "loss": 2.5049, "step": 2248 }, { "epoch": 0.23, "learning_rate": 1.8065685133095145e-05, "loss": 2.4331, "step": 2249 }, { "epoch": 0.23, "learning_rate": 1.806376639108568e-05, "loss": 2.3996, "step": 2250 }, { "epoch": 0.23, "learning_rate": 1.806184679990114e-05, "loss": 2.3953, "step": 2251 }, { "epoch": 0.23, "learning_rate": 1.8059926359743672e-05, "loss": 2.3334, "step": 2252 }, { "epoch": 0.23, "learning_rate": 1.8058005070815515e-05, "loss": 2.3847, "step": 2253 }, { "epoch": 0.23, "learning_rate": 1.8056082933318986e-05, "loss": 2.438, "step": 2254 }, { "epoch": 0.23, "learning_rate": 1.8054159947456508e-05, "loss": 2.5558, "step": 2255 }, { "epoch": 0.23, "learning_rate": 1.8052236113430588e-05, "loss": 2.3384, "step": 2256 }, { "epoch": 0.23, "learning_rate": 1.805031143144381e-05, "loss": 2.4266, "step": 2257 }, { "epoch": 0.23, "learning_rate": 1.804838590169887e-05, "loss": 2.4295, "step": 2258 }, { "epoch": 0.23, "learning_rate": 1.804645952439853e-05, "loss": 2.4317, "step": 2259 }, { "epoch": 0.23, "learning_rate": 1.804453229974566e-05, "loss": 2.344, "step": 2260 }, { "epoch": 0.23, "learning_rate": 1.80426042279432e-05, "loss": 2.4426, "step": 2261 }, { "epoch": 0.23, "learning_rate": 1.8040675309194205e-05, "loss": 2.4642, "step": 2262 }, { "epoch": 0.23, "learning_rate": 1.8038745543701796e-05, "loss": 2.3159, "step": 2263 }, { "epoch": 0.23, "learning_rate": 1.8036814931669192e-05, "loss": 2.4355, "step": 2264 }, { "epoch": 0.23, "learning_rate": 1.8034883473299706e-05, "loss": 2.3737, "step": 2265 }, { "epoch": 0.23, "learning_rate": 1.8032951168796727e-05, "loss": 2.4301, "step": 2266 }, { "epoch": 0.23, "learning_rate": 1.8031018018363745e-05, "loss": 2.5248, "step": 2267 }, { "epoch": 0.23, "learning_rate": 1.8029084022204338e-05, "loss": 2.3974, "step": 2268 }, { "epoch": 0.23, "learning_rate": 1.802714918052217e-05, "loss": 2.4035, "step": 2269 }, { "epoch": 0.23, "learning_rate": 1.802521349352099e-05, "loss": 2.3147, "step": 2270 }, { "epoch": 0.23, "learning_rate": 1.8023276961404643e-05, "loss": 2.4218, "step": 2271 }, { "epoch": 0.23, "learning_rate": 1.8021339584377063e-05, "loss": 2.4386, "step": 2272 }, { "epoch": 0.23, "learning_rate": 1.8019401362642264e-05, "loss": 2.4138, "step": 2273 }, { "epoch": 0.23, "learning_rate": 1.8017462296404358e-05, "loss": 2.446, "step": 2274 }, { "epoch": 0.23, "learning_rate": 1.8015522385867544e-05, "loss": 2.3868, "step": 2275 }, { "epoch": 0.23, "learning_rate": 1.8013581631236113e-05, "loss": 2.3813, "step": 2276 }, { "epoch": 0.23, "learning_rate": 1.8011640032714433e-05, "loss": 2.5115, "step": 2277 }, { "epoch": 0.23, "learning_rate": 1.8009697590506976e-05, "loss": 2.4277, "step": 2278 }, { "epoch": 0.23, "learning_rate": 1.8007754304818292e-05, "loss": 2.4677, "step": 2279 }, { "epoch": 0.23, "learning_rate": 1.8005810175853025e-05, "loss": 2.4123, "step": 2280 }, { "epoch": 0.23, "learning_rate": 1.8003865203815903e-05, "loss": 2.4596, "step": 2281 }, { "epoch": 0.23, "learning_rate": 1.8001919388911752e-05, "loss": 2.3369, "step": 2282 }, { "epoch": 0.23, "learning_rate": 1.7999972731345476e-05, "loss": 2.3086, "step": 2283 }, { "epoch": 0.23, "learning_rate": 1.799802523132207e-05, "loss": 2.431, "step": 2284 }, { "epoch": 0.23, "learning_rate": 1.799607688904663e-05, "loss": 2.4781, "step": 2285 }, { "epoch": 0.23, "learning_rate": 1.7994127704724326e-05, "loss": 2.4467, "step": 2286 }, { "epoch": 0.23, "learning_rate": 1.7992177678560422e-05, "loss": 2.4665, "step": 2287 }, { "epoch": 0.23, "learning_rate": 1.7990226810760266e-05, "loss": 2.459, "step": 2288 }, { "epoch": 0.23, "learning_rate": 1.7988275101529303e-05, "loss": 2.3655, "step": 2289 }, { "epoch": 0.23, "learning_rate": 1.7986322551073067e-05, "loss": 2.2788, "step": 2290 }, { "epoch": 0.23, "learning_rate": 1.7984369159597167e-05, "loss": 2.5102, "step": 2291 }, { "epoch": 0.23, "learning_rate": 1.7982414927307318e-05, "loss": 2.5414, "step": 2292 }, { "epoch": 0.23, "learning_rate": 1.798045985440931e-05, "loss": 2.4879, "step": 2293 }, { "epoch": 0.23, "learning_rate": 1.797850394110903e-05, "loss": 2.3712, "step": 2294 }, { "epoch": 0.23, "learning_rate": 1.7976547187612446e-05, "loss": 2.41, "step": 2295 }, { "epoch": 0.23, "learning_rate": 1.7974589594125622e-05, "loss": 2.3387, "step": 2296 }, { "epoch": 0.23, "learning_rate": 1.797263116085471e-05, "loss": 2.4936, "step": 2297 }, { "epoch": 0.23, "learning_rate": 1.7970671888005945e-05, "loss": 2.4275, "step": 2298 }, { "epoch": 0.23, "learning_rate": 1.796871177578565e-05, "loss": 2.4001, "step": 2299 }, { "epoch": 0.23, "learning_rate": 1.7966750824400243e-05, "loss": 2.3103, "step": 2300 }, { "epoch": 0.23, "learning_rate": 1.7964789034056228e-05, "loss": 2.4326, "step": 2301 }, { "epoch": 0.23, "learning_rate": 1.7962826404960192e-05, "loss": 2.3995, "step": 2302 }, { "epoch": 0.23, "learning_rate": 1.7960862937318818e-05, "loss": 2.4775, "step": 2303 }, { "epoch": 0.23, "learning_rate": 1.7958898631338873e-05, "loss": 2.3665, "step": 2304 }, { "epoch": 0.23, "learning_rate": 1.7956933487227217e-05, "loss": 2.4297, "step": 2305 }, { "epoch": 0.23, "learning_rate": 1.7954967505190785e-05, "loss": 2.4636, "step": 2306 }, { "epoch": 0.23, "learning_rate": 1.7953000685436617e-05, "loss": 2.4677, "step": 2307 }, { "epoch": 0.23, "learning_rate": 1.7951033028171833e-05, "loss": 2.4971, "step": 2308 }, { "epoch": 0.23, "learning_rate": 1.794906453360364e-05, "loss": 2.4753, "step": 2309 }, { "epoch": 0.23, "learning_rate": 1.7947095201939335e-05, "loss": 2.5169, "step": 2310 }, { "epoch": 0.23, "learning_rate": 1.794512503338631e-05, "loss": 2.4539, "step": 2311 }, { "epoch": 0.23, "learning_rate": 1.7943154028152026e-05, "loss": 2.4269, "step": 2312 }, { "epoch": 0.23, "learning_rate": 1.794118218644406e-05, "loss": 2.4369, "step": 2313 }, { "epoch": 0.23, "learning_rate": 1.7939209508470047e-05, "loss": 2.3938, "step": 2314 }, { "epoch": 0.23, "learning_rate": 1.7937235994437735e-05, "loss": 2.3801, "step": 2315 }, { "epoch": 0.23, "learning_rate": 1.7935261644554943e-05, "loss": 2.3642, "step": 2316 }, { "epoch": 0.23, "learning_rate": 1.7933286459029592e-05, "loss": 2.3899, "step": 2317 }, { "epoch": 0.23, "learning_rate": 1.793131043806968e-05, "loss": 2.4026, "step": 2318 }, { "epoch": 0.23, "learning_rate": 1.792933358188329e-05, "loss": 2.2947, "step": 2319 }, { "epoch": 0.23, "learning_rate": 1.7927355890678614e-05, "loss": 2.4382, "step": 2320 }, { "epoch": 0.23, "learning_rate": 1.7925377364663906e-05, "loss": 2.4836, "step": 2321 }, { "epoch": 0.23, "learning_rate": 1.7923398004047526e-05, "loss": 2.4276, "step": 2322 }, { "epoch": 0.23, "learning_rate": 1.792141780903791e-05, "loss": 2.4491, "step": 2323 }, { "epoch": 0.23, "learning_rate": 1.7919436779843592e-05, "loss": 2.4583, "step": 2324 }, { "epoch": 0.23, "learning_rate": 1.791745491667319e-05, "loss": 2.4207, "step": 2325 }, { "epoch": 0.23, "learning_rate": 1.791547221973541e-05, "loss": 2.3225, "step": 2326 }, { "epoch": 0.23, "learning_rate": 1.7913488689239038e-05, "loss": 2.3539, "step": 2327 }, { "epoch": 0.23, "learning_rate": 1.7911504325392955e-05, "loss": 2.2671, "step": 2328 }, { "epoch": 0.23, "learning_rate": 1.790951912840614e-05, "loss": 2.5, "step": 2329 }, { "epoch": 0.23, "learning_rate": 1.7907533098487636e-05, "loss": 2.4613, "step": 2330 }, { "epoch": 0.23, "learning_rate": 1.79055462358466e-05, "loss": 2.3072, "step": 2331 }, { "epoch": 0.23, "learning_rate": 1.790355854069225e-05, "loss": 2.2936, "step": 2332 }, { "epoch": 0.23, "learning_rate": 1.7901570013233917e-05, "loss": 2.4507, "step": 2333 }, { "epoch": 0.23, "learning_rate": 1.7899580653681e-05, "loss": 2.4611, "step": 2334 }, { "epoch": 0.23, "learning_rate": 1.789759046224299e-05, "loss": 2.4396, "step": 2335 }, { "epoch": 0.23, "learning_rate": 1.7895599439129486e-05, "loss": 2.4867, "step": 2336 }, { "epoch": 0.23, "learning_rate": 1.789360758455014e-05, "loss": 2.4333, "step": 2337 }, { "epoch": 0.23, "learning_rate": 1.789161489871472e-05, "loss": 2.4081, "step": 2338 }, { "epoch": 0.23, "learning_rate": 1.7889621381833064e-05, "loss": 2.4396, "step": 2339 }, { "epoch": 0.23, "learning_rate": 1.7887627034115104e-05, "loss": 2.4419, "step": 2340 }, { "epoch": 0.23, "learning_rate": 1.7885631855770866e-05, "loss": 2.4266, "step": 2341 }, { "epoch": 0.23, "learning_rate": 1.7883635847010455e-05, "loss": 2.49, "step": 2342 }, { "epoch": 0.23, "learning_rate": 1.7881639008044064e-05, "loss": 2.4677, "step": 2343 }, { "epoch": 0.23, "learning_rate": 1.7879641339081976e-05, "loss": 2.3521, "step": 2344 }, { "epoch": 0.23, "learning_rate": 1.787764284033456e-05, "loss": 2.3992, "step": 2345 }, { "epoch": 0.24, "learning_rate": 1.7875643512012273e-05, "loss": 2.3983, "step": 2346 }, { "epoch": 0.24, "learning_rate": 1.787364335432566e-05, "loss": 2.4336, "step": 2347 }, { "epoch": 0.24, "learning_rate": 1.7871642367485354e-05, "loss": 2.4329, "step": 2348 }, { "epoch": 0.24, "learning_rate": 1.786964055170207e-05, "loss": 2.4991, "step": 2349 }, { "epoch": 0.24, "learning_rate": 1.7867637907186614e-05, "loss": 2.4611, "step": 2350 }, { "epoch": 0.24, "learning_rate": 1.7865634434149885e-05, "loss": 2.4596, "step": 2351 }, { "epoch": 0.24, "learning_rate": 1.7863630132802862e-05, "loss": 2.4557, "step": 2352 }, { "epoch": 0.24, "learning_rate": 1.7861625003356606e-05, "loss": 2.4096, "step": 2353 }, { "epoch": 0.24, "learning_rate": 1.7859619046022285e-05, "loss": 2.3215, "step": 2354 }, { "epoch": 0.24, "learning_rate": 1.7857612261011125e-05, "loss": 2.4516, "step": 2355 }, { "epoch": 0.24, "learning_rate": 1.7855604648534472e-05, "loss": 2.4658, "step": 2356 }, { "epoch": 0.24, "learning_rate": 1.7853596208803732e-05, "loss": 2.4484, "step": 2357 }, { "epoch": 0.24, "learning_rate": 1.785158694203041e-05, "loss": 2.4515, "step": 2358 }, { "epoch": 0.24, "learning_rate": 1.7849576848426103e-05, "loss": 2.4549, "step": 2359 }, { "epoch": 0.24, "learning_rate": 1.7847565928202484e-05, "loss": 2.4449, "step": 2360 }, { "epoch": 0.24, "learning_rate": 1.784555418157132e-05, "loss": 2.5033, "step": 2361 }, { "epoch": 0.24, "learning_rate": 1.7843541608744458e-05, "loss": 2.4129, "step": 2362 }, { "epoch": 0.24, "learning_rate": 1.784152820993384e-05, "loss": 2.4572, "step": 2363 }, { "epoch": 0.24, "learning_rate": 1.7839513985351496e-05, "loss": 2.4695, "step": 2364 }, { "epoch": 0.24, "learning_rate": 1.7837498935209536e-05, "loss": 2.4065, "step": 2365 }, { "epoch": 0.24, "learning_rate": 1.7835483059720155e-05, "loss": 2.3357, "step": 2366 }, { "epoch": 0.24, "learning_rate": 1.783346635909565e-05, "loss": 2.4399, "step": 2367 }, { "epoch": 0.24, "learning_rate": 1.7831448833548384e-05, "loss": 2.3081, "step": 2368 }, { "epoch": 0.24, "learning_rate": 1.7829430483290828e-05, "loss": 2.543, "step": 2369 }, { "epoch": 0.24, "learning_rate": 1.7827411308535517e-05, "loss": 2.4716, "step": 2370 }, { "epoch": 0.24, "learning_rate": 1.7825391309495098e-05, "loss": 2.3538, "step": 2371 }, { "epoch": 0.24, "learning_rate": 1.7823370486382284e-05, "loss": 2.4144, "step": 2372 }, { "epoch": 0.24, "learning_rate": 1.7821348839409887e-05, "loss": 2.4351, "step": 2373 }, { "epoch": 0.24, "learning_rate": 1.7819326368790798e-05, "loss": 2.3164, "step": 2374 }, { "epoch": 0.24, "learning_rate": 1.7817303074738004e-05, "loss": 2.4432, "step": 2375 }, { "epoch": 0.24, "learning_rate": 1.7815278957464565e-05, "loss": 2.3247, "step": 2376 }, { "epoch": 0.24, "learning_rate": 1.7813254017183637e-05, "loss": 2.4475, "step": 2377 }, { "epoch": 0.24, "learning_rate": 1.781122825410847e-05, "loss": 2.2939, "step": 2378 }, { "epoch": 0.24, "learning_rate": 1.7809201668452386e-05, "loss": 2.5527, "step": 2379 }, { "epoch": 0.24, "learning_rate": 1.7807174260428797e-05, "loss": 2.4145, "step": 2380 }, { "epoch": 0.24, "learning_rate": 1.780514603025121e-05, "loss": 2.3837, "step": 2381 }, { "epoch": 0.24, "learning_rate": 1.780311697813321e-05, "loss": 2.2212, "step": 2382 }, { "epoch": 0.24, "learning_rate": 1.7801087104288468e-05, "loss": 2.4353, "step": 2383 }, { "epoch": 0.24, "learning_rate": 1.779905640893075e-05, "loss": 2.4688, "step": 2384 }, { "epoch": 0.24, "learning_rate": 1.7797024892273903e-05, "loss": 2.3769, "step": 2385 }, { "epoch": 0.24, "learning_rate": 1.779499255453186e-05, "loss": 2.4048, "step": 2386 }, { "epoch": 0.24, "learning_rate": 1.779295939591864e-05, "loss": 2.4386, "step": 2387 }, { "epoch": 0.24, "learning_rate": 1.7790925416648352e-05, "loss": 2.4148, "step": 2388 }, { "epoch": 0.24, "learning_rate": 1.7788890616935188e-05, "loss": 2.3557, "step": 2389 }, { "epoch": 0.24, "learning_rate": 1.7786854996993427e-05, "loss": 2.4686, "step": 2390 }, { "epoch": 0.24, "learning_rate": 1.7784818557037437e-05, "loss": 2.4332, "step": 2391 }, { "epoch": 0.24, "learning_rate": 1.778278129728167e-05, "loss": 2.4406, "step": 2392 }, { "epoch": 0.24, "learning_rate": 1.7780743217940664e-05, "loss": 2.4726, "step": 2393 }, { "epoch": 0.24, "learning_rate": 1.7778704319229043e-05, "loss": 2.3774, "step": 2394 }, { "epoch": 0.24, "learning_rate": 1.777666460136152e-05, "loss": 2.3806, "step": 2395 }, { "epoch": 0.24, "learning_rate": 1.7774624064552896e-05, "loss": 2.3595, "step": 2396 }, { "epoch": 0.24, "learning_rate": 1.7772582709018047e-05, "loss": 2.4195, "step": 2397 }, { "epoch": 0.24, "learning_rate": 1.7770540534971943e-05, "loss": 2.4081, "step": 2398 }, { "epoch": 0.24, "learning_rate": 1.776849754262965e-05, "loss": 2.3834, "step": 2399 }, { "epoch": 0.24, "learning_rate": 1.7766453732206306e-05, "loss": 2.4552, "step": 2400 }, { "epoch": 0.24, "learning_rate": 1.7764409103917136e-05, "loss": 2.4627, "step": 2401 }, { "epoch": 0.24, "learning_rate": 1.7762363657977457e-05, "loss": 2.4195, "step": 2402 }, { "epoch": 0.24, "learning_rate": 1.7760317394602672e-05, "loss": 2.3563, "step": 2403 }, { "epoch": 0.24, "learning_rate": 1.775827031400826e-05, "loss": 2.4877, "step": 2404 }, { "epoch": 0.24, "learning_rate": 1.7756222416409804e-05, "loss": 2.4235, "step": 2405 }, { "epoch": 0.24, "learning_rate": 1.7754173702022956e-05, "loss": 2.2972, "step": 2406 }, { "epoch": 0.24, "learning_rate": 1.7752124171063465e-05, "loss": 2.4735, "step": 2407 }, { "epoch": 0.24, "learning_rate": 1.7750073823747162e-05, "loss": 2.4461, "step": 2408 }, { "epoch": 0.24, "learning_rate": 1.7748022660289962e-05, "loss": 2.4034, "step": 2409 }, { "epoch": 0.24, "learning_rate": 1.7745970680907866e-05, "loss": 2.3773, "step": 2410 }, { "epoch": 0.24, "learning_rate": 1.7743917885816964e-05, "loss": 2.347, "step": 2411 }, { "epoch": 0.24, "learning_rate": 1.7741864275233434e-05, "loss": 2.4229, "step": 2412 }, { "epoch": 0.24, "learning_rate": 1.7739809849373533e-05, "loss": 2.3895, "step": 2413 }, { "epoch": 0.24, "learning_rate": 1.773775460845361e-05, "loss": 2.4344, "step": 2414 }, { "epoch": 0.24, "learning_rate": 1.77356985526901e-05, "loss": 2.4755, "step": 2415 }, { "epoch": 0.24, "learning_rate": 1.7733641682299514e-05, "loss": 2.3873, "step": 2416 }, { "epoch": 0.24, "learning_rate": 1.773158399749846e-05, "loss": 2.4087, "step": 2417 }, { "epoch": 0.24, "learning_rate": 1.7729525498503625e-05, "loss": 2.2952, "step": 2418 }, { "epoch": 0.24, "learning_rate": 1.772746618553179e-05, "loss": 2.373, "step": 2419 }, { "epoch": 0.24, "learning_rate": 1.772540605879981e-05, "loss": 2.3986, "step": 2420 }, { "epoch": 0.24, "learning_rate": 1.7723345118524632e-05, "loss": 2.3634, "step": 2421 }, { "epoch": 0.24, "learning_rate": 1.772128336492329e-05, "loss": 2.3976, "step": 2422 }, { "epoch": 0.24, "learning_rate": 1.7719220798212905e-05, "loss": 2.4476, "step": 2423 }, { "epoch": 0.24, "learning_rate": 1.771715741861068e-05, "loss": 2.3385, "step": 2424 }, { "epoch": 0.24, "learning_rate": 1.77150932263339e-05, "loss": 2.3978, "step": 2425 }, { "epoch": 0.24, "learning_rate": 1.7713028221599944e-05, "loss": 2.3589, "step": 2426 }, { "epoch": 0.24, "learning_rate": 1.7710962404626273e-05, "loss": 2.3852, "step": 2427 }, { "epoch": 0.24, "learning_rate": 1.7708895775630427e-05, "loss": 2.375, "step": 2428 }, { "epoch": 0.24, "learning_rate": 1.7706828334830045e-05, "loss": 2.409, "step": 2429 }, { "epoch": 0.24, "learning_rate": 1.770476008244284e-05, "loss": 2.5084, "step": 2430 }, { "epoch": 0.24, "learning_rate": 1.7702691018686615e-05, "loss": 2.374, "step": 2431 }, { "epoch": 0.24, "learning_rate": 1.7700621143779257e-05, "loss": 2.3024, "step": 2432 }, { "epoch": 0.24, "learning_rate": 1.7698550457938744e-05, "loss": 2.3611, "step": 2433 }, { "epoch": 0.24, "learning_rate": 1.769647896138313e-05, "loss": 2.3412, "step": 2434 }, { "epoch": 0.24, "learning_rate": 1.7694406654330557e-05, "loss": 2.428, "step": 2435 }, { "epoch": 0.24, "learning_rate": 1.769233353699926e-05, "loss": 2.5782, "step": 2436 }, { "epoch": 0.24, "learning_rate": 1.7690259609607552e-05, "loss": 2.4035, "step": 2437 }, { "epoch": 0.24, "learning_rate": 1.7688184872373836e-05, "loss": 2.3888, "step": 2438 }, { "epoch": 0.24, "learning_rate": 1.768610932551659e-05, "loss": 2.386, "step": 2439 }, { "epoch": 0.24, "learning_rate": 1.7684032969254387e-05, "loss": 2.339, "step": 2440 }, { "epoch": 0.24, "learning_rate": 1.768195580380589e-05, "loss": 2.4251, "step": 2441 }, { "epoch": 0.24, "learning_rate": 1.767987782938983e-05, "loss": 2.3027, "step": 2442 }, { "epoch": 0.24, "learning_rate": 1.767779904622504e-05, "loss": 2.4098, "step": 2443 }, { "epoch": 0.24, "learning_rate": 1.7675719454530432e-05, "loss": 2.395, "step": 2444 }, { "epoch": 0.24, "learning_rate": 1.7673639054524998e-05, "loss": 2.4177, "step": 2445 }, { "epoch": 0.25, "learning_rate": 1.767155784642782e-05, "loss": 2.471, "step": 2446 }, { "epoch": 0.25, "learning_rate": 1.766947583045807e-05, "loss": 2.3929, "step": 2447 }, { "epoch": 0.25, "learning_rate": 1.7667393006834997e-05, "loss": 2.3801, "step": 2448 }, { "epoch": 0.25, "learning_rate": 1.7665309375777934e-05, "loss": 2.3168, "step": 2449 }, { "epoch": 0.25, "learning_rate": 1.7663224937506308e-05, "loss": 2.4077, "step": 2450 }, { "epoch": 0.25, "learning_rate": 1.7661139692239627e-05, "loss": 2.3588, "step": 2451 }, { "epoch": 0.25, "learning_rate": 1.765905364019748e-05, "loss": 2.4401, "step": 2452 }, { "epoch": 0.25, "learning_rate": 1.765696678159954e-05, "loss": 2.3952, "step": 2453 }, { "epoch": 0.25, "learning_rate": 1.7654879116665577e-05, "loss": 2.4941, "step": 2454 }, { "epoch": 0.25, "learning_rate": 1.7652790645615435e-05, "loss": 2.3861, "step": 2455 }, { "epoch": 0.25, "learning_rate": 1.765070136866904e-05, "loss": 2.4375, "step": 2456 }, { "epoch": 0.25, "learning_rate": 1.7648611286046417e-05, "loss": 2.342, "step": 2457 }, { "epoch": 0.25, "learning_rate": 1.7646520397967662e-05, "loss": 2.4062, "step": 2458 }, { "epoch": 0.25, "learning_rate": 1.7644428704652963e-05, "loss": 2.3467, "step": 2459 }, { "epoch": 0.25, "learning_rate": 1.7642336206322593e-05, "loss": 2.4184, "step": 2460 }, { "epoch": 0.25, "learning_rate": 1.7640242903196903e-05, "loss": 2.539, "step": 2461 }, { "epoch": 0.25, "learning_rate": 1.7638148795496337e-05, "loss": 2.3671, "step": 2462 }, { "epoch": 0.25, "learning_rate": 1.763605388344142e-05, "loss": 2.4429, "step": 2463 }, { "epoch": 0.25, "learning_rate": 1.763395816725276e-05, "loss": 2.3459, "step": 2464 }, { "epoch": 0.25, "learning_rate": 1.7631861647151054e-05, "loss": 2.4035, "step": 2465 }, { "epoch": 0.25, "learning_rate": 1.762976432335708e-05, "loss": 2.3325, "step": 2466 }, { "epoch": 0.25, "learning_rate": 1.76276661960917e-05, "loss": 2.4365, "step": 2467 }, { "epoch": 0.25, "learning_rate": 1.7625567265575867e-05, "loss": 2.4181, "step": 2468 }, { "epoch": 0.25, "learning_rate": 1.762346753203061e-05, "loss": 2.4423, "step": 2469 }, { "epoch": 0.25, "learning_rate": 1.7621366995677052e-05, "loss": 2.4417, "step": 2470 }, { "epoch": 0.25, "learning_rate": 1.7619265656736388e-05, "loss": 2.4523, "step": 2471 }, { "epoch": 0.25, "learning_rate": 1.7617163515429913e-05, "loss": 2.4538, "step": 2472 }, { "epoch": 0.25, "learning_rate": 1.761506057197899e-05, "loss": 2.4391, "step": 2473 }, { "epoch": 0.25, "learning_rate": 1.7612956826605076e-05, "loss": 2.3903, "step": 2474 }, { "epoch": 0.25, "learning_rate": 1.761085227952972e-05, "loss": 2.3221, "step": 2475 }, { "epoch": 0.25, "learning_rate": 1.7608746930974535e-05, "loss": 2.3781, "step": 2476 }, { "epoch": 0.25, "learning_rate": 1.7606640781161236e-05, "loss": 2.4562, "step": 2477 }, { "epoch": 0.25, "learning_rate": 1.7604533830311617e-05, "loss": 2.367, "step": 2478 }, { "epoch": 0.25, "learning_rate": 1.7602426078647555e-05, "loss": 2.4997, "step": 2479 }, { "epoch": 0.25, "learning_rate": 1.760031752639101e-05, "loss": 2.3857, "step": 2480 }, { "epoch": 0.25, "learning_rate": 1.7598208173764027e-05, "loss": 2.4053, "step": 2481 }, { "epoch": 0.25, "learning_rate": 1.7596098020988745e-05, "loss": 2.398, "step": 2482 }, { "epoch": 0.25, "learning_rate": 1.759398706828737e-05, "loss": 2.418, "step": 2483 }, { "epoch": 0.25, "learning_rate": 1.7591875315882203e-05, "loss": 2.3772, "step": 2484 }, { "epoch": 0.25, "learning_rate": 1.758976276399563e-05, "loss": 2.3702, "step": 2485 }, { "epoch": 0.25, "learning_rate": 1.758764941285012e-05, "loss": 2.4879, "step": 2486 }, { "epoch": 0.25, "learning_rate": 1.758553526266822e-05, "loss": 2.4356, "step": 2487 }, { "epoch": 0.25, "learning_rate": 1.7583420313672567e-05, "loss": 2.4462, "step": 2488 }, { "epoch": 0.25, "learning_rate": 1.7581304566085883e-05, "loss": 2.3564, "step": 2489 }, { "epoch": 0.25, "learning_rate": 1.757918802013097e-05, "loss": 2.3841, "step": 2490 }, { "epoch": 0.25, "learning_rate": 1.7577070676030717e-05, "loss": 2.4435, "step": 2491 }, { "epoch": 0.25, "learning_rate": 1.75749525340081e-05, "loss": 2.4966, "step": 2492 }, { "epoch": 0.25, "learning_rate": 1.757283359428617e-05, "loss": 2.3324, "step": 2493 }, { "epoch": 0.25, "learning_rate": 1.7570713857088065e-05, "loss": 2.431, "step": 2494 }, { "epoch": 0.25, "learning_rate": 1.7568593322637015e-05, "loss": 2.4571, "step": 2495 }, { "epoch": 0.25, "learning_rate": 1.7566471991156328e-05, "loss": 2.4139, "step": 2496 }, { "epoch": 0.25, "learning_rate": 1.7564349862869395e-05, "loss": 2.3745, "step": 2497 }, { "epoch": 0.25, "learning_rate": 1.7562226937999685e-05, "loss": 2.4127, "step": 2498 }, { "epoch": 0.25, "learning_rate": 1.756010321677077e-05, "loss": 2.4568, "step": 2499 }, { "epoch": 0.25, "learning_rate": 1.755797869940629e-05, "loss": 2.4072, "step": 2500 }, { "epoch": 0.25, "learning_rate": 1.7555853386129968e-05, "loss": 2.3423, "step": 2501 }, { "epoch": 0.25, "learning_rate": 1.7553727277165618e-05, "loss": 2.4112, "step": 2502 }, { "epoch": 0.25, "learning_rate": 1.7551600372737133e-05, "loss": 2.4717, "step": 2503 }, { "epoch": 0.25, "learning_rate": 1.7549472673068496e-05, "loss": 2.4055, "step": 2504 }, { "epoch": 0.25, "learning_rate": 1.754734417838377e-05, "loss": 2.5856, "step": 2505 }, { "epoch": 0.25, "learning_rate": 1.75452148889071e-05, "loss": 2.4179, "step": 2506 }, { "epoch": 0.25, "learning_rate": 1.754308480486271e-05, "loss": 2.4402, "step": 2507 }, { "epoch": 0.25, "learning_rate": 1.7540953926474926e-05, "loss": 2.4702, "step": 2508 }, { "epoch": 0.25, "learning_rate": 1.7538822253968137e-05, "loss": 2.3813, "step": 2509 }, { "epoch": 0.25, "learning_rate": 1.7536689787566824e-05, "loss": 2.4299, "step": 2510 }, { "epoch": 0.25, "learning_rate": 1.7534556527495558e-05, "loss": 2.3611, "step": 2511 }, { "epoch": 0.25, "learning_rate": 1.753242247397898e-05, "loss": 2.4055, "step": 2512 }, { "epoch": 0.25, "learning_rate": 1.7530287627241824e-05, "loss": 2.3587, "step": 2513 }, { "epoch": 0.25, "learning_rate": 1.7528151987508905e-05, "loss": 2.3879, "step": 2514 }, { "epoch": 0.25, "learning_rate": 1.7526015555005127e-05, "loss": 2.4762, "step": 2515 }, { "epoch": 0.25, "learning_rate": 1.7523878329955467e-05, "loss": 2.3918, "step": 2516 }, { "epoch": 0.25, "learning_rate": 1.752174031258499e-05, "loss": 2.4252, "step": 2517 }, { "epoch": 0.25, "learning_rate": 1.751960150311885e-05, "loss": 2.4185, "step": 2518 }, { "epoch": 0.25, "learning_rate": 1.7517461901782283e-05, "loss": 2.4385, "step": 2519 }, { "epoch": 0.25, "learning_rate": 1.7515321508800595e-05, "loss": 2.4987, "step": 2520 }, { "epoch": 0.25, "learning_rate": 1.7513180324399184e-05, "loss": 2.5587, "step": 2521 }, { "epoch": 0.25, "learning_rate": 1.7511038348803542e-05, "loss": 2.4947, "step": 2522 }, { "epoch": 0.25, "learning_rate": 1.7508895582239237e-05, "loss": 2.3814, "step": 2523 }, { "epoch": 0.25, "learning_rate": 1.7506752024931905e-05, "loss": 2.3435, "step": 2524 }, { "epoch": 0.25, "learning_rate": 1.7504607677107294e-05, "loss": 2.5111, "step": 2525 }, { "epoch": 0.25, "learning_rate": 1.7502462538991208e-05, "loss": 2.4096, "step": 2526 }, { "epoch": 0.25, "learning_rate": 1.750031661080955e-05, "loss": 2.4108, "step": 2527 }, { "epoch": 0.25, "learning_rate": 1.7498169892788305e-05, "loss": 2.4151, "step": 2528 }, { "epoch": 0.25, "learning_rate": 1.749602238515354e-05, "loss": 2.4322, "step": 2529 }, { "epoch": 0.25, "learning_rate": 1.7493874088131394e-05, "loss": 2.4259, "step": 2530 }, { "epoch": 0.25, "learning_rate": 1.7491725001948107e-05, "loss": 2.4517, "step": 2531 }, { "epoch": 0.25, "learning_rate": 1.748957512682999e-05, "loss": 2.4325, "step": 2532 }, { "epoch": 0.25, "learning_rate": 1.748742446300345e-05, "loss": 2.3708, "step": 2533 }, { "epoch": 0.25, "learning_rate": 1.7485273010694953e-05, "loss": 2.4389, "step": 2534 }, { "epoch": 0.25, "learning_rate": 1.7483120770131073e-05, "loss": 2.2884, "step": 2535 }, { "epoch": 0.25, "learning_rate": 1.748096774153846e-05, "loss": 2.3819, "step": 2536 }, { "epoch": 0.25, "learning_rate": 1.7478813925143834e-05, "loss": 2.4681, "step": 2537 }, { "epoch": 0.25, "learning_rate": 1.7476659321174015e-05, "loss": 2.4207, "step": 2538 }, { "epoch": 0.25, "learning_rate": 1.74745039298559e-05, "loss": 2.3996, "step": 2539 }, { "epoch": 0.25, "learning_rate": 1.7472347751416457e-05, "loss": 2.4053, "step": 2540 }, { "epoch": 0.25, "learning_rate": 1.7470190786082764e-05, "loss": 2.5373, "step": 2541 }, { "epoch": 0.25, "learning_rate": 1.7468033034081953e-05, "loss": 2.4979, "step": 2542 }, { "epoch": 0.25, "learning_rate": 1.7465874495641255e-05, "loss": 2.4114, "step": 2543 }, { "epoch": 0.25, "learning_rate": 1.7463715170987984e-05, "loss": 2.4121, "step": 2544 }, { "epoch": 0.25, "learning_rate": 1.7461555060349528e-05, "loss": 2.5142, "step": 2545 }, { "epoch": 0.26, "learning_rate": 1.7459394163953365e-05, "loss": 2.4046, "step": 2546 }, { "epoch": 0.26, "learning_rate": 1.7457232482027057e-05, "loss": 2.4114, "step": 2547 }, { "epoch": 0.26, "learning_rate": 1.7455070014798238e-05, "loss": 2.4185, "step": 2548 }, { "epoch": 0.26, "learning_rate": 1.7452906762494638e-05, "loss": 2.4451, "step": 2549 }, { "epoch": 0.26, "learning_rate": 1.745074272534406e-05, "loss": 2.3742, "step": 2550 }, { "epoch": 0.26, "learning_rate": 1.7448577903574397e-05, "loss": 2.462, "step": 2551 }, { "epoch": 0.26, "learning_rate": 1.7446412297413616e-05, "loss": 2.3011, "step": 2552 }, { "epoch": 0.26, "learning_rate": 1.744424590708978e-05, "loss": 2.4094, "step": 2553 }, { "epoch": 0.26, "learning_rate": 1.744207873283102e-05, "loss": 2.4406, "step": 2554 }, { "epoch": 0.26, "learning_rate": 1.743991077486555e-05, "loss": 2.4548, "step": 2555 }, { "epoch": 0.26, "learning_rate": 1.7437742033421683e-05, "loss": 2.3979, "step": 2556 }, { "epoch": 0.26, "learning_rate": 1.7435572508727798e-05, "loss": 2.3279, "step": 2557 }, { "epoch": 0.26, "learning_rate": 1.7433402201012364e-05, "loss": 2.4713, "step": 2558 }, { "epoch": 0.26, "learning_rate": 1.7431231110503933e-05, "loss": 2.4521, "step": 2559 }, { "epoch": 0.26, "learning_rate": 1.742905923743113e-05, "loss": 2.3922, "step": 2560 }, { "epoch": 0.26, "learning_rate": 1.7426886582022677e-05, "loss": 2.3774, "step": 2561 }, { "epoch": 0.26, "learning_rate": 1.7424713144507366e-05, "loss": 2.2837, "step": 2562 }, { "epoch": 0.26, "learning_rate": 1.742253892511408e-05, "loss": 2.3982, "step": 2563 }, { "epoch": 0.26, "learning_rate": 1.7420363924071775e-05, "loss": 2.4547, "step": 2564 }, { "epoch": 0.26, "learning_rate": 1.74181881416095e-05, "loss": 2.4735, "step": 2565 }, { "epoch": 0.26, "learning_rate": 1.741601157795638e-05, "loss": 2.3341, "step": 2566 }, { "epoch": 0.26, "learning_rate": 1.7413834233341628e-05, "loss": 2.4449, "step": 2567 }, { "epoch": 0.26, "learning_rate": 1.7411656107994523e-05, "loss": 2.435, "step": 2568 }, { "epoch": 0.26, "learning_rate": 1.740947720214445e-05, "loss": 2.3895, "step": 2569 }, { "epoch": 0.26, "learning_rate": 1.7407297516020854e-05, "loss": 2.464, "step": 2570 }, { "epoch": 0.26, "learning_rate": 1.7405117049853283e-05, "loss": 2.5049, "step": 2571 }, { "epoch": 0.26, "learning_rate": 1.7402935803871348e-05, "loss": 2.3802, "step": 2572 }, { "epoch": 0.26, "learning_rate": 1.7400753778304754e-05, "loss": 2.4681, "step": 2573 }, { "epoch": 0.26, "learning_rate": 1.739857097338328e-05, "loss": 2.36, "step": 2574 }, { "epoch": 0.26, "learning_rate": 1.7396387389336803e-05, "loss": 2.3784, "step": 2575 }, { "epoch": 0.26, "learning_rate": 1.739420302639526e-05, "loss": 2.3434, "step": 2576 }, { "epoch": 0.26, "learning_rate": 1.7392017884788684e-05, "loss": 2.4684, "step": 2577 }, { "epoch": 0.26, "learning_rate": 1.7389831964747185e-05, "loss": 2.5868, "step": 2578 }, { "epoch": 0.26, "learning_rate": 1.7387645266500962e-05, "loss": 2.401, "step": 2579 }, { "epoch": 0.26, "learning_rate": 1.7385457790280287e-05, "loss": 2.4193, "step": 2580 }, { "epoch": 0.26, "learning_rate": 1.7383269536315518e-05, "loss": 2.4152, "step": 2581 }, { "epoch": 0.26, "learning_rate": 1.7381080504837095e-05, "loss": 2.3302, "step": 2582 }, { "epoch": 0.26, "learning_rate": 1.737889069607554e-05, "loss": 2.4529, "step": 2583 }, { "epoch": 0.26, "learning_rate": 1.7376700110261456e-05, "loss": 2.3378, "step": 2584 }, { "epoch": 0.26, "learning_rate": 1.7374508747625526e-05, "loss": 2.4525, "step": 2585 }, { "epoch": 0.26, "learning_rate": 1.7372316608398518e-05, "loss": 2.4695, "step": 2586 }, { "epoch": 0.26, "learning_rate": 1.737012369281128e-05, "loss": 2.4092, "step": 2587 }, { "epoch": 0.26, "learning_rate": 1.736793000109475e-05, "loss": 2.5006, "step": 2588 }, { "epoch": 0.26, "learning_rate": 1.736573553347993e-05, "loss": 2.4045, "step": 2589 }, { "epoch": 0.26, "learning_rate": 1.7363540290197916e-05, "loss": 2.3538, "step": 2590 }, { "epoch": 0.26, "learning_rate": 1.7361344271479887e-05, "loss": 2.5021, "step": 2591 }, { "epoch": 0.26, "learning_rate": 1.7359147477557098e-05, "loss": 2.3988, "step": 2592 }, { "epoch": 0.26, "learning_rate": 1.735694990866089e-05, "loss": 2.2817, "step": 2593 }, { "epoch": 0.26, "learning_rate": 1.7354751565022683e-05, "loss": 2.2822, "step": 2594 }, { "epoch": 0.26, "learning_rate": 1.7352552446873976e-05, "loss": 2.3744, "step": 2595 }, { "epoch": 0.26, "learning_rate": 1.7350352554446355e-05, "loss": 2.5001, "step": 2596 }, { "epoch": 0.26, "learning_rate": 1.7348151887971486e-05, "loss": 2.4419, "step": 2597 }, { "epoch": 0.26, "learning_rate": 1.7345950447681114e-05, "loss": 2.3151, "step": 2598 }, { "epoch": 0.26, "learning_rate": 1.7343748233807066e-05, "loss": 2.3067, "step": 2599 }, { "epoch": 0.26, "learning_rate": 1.7341545246581252e-05, "loss": 2.4082, "step": 2600 }, { "epoch": 0.26, "learning_rate": 1.733934148623567e-05, "loss": 2.4327, "step": 2601 }, { "epoch": 0.26, "learning_rate": 1.7337136953002382e-05, "loss": 2.3981, "step": 2602 }, { "epoch": 0.26, "learning_rate": 1.733493164711355e-05, "loss": 2.3964, "step": 2603 }, { "epoch": 0.26, "learning_rate": 1.7332725568801404e-05, "loss": 2.4935, "step": 2604 }, { "epoch": 0.26, "learning_rate": 1.7330518718298263e-05, "loss": 2.3765, "step": 2605 }, { "epoch": 0.26, "learning_rate": 1.7328311095836525e-05, "loss": 2.2847, "step": 2606 }, { "epoch": 0.26, "learning_rate": 1.7326102701648672e-05, "loss": 2.3142, "step": 2607 }, { "epoch": 0.26, "learning_rate": 1.732389353596726e-05, "loss": 2.4682, "step": 2608 }, { "epoch": 0.26, "learning_rate": 1.7321683599024926e-05, "loss": 2.3595, "step": 2609 }, { "epoch": 0.26, "learning_rate": 1.7319472891054404e-05, "loss": 2.3995, "step": 2610 }, { "epoch": 0.26, "learning_rate": 1.7317261412288494e-05, "loss": 2.3833, "step": 2611 }, { "epoch": 0.26, "learning_rate": 1.731504916296008e-05, "loss": 2.3182, "step": 2612 }, { "epoch": 0.26, "learning_rate": 1.7312836143302125e-05, "loss": 2.4317, "step": 2613 }, { "epoch": 0.26, "learning_rate": 1.7310622353547683e-05, "loss": 2.4433, "step": 2614 }, { "epoch": 0.26, "learning_rate": 1.7308407793929878e-05, "loss": 2.4568, "step": 2615 }, { "epoch": 0.26, "learning_rate": 1.7306192464681924e-05, "loss": 2.4212, "step": 2616 }, { "epoch": 0.26, "learning_rate": 1.7303976366037106e-05, "loss": 2.3999, "step": 2617 }, { "epoch": 0.26, "learning_rate": 1.7301759498228803e-05, "loss": 2.4355, "step": 2618 }, { "epoch": 0.26, "learning_rate": 1.7299541861490466e-05, "loss": 2.4156, "step": 2619 }, { "epoch": 0.26, "learning_rate": 1.7297323456055625e-05, "loss": 2.372, "step": 2620 }, { "epoch": 0.26, "learning_rate": 1.7295104282157894e-05, "loss": 2.509, "step": 2621 }, { "epoch": 0.26, "learning_rate": 1.7292884340030976e-05, "loss": 2.494, "step": 2622 }, { "epoch": 0.26, "learning_rate": 1.7290663629908637e-05, "loss": 2.4127, "step": 2623 }, { "epoch": 0.26, "learning_rate": 1.7288442152024745e-05, "loss": 2.4957, "step": 2624 }, { "epoch": 0.26, "learning_rate": 1.7286219906613234e-05, "loss": 2.4656, "step": 2625 }, { "epoch": 0.26, "learning_rate": 1.7283996893908118e-05, "loss": 2.3869, "step": 2626 }, { "epoch": 0.26, "learning_rate": 1.7281773114143504e-05, "loss": 2.413, "step": 2627 }, { "epoch": 0.26, "learning_rate": 1.727954856755357e-05, "loss": 2.3756, "step": 2628 }, { "epoch": 0.26, "learning_rate": 1.727732325437258e-05, "loss": 2.3658, "step": 2629 }, { "epoch": 0.26, "learning_rate": 1.727509717483487e-05, "loss": 2.4304, "step": 2630 }, { "epoch": 0.26, "learning_rate": 1.7272870329174872e-05, "loss": 2.3546, "step": 2631 }, { "epoch": 0.26, "learning_rate": 1.727064271762708e-05, "loss": 2.4419, "step": 2632 }, { "epoch": 0.26, "learning_rate": 1.726841434042608e-05, "loss": 2.3705, "step": 2633 }, { "epoch": 0.26, "learning_rate": 1.7266185197806547e-05, "loss": 2.4217, "step": 2634 }, { "epoch": 0.26, "learning_rate": 1.7263955290003213e-05, "loss": 2.4081, "step": 2635 }, { "epoch": 0.26, "learning_rate": 1.7261724617250913e-05, "loss": 2.4585, "step": 2636 }, { "epoch": 0.26, "learning_rate": 1.7259493179784546e-05, "loss": 2.4319, "step": 2637 }, { "epoch": 0.26, "learning_rate": 1.725726097783911e-05, "loss": 2.4045, "step": 2638 }, { "epoch": 0.26, "learning_rate": 1.725502801164966e-05, "loss": 2.4018, "step": 2639 }, { "epoch": 0.26, "learning_rate": 1.7252794281451354e-05, "loss": 2.5121, "step": 2640 }, { "epoch": 0.26, "learning_rate": 1.7250559787479414e-05, "loss": 2.4062, "step": 2641 }, { "epoch": 0.26, "learning_rate": 1.7248324529969153e-05, "loss": 2.4241, "step": 2642 }, { "epoch": 0.26, "learning_rate": 1.7246088509155958e-05, "loss": 2.3634, "step": 2643 }, { "epoch": 0.26, "learning_rate": 1.72438517252753e-05, "loss": 2.4252, "step": 2644 }, { "epoch": 0.27, "learning_rate": 1.724161417856273e-05, "loss": 2.2641, "step": 2645 }, { "epoch": 0.27, "learning_rate": 1.723937586925388e-05, "loss": 2.4496, "step": 2646 }, { "epoch": 0.27, "learning_rate": 1.723713679758445e-05, "loss": 2.4168, "step": 2647 }, { "epoch": 0.27, "learning_rate": 1.7234896963790248e-05, "loss": 2.4915, "step": 2648 }, { "epoch": 0.27, "learning_rate": 1.7232656368107134e-05, "loss": 2.3485, "step": 2649 }, { "epoch": 0.27, "learning_rate": 1.723041501077106e-05, "loss": 2.5357, "step": 2650 }, { "epoch": 0.27, "learning_rate": 1.722817289201806e-05, "loss": 2.4121, "step": 2651 }, { "epoch": 0.27, "learning_rate": 1.7225930012084246e-05, "loss": 2.4773, "step": 2652 }, { "epoch": 0.27, "learning_rate": 1.7223686371205807e-05, "loss": 2.4909, "step": 2653 }, { "epoch": 0.27, "learning_rate": 1.722144196961902e-05, "loss": 2.4124, "step": 2654 }, { "epoch": 0.27, "learning_rate": 1.7219196807560238e-05, "loss": 2.4423, "step": 2655 }, { "epoch": 0.27, "learning_rate": 1.7216950885265888e-05, "loss": 2.3432, "step": 2656 }, { "epoch": 0.27, "learning_rate": 1.7214704202972486e-05, "loss": 2.371, "step": 2657 }, { "epoch": 0.27, "learning_rate": 1.7212456760916623e-05, "loss": 2.3821, "step": 2658 }, { "epoch": 0.27, "learning_rate": 1.7210208559334973e-05, "loss": 2.461, "step": 2659 }, { "epoch": 0.27, "learning_rate": 1.7207959598464285e-05, "loss": 2.4933, "step": 2660 }, { "epoch": 0.27, "learning_rate": 1.72057098785414e-05, "loss": 2.3815, "step": 2661 }, { "epoch": 0.27, "learning_rate": 1.7203459399803217e-05, "loss": 2.3569, "step": 2662 }, { "epoch": 0.27, "learning_rate": 1.720120816248674e-05, "loss": 2.3876, "step": 2663 }, { "epoch": 0.27, "learning_rate": 1.7198956166829036e-05, "loss": 2.3957, "step": 2664 }, { "epoch": 0.27, "learning_rate": 1.719670341306726e-05, "loss": 2.4444, "step": 2665 }, { "epoch": 0.27, "learning_rate": 1.7194449901438636e-05, "loss": 2.4418, "step": 2666 }, { "epoch": 0.27, "learning_rate": 1.7192195632180486e-05, "loss": 2.4049, "step": 2667 }, { "epoch": 0.27, "learning_rate": 1.71899406055302e-05, "loss": 2.3264, "step": 2668 }, { "epoch": 0.27, "learning_rate": 1.718768482172524e-05, "loss": 2.4395, "step": 2669 }, { "epoch": 0.27, "learning_rate": 1.7185428281003166e-05, "loss": 2.468, "step": 2670 }, { "epoch": 0.27, "learning_rate": 1.7183170983601604e-05, "loss": 2.4557, "step": 2671 }, { "epoch": 0.27, "learning_rate": 1.7180912929758267e-05, "loss": 2.2854, "step": 2672 }, { "epoch": 0.27, "learning_rate": 1.7178654119710946e-05, "loss": 2.4154, "step": 2673 }, { "epoch": 0.27, "learning_rate": 1.7176394553697507e-05, "loss": 2.4619, "step": 2674 }, { "epoch": 0.27, "learning_rate": 1.71741342319559e-05, "loss": 2.4381, "step": 2675 }, { "epoch": 0.27, "learning_rate": 1.7171873154724158e-05, "loss": 2.4045, "step": 2676 }, { "epoch": 0.27, "learning_rate": 1.7169611322240382e-05, "loss": 2.325, "step": 2677 }, { "epoch": 0.27, "learning_rate": 1.7167348734742767e-05, "loss": 2.5547, "step": 2678 }, { "epoch": 0.27, "learning_rate": 1.7165085392469577e-05, "loss": 2.4649, "step": 2679 }, { "epoch": 0.27, "learning_rate": 1.716282129565916e-05, "loss": 2.3304, "step": 2680 }, { "epoch": 0.27, "learning_rate": 1.716055644454994e-05, "loss": 2.4163, "step": 2681 }, { "epoch": 0.27, "learning_rate": 1.7158290839380425e-05, "loss": 2.4225, "step": 2682 }, { "epoch": 0.27, "learning_rate": 1.7156024480389202e-05, "loss": 2.3909, "step": 2683 }, { "epoch": 0.27, "learning_rate": 1.715375736781493e-05, "loss": 2.3617, "step": 2684 }, { "epoch": 0.27, "learning_rate": 1.7151489501896362e-05, "loss": 2.3859, "step": 2685 }, { "epoch": 0.27, "learning_rate": 1.714922088287231e-05, "loss": 2.4371, "step": 2686 }, { "epoch": 0.27, "learning_rate": 1.7146951510981685e-05, "loss": 2.4183, "step": 2687 }, { "epoch": 0.27, "learning_rate": 1.7144681386463468e-05, "loss": 2.4224, "step": 2688 }, { "epoch": 0.27, "learning_rate": 1.7142410509556716e-05, "loss": 2.2987, "step": 2689 }, { "epoch": 0.27, "learning_rate": 1.7140138880500574e-05, "loss": 2.4107, "step": 2690 }, { "epoch": 0.27, "learning_rate": 1.7137866499534253e-05, "loss": 2.41, "step": 2691 }, { "epoch": 0.27, "learning_rate": 1.7135593366897064e-05, "loss": 2.389, "step": 2692 }, { "epoch": 0.27, "learning_rate": 1.7133319482828376e-05, "loss": 2.3966, "step": 2693 }, { "epoch": 0.27, "learning_rate": 1.713104484756765e-05, "loss": 2.4516, "step": 2694 }, { "epoch": 0.27, "learning_rate": 1.712876946135442e-05, "loss": 2.366, "step": 2695 }, { "epoch": 0.27, "learning_rate": 1.7126493324428307e-05, "loss": 2.4767, "step": 2696 }, { "epoch": 0.27, "learning_rate": 1.7124216437028995e-05, "loss": 2.5263, "step": 2697 }, { "epoch": 0.27, "learning_rate": 1.712193879939627e-05, "loss": 2.3845, "step": 2698 }, { "epoch": 0.27, "learning_rate": 1.711966041176997e-05, "loss": 2.3848, "step": 2699 }, { "epoch": 0.27, "learning_rate": 1.7117381274390036e-05, "loss": 2.3793, "step": 2700 }, { "epoch": 0.27, "learning_rate": 1.7115101387496476e-05, "loss": 2.3996, "step": 2701 }, { "epoch": 0.27, "learning_rate": 1.711282075132938e-05, "loss": 2.4256, "step": 2702 }, { "epoch": 0.27, "learning_rate": 1.7110539366128916e-05, "loss": 2.444, "step": 2703 }, { "epoch": 0.27, "learning_rate": 1.7108257232135325e-05, "loss": 2.3145, "step": 2704 }, { "epoch": 0.27, "learning_rate": 1.7105974349588943e-05, "loss": 2.4111, "step": 2705 }, { "epoch": 0.27, "learning_rate": 1.7103690718730166e-05, "loss": 2.3927, "step": 2706 }, { "epoch": 0.27, "learning_rate": 1.7101406339799486e-05, "loss": 2.3888, "step": 2707 }, { "epoch": 0.27, "learning_rate": 1.7099121213037454e-05, "loss": 2.3931, "step": 2708 }, { "epoch": 0.27, "learning_rate": 1.7096835338684722e-05, "loss": 2.4984, "step": 2709 }, { "epoch": 0.27, "learning_rate": 1.7094548716982004e-05, "loss": 2.3409, "step": 2710 }, { "epoch": 0.27, "learning_rate": 1.7092261348170097e-05, "loss": 2.4206, "step": 2711 }, { "epoch": 0.27, "learning_rate": 1.7089973232489887e-05, "loss": 2.4878, "step": 2712 }, { "epoch": 0.27, "learning_rate": 1.7087684370182318e-05, "loss": 2.3823, "step": 2713 }, { "epoch": 0.27, "learning_rate": 1.708539476148843e-05, "loss": 2.3669, "step": 2714 }, { "epoch": 0.27, "learning_rate": 1.7083104406649337e-05, "loss": 2.4566, "step": 2715 }, { "epoch": 0.27, "learning_rate": 1.7080813305906226e-05, "loss": 2.425, "step": 2716 }, { "epoch": 0.27, "learning_rate": 1.7078521459500375e-05, "loss": 2.291, "step": 2717 }, { "epoch": 0.27, "learning_rate": 1.7076228867673125e-05, "loss": 2.3978, "step": 2718 }, { "epoch": 0.27, "learning_rate": 1.7073935530665906e-05, "loss": 2.4076, "step": 2719 }, { "epoch": 0.27, "learning_rate": 1.7071641448720223e-05, "loss": 2.435, "step": 2720 }, { "epoch": 0.27, "learning_rate": 1.706934662207766e-05, "loss": 2.3231, "step": 2721 }, { "epoch": 0.27, "learning_rate": 1.7067051050979885e-05, "loss": 2.3492, "step": 2722 }, { "epoch": 0.27, "learning_rate": 1.706475473566863e-05, "loss": 2.43, "step": 2723 }, { "epoch": 0.27, "learning_rate": 1.7062457676385716e-05, "loss": 2.4593, "step": 2724 }, { "epoch": 0.27, "learning_rate": 1.7060159873373047e-05, "loss": 2.3351, "step": 2725 }, { "epoch": 0.27, "learning_rate": 1.705786132687259e-05, "loss": 2.4321, "step": 2726 }, { "epoch": 0.27, "learning_rate": 1.705556203712641e-05, "loss": 2.4316, "step": 2727 }, { "epoch": 0.27, "learning_rate": 1.7053262004376624e-05, "loss": 2.3606, "step": 2728 }, { "epoch": 0.27, "learning_rate": 1.7050961228865463e-05, "loss": 2.4686, "step": 2729 }, { "epoch": 0.27, "learning_rate": 1.7048659710835195e-05, "loss": 2.4461, "step": 2730 }, { "epoch": 0.27, "learning_rate": 1.70463574505282e-05, "loss": 2.3347, "step": 2731 }, { "epoch": 0.27, "learning_rate": 1.704405444818692e-05, "loss": 2.4547, "step": 2732 }, { "epoch": 0.27, "learning_rate": 1.704175070405388e-05, "loss": 2.3995, "step": 2733 }, { "epoch": 0.27, "learning_rate": 1.703944621837168e-05, "loss": 2.3825, "step": 2734 }, { "epoch": 0.27, "learning_rate": 1.7037140991383004e-05, "loss": 2.379, "step": 2735 }, { "epoch": 0.27, "learning_rate": 1.7034835023330598e-05, "loss": 2.436, "step": 2736 }, { "epoch": 0.27, "learning_rate": 1.7032528314457312e-05, "loss": 2.4224, "step": 2737 }, { "epoch": 0.27, "learning_rate": 1.7030220865006048e-05, "loss": 2.3535, "step": 2738 }, { "epoch": 0.27, "learning_rate": 1.70279126752198e-05, "loss": 2.3976, "step": 2739 }, { "epoch": 0.27, "learning_rate": 1.7025603745341648e-05, "loss": 2.3916, "step": 2740 }, { "epoch": 0.27, "learning_rate": 1.7023294075614726e-05, "loss": 2.4697, "step": 2741 }, { "epoch": 0.27, "learning_rate": 1.7020983666282268e-05, "loss": 2.3679, "step": 2742 }, { "epoch": 0.27, "learning_rate": 1.7018672517587577e-05, "loss": 2.4639, "step": 2743 }, { "epoch": 0.27, "learning_rate": 1.701636062977403e-05, "loss": 2.4562, "step": 2744 }, { "epoch": 0.28, "learning_rate": 1.7014048003085085e-05, "loss": 2.438, "step": 2745 }, { "epoch": 0.28, "learning_rate": 1.7011734637764287e-05, "loss": 2.4405, "step": 2746 }, { "epoch": 0.28, "learning_rate": 1.7009420534055244e-05, "loss": 2.3913, "step": 2747 }, { "epoch": 0.28, "learning_rate": 1.7007105692201652e-05, "loss": 2.4142, "step": 2748 }, { "epoch": 0.28, "learning_rate": 1.700479011244728e-05, "loss": 2.3542, "step": 2749 }, { "epoch": 0.28, "learning_rate": 1.7002473795035975e-05, "loss": 2.4225, "step": 2750 }, { "epoch": 0.28, "learning_rate": 1.700015674021166e-05, "loss": 2.4005, "step": 2751 }, { "epoch": 0.28, "learning_rate": 1.6997838948218347e-05, "loss": 2.3926, "step": 2752 }, { "epoch": 0.28, "learning_rate": 1.6995520419300108e-05, "loss": 2.3337, "step": 2753 }, { "epoch": 0.28, "learning_rate": 1.6993201153701106e-05, "loss": 2.3733, "step": 2754 }, { "epoch": 0.28, "learning_rate": 1.6990881151665574e-05, "loss": 2.3797, "step": 2755 }, { "epoch": 0.28, "learning_rate": 1.6988560413437828e-05, "loss": 2.4357, "step": 2756 }, { "epoch": 0.28, "learning_rate": 1.698623893926226e-05, "loss": 2.3253, "step": 2757 }, { "epoch": 0.28, "learning_rate": 1.698391672938334e-05, "loss": 2.452, "step": 2758 }, { "epoch": 0.28, "learning_rate": 1.6981593784045603e-05, "loss": 2.3756, "step": 2759 }, { "epoch": 0.28, "learning_rate": 1.697927010349369e-05, "loss": 2.4288, "step": 2760 }, { "epoch": 0.28, "learning_rate": 1.697694568797229e-05, "loss": 2.4256, "step": 2761 }, { "epoch": 0.28, "learning_rate": 1.6974620537726185e-05, "loss": 2.3933, "step": 2762 }, { "epoch": 0.28, "learning_rate": 1.6972294653000224e-05, "loss": 2.3758, "step": 2763 }, { "epoch": 0.28, "learning_rate": 1.696996803403935e-05, "loss": 2.4095, "step": 2764 }, { "epoch": 0.28, "learning_rate": 1.6967640681088574e-05, "loss": 2.4281, "step": 2765 }, { "epoch": 0.28, "learning_rate": 1.6965312594392975e-05, "loss": 2.4759, "step": 2766 }, { "epoch": 0.28, "learning_rate": 1.6962983774197723e-05, "loss": 2.3505, "step": 2767 }, { "epoch": 0.28, "learning_rate": 1.6960654220748058e-05, "loss": 2.4406, "step": 2768 }, { "epoch": 0.28, "learning_rate": 1.6958323934289304e-05, "loss": 2.4624, "step": 2769 }, { "epoch": 0.28, "learning_rate": 1.6955992915066854e-05, "loss": 2.3435, "step": 2770 }, { "epoch": 0.28, "learning_rate": 1.6953661163326184e-05, "loss": 2.3669, "step": 2771 }, { "epoch": 0.28, "learning_rate": 1.695132867931284e-05, "loss": 2.3995, "step": 2772 }, { "epoch": 0.28, "learning_rate": 1.6948995463272452e-05, "loss": 2.4771, "step": 2773 }, { "epoch": 0.28, "learning_rate": 1.694666151545073e-05, "loss": 2.4903, "step": 2774 }, { "epoch": 0.28, "learning_rate": 1.6944326836093453e-05, "loss": 2.3923, "step": 2775 }, { "epoch": 0.28, "learning_rate": 1.694199142544648e-05, "loss": 2.3583, "step": 2776 }, { "epoch": 0.28, "learning_rate": 1.6939655283755746e-05, "loss": 2.5457, "step": 2777 }, { "epoch": 0.28, "learning_rate": 1.6937318411267266e-05, "loss": 2.3831, "step": 2778 }, { "epoch": 0.28, "learning_rate": 1.693498080822713e-05, "loss": 2.4505, "step": 2779 }, { "epoch": 0.28, "learning_rate": 1.6932642474881506e-05, "loss": 2.3677, "step": 2780 }, { "epoch": 0.28, "learning_rate": 1.6930303411476633e-05, "loss": 2.3757, "step": 2781 }, { "epoch": 0.28, "learning_rate": 1.6927963618258842e-05, "loss": 2.4375, "step": 2782 }, { "epoch": 0.28, "learning_rate": 1.692562309547452e-05, "loss": 2.3521, "step": 2783 }, { "epoch": 0.28, "learning_rate": 1.692328184337015e-05, "loss": 2.4354, "step": 2784 }, { "epoch": 0.28, "learning_rate": 1.6920939862192275e-05, "loss": 2.4202, "step": 2785 }, { "epoch": 0.28, "learning_rate": 1.691859715218753e-05, "loss": 2.3825, "step": 2786 }, { "epoch": 0.28, "learning_rate": 1.691625371360262e-05, "loss": 2.4893, "step": 2787 }, { "epoch": 0.28, "learning_rate": 1.6913909546684323e-05, "loss": 2.3928, "step": 2788 }, { "epoch": 0.28, "learning_rate": 1.6911564651679496e-05, "loss": 2.3407, "step": 2789 }, { "epoch": 0.28, "learning_rate": 1.6909219028835074e-05, "loss": 2.3551, "step": 2790 }, { "epoch": 0.28, "learning_rate": 1.690687267839808e-05, "loss": 2.494, "step": 2791 }, { "epoch": 0.28, "learning_rate": 1.690452560061559e-05, "loss": 2.3577, "step": 2792 }, { "epoch": 0.28, "learning_rate": 1.6902177795734775e-05, "loss": 2.3901, "step": 2793 }, { "epoch": 0.28, "learning_rate": 1.689982926400287e-05, "loss": 2.4569, "step": 2794 }, { "epoch": 0.28, "learning_rate": 1.68974800056672e-05, "loss": 2.4496, "step": 2795 }, { "epoch": 0.28, "learning_rate": 1.6895130020975154e-05, "loss": 2.3672, "step": 2796 }, { "epoch": 0.28, "learning_rate": 1.6892779310174207e-05, "loss": 2.5088, "step": 2797 }, { "epoch": 0.28, "learning_rate": 1.6890427873511906e-05, "loss": 2.471, "step": 2798 }, { "epoch": 0.28, "learning_rate": 1.6888075711235873e-05, "loss": 2.4123, "step": 2799 }, { "epoch": 0.28, "learning_rate": 1.688572282359381e-05, "loss": 2.3905, "step": 2800 }, { "epoch": 0.28, "learning_rate": 1.6883369210833494e-05, "loss": 2.3822, "step": 2801 }, { "epoch": 0.28, "learning_rate": 1.6881014873202777e-05, "loss": 2.4491, "step": 2802 }, { "epoch": 0.28, "learning_rate": 1.6878659810949587e-05, "loss": 2.3871, "step": 2803 }, { "epoch": 0.28, "learning_rate": 1.687630402432193e-05, "loss": 2.4319, "step": 2804 }, { "epoch": 0.28, "learning_rate": 1.6873947513567893e-05, "loss": 2.4248, "step": 2805 }, { "epoch": 0.28, "learning_rate": 1.687159027893563e-05, "loss": 2.4208, "step": 2806 }, { "epoch": 0.28, "learning_rate": 1.6869232320673377e-05, "loss": 2.4068, "step": 2807 }, { "epoch": 0.28, "learning_rate": 1.686687363902944e-05, "loss": 2.4104, "step": 2808 }, { "epoch": 0.28, "learning_rate": 1.6864514234252212e-05, "loss": 2.4762, "step": 2809 }, { "epoch": 0.28, "learning_rate": 1.6862154106590152e-05, "loss": 2.4224, "step": 2810 }, { "epoch": 0.28, "learning_rate": 1.6859793256291802e-05, "loss": 2.4021, "step": 2811 }, { "epoch": 0.28, "learning_rate": 1.6857431683605777e-05, "loss": 2.4349, "step": 2812 }, { "epoch": 0.28, "learning_rate": 1.6855069388780766e-05, "loss": 2.3354, "step": 2813 }, { "epoch": 0.28, "learning_rate": 1.685270637206554e-05, "loss": 2.4234, "step": 2814 }, { "epoch": 0.28, "learning_rate": 1.6850342633708935e-05, "loss": 2.3751, "step": 2815 }, { "epoch": 0.28, "learning_rate": 1.684797817395988e-05, "loss": 2.3734, "step": 2816 }, { "epoch": 0.28, "learning_rate": 1.6845612993067363e-05, "loss": 2.4313, "step": 2817 }, { "epoch": 0.28, "learning_rate": 1.684324709128046e-05, "loss": 2.2783, "step": 2818 }, { "epoch": 0.28, "learning_rate": 1.6840880468848314e-05, "loss": 2.3564, "step": 2819 }, { "epoch": 0.28, "learning_rate": 1.6838513126020153e-05, "loss": 2.4207, "step": 2820 }, { "epoch": 0.28, "learning_rate": 1.683614506304527e-05, "loss": 2.4256, "step": 2821 }, { "epoch": 0.28, "learning_rate": 1.6833776280173046e-05, "loss": 2.5191, "step": 2822 }, { "epoch": 0.28, "learning_rate": 1.683140677765293e-05, "loss": 2.4075, "step": 2823 }, { "epoch": 0.28, "learning_rate": 1.6829036555734447e-05, "loss": 2.4743, "step": 2824 }, { "epoch": 0.28, "learning_rate": 1.6826665614667195e-05, "loss": 2.3645, "step": 2825 }, { "epoch": 0.28, "learning_rate": 1.6824293954700855e-05, "loss": 2.4496, "step": 2826 }, { "epoch": 0.28, "learning_rate": 1.6821921576085186e-05, "loss": 2.3934, "step": 2827 }, { "epoch": 0.28, "learning_rate": 1.6819548479070012e-05, "loss": 2.3388, "step": 2828 }, { "epoch": 0.28, "learning_rate": 1.681717466390524e-05, "loss": 2.3516, "step": 2829 }, { "epoch": 0.28, "learning_rate": 1.6814800130840848e-05, "loss": 2.4674, "step": 2830 }, { "epoch": 0.28, "learning_rate": 1.6812424880126895e-05, "loss": 2.4506, "step": 2831 }, { "epoch": 0.28, "learning_rate": 1.681004891201351e-05, "loss": 2.3328, "step": 2832 }, { "epoch": 0.28, "learning_rate": 1.68076722267509e-05, "loss": 2.4526, "step": 2833 }, { "epoch": 0.28, "learning_rate": 1.6805294824589353e-05, "loss": 2.4204, "step": 2834 }, { "epoch": 0.28, "learning_rate": 1.680291670577922e-05, "loss": 2.4095, "step": 2835 }, { "epoch": 0.28, "learning_rate": 1.6800537870570943e-05, "loss": 2.4671, "step": 2836 }, { "epoch": 0.28, "learning_rate": 1.679815831921502e-05, "loss": 2.4045, "step": 2837 }, { "epoch": 0.28, "learning_rate": 1.679577805196205e-05, "loss": 2.4902, "step": 2838 }, { "epoch": 0.28, "learning_rate": 1.6793397069062678e-05, "loss": 2.4785, "step": 2839 }, { "epoch": 0.28, "learning_rate": 1.679101537076765e-05, "loss": 2.4048, "step": 2840 }, { "epoch": 0.28, "learning_rate": 1.6788632957327772e-05, "loss": 2.4036, "step": 2841 }, { "epoch": 0.28, "learning_rate": 1.6786249828993933e-05, "loss": 2.4042, "step": 2842 }, { "epoch": 0.28, "learning_rate": 1.678386598601709e-05, "loss": 2.4719, "step": 2843 }, { "epoch": 0.28, "learning_rate": 1.6781481428648284e-05, "loss": 2.439, "step": 2844 }, { "epoch": 0.29, "learning_rate": 1.6779096157138624e-05, "loss": 2.308, "step": 2845 }, { "epoch": 0.29, "learning_rate": 1.6776710171739297e-05, "loss": 2.4206, "step": 2846 }, { "epoch": 0.29, "learning_rate": 1.6774323472701565e-05, "loss": 2.4621, "step": 2847 }, { "epoch": 0.29, "learning_rate": 1.6771936060276765e-05, "loss": 2.4164, "step": 2848 }, { "epoch": 0.29, "learning_rate": 1.6769547934716315e-05, "loss": 2.502, "step": 2849 }, { "epoch": 0.29, "learning_rate": 1.67671590962717e-05, "loss": 2.3214, "step": 2850 }, { "epoch": 0.29, "learning_rate": 1.6764769545194475e-05, "loss": 2.447, "step": 2851 }, { "epoch": 0.29, "learning_rate": 1.6762379281736287e-05, "loss": 2.4484, "step": 2852 }, { "epoch": 0.29, "learning_rate": 1.675998830614884e-05, "loss": 2.4061, "step": 2853 }, { "epoch": 0.29, "learning_rate": 1.6757596618683933e-05, "loss": 2.3715, "step": 2854 }, { "epoch": 0.29, "learning_rate": 1.675520421959342e-05, "loss": 2.4631, "step": 2855 }, { "epoch": 0.29, "learning_rate": 1.675281110912924e-05, "loss": 2.4533, "step": 2856 }, { "epoch": 0.29, "learning_rate": 1.6750417287543408e-05, "loss": 2.3535, "step": 2857 }, { "epoch": 0.29, "learning_rate": 1.674802275508801e-05, "loss": 2.4251, "step": 2858 }, { "epoch": 0.29, "learning_rate": 1.6745627512015206e-05, "loss": 2.3922, "step": 2859 }, { "epoch": 0.29, "learning_rate": 1.6743231558577236e-05, "loss": 2.3259, "step": 2860 }, { "epoch": 0.29, "learning_rate": 1.6740834895026414e-05, "loss": 2.3824, "step": 2861 }, { "epoch": 0.29, "learning_rate": 1.6738437521615117e-05, "loss": 2.4058, "step": 2862 }, { "epoch": 0.29, "learning_rate": 1.6736039438595815e-05, "loss": 2.4258, "step": 2863 }, { "epoch": 0.29, "learning_rate": 1.6733640646221044e-05, "loss": 2.4773, "step": 2864 }, { "epoch": 0.29, "learning_rate": 1.6731241144743415e-05, "loss": 2.4491, "step": 2865 }, { "epoch": 0.29, "learning_rate": 1.6728840934415608e-05, "loss": 2.3441, "step": 2866 }, { "epoch": 0.29, "learning_rate": 1.672644001549039e-05, "loss": 2.5092, "step": 2867 }, { "epoch": 0.29, "learning_rate": 1.672403838822059e-05, "loss": 2.4665, "step": 2868 }, { "epoch": 0.29, "learning_rate": 1.672163605285912e-05, "loss": 2.4815, "step": 2869 }, { "epoch": 0.29, "learning_rate": 1.6719233009658965e-05, "loss": 2.4605, "step": 2870 }, { "epoch": 0.29, "learning_rate": 1.671682925887318e-05, "loss": 2.3473, "step": 2871 }, { "epoch": 0.29, "learning_rate": 1.6714424800754902e-05, "loss": 2.4988, "step": 2872 }, { "epoch": 0.29, "learning_rate": 1.6712019635557332e-05, "loss": 2.3728, "step": 2873 }, { "epoch": 0.29, "learning_rate": 1.6709613763533763e-05, "loss": 2.3287, "step": 2874 }, { "epoch": 0.29, "learning_rate": 1.670720718493754e-05, "loss": 2.4093, "step": 2875 }, { "epoch": 0.29, "learning_rate": 1.67047999000221e-05, "loss": 2.4335, "step": 2876 }, { "epoch": 0.29, "learning_rate": 1.670239190904095e-05, "loss": 2.3513, "step": 2877 }, { "epoch": 0.29, "learning_rate": 1.6699983212247662e-05, "loss": 2.3976, "step": 2878 }, { "epoch": 0.29, "learning_rate": 1.6697573809895896e-05, "loss": 2.3463, "step": 2879 }, { "epoch": 0.29, "learning_rate": 1.6695163702239378e-05, "loss": 2.3847, "step": 2880 }, { "epoch": 0.29, "learning_rate": 1.669275288953191e-05, "loss": 2.3754, "step": 2881 }, { "epoch": 0.29, "learning_rate": 1.669034137202737e-05, "loss": 2.4247, "step": 2882 }, { "epoch": 0.29, "learning_rate": 1.668792914997971e-05, "loss": 2.3823, "step": 2883 }, { "epoch": 0.29, "learning_rate": 1.668551622364295e-05, "loss": 2.4638, "step": 2884 }, { "epoch": 0.29, "learning_rate": 1.6683102593271195e-05, "loss": 2.3385, "step": 2885 }, { "epoch": 0.29, "learning_rate": 1.6680688259118615e-05, "loss": 2.4064, "step": 2886 }, { "epoch": 0.29, "learning_rate": 1.667827322143946e-05, "loss": 2.4735, "step": 2887 }, { "epoch": 0.29, "learning_rate": 1.667585748048805e-05, "loss": 2.3079, "step": 2888 }, { "epoch": 0.29, "learning_rate": 1.667344103651878e-05, "loss": 2.2575, "step": 2889 }, { "epoch": 0.29, "learning_rate": 1.6671023889786115e-05, "loss": 2.3055, "step": 2890 }, { "epoch": 0.29, "learning_rate": 1.666860604054461e-05, "loss": 2.4268, "step": 2891 }, { "epoch": 0.29, "learning_rate": 1.6666187489048876e-05, "loss": 2.3992, "step": 2892 }, { "epoch": 0.29, "learning_rate": 1.6663768235553605e-05, "loss": 2.4236, "step": 2893 }, { "epoch": 0.29, "learning_rate": 1.666134828031356e-05, "loss": 2.4265, "step": 2894 }, { "epoch": 0.29, "learning_rate": 1.6658927623583587e-05, "loss": 2.4256, "step": 2895 }, { "epoch": 0.29, "learning_rate": 1.6656506265618594e-05, "loss": 2.4103, "step": 2896 }, { "epoch": 0.29, "learning_rate": 1.6654084206673572e-05, "loss": 2.3277, "step": 2897 }, { "epoch": 0.29, "learning_rate": 1.6651661447003578e-05, "loss": 2.2368, "step": 2898 }, { "epoch": 0.29, "learning_rate": 1.6649237986863746e-05, "loss": 2.4824, "step": 2899 }, { "epoch": 0.29, "learning_rate": 1.664681382650929e-05, "loss": 2.3889, "step": 2900 }, { "epoch": 0.29, "learning_rate": 1.664438896619549e-05, "loss": 2.4251, "step": 2901 }, { "epoch": 0.29, "learning_rate": 1.6641963406177695e-05, "loss": 2.3324, "step": 2902 }, { "epoch": 0.29, "learning_rate": 1.6639537146711348e-05, "loss": 2.4137, "step": 2903 }, { "epoch": 0.29, "learning_rate": 1.6637110188051944e-05, "loss": 2.3566, "step": 2904 }, { "epoch": 0.29, "learning_rate": 1.663468253045506e-05, "loss": 2.4509, "step": 2905 }, { "epoch": 0.29, "learning_rate": 1.6632254174176345e-05, "loss": 2.4269, "step": 2906 }, { "epoch": 0.29, "learning_rate": 1.662982511947153e-05, "loss": 2.4161, "step": 2907 }, { "epoch": 0.29, "learning_rate": 1.6627395366596408e-05, "loss": 2.3352, "step": 2908 }, { "epoch": 0.29, "learning_rate": 1.6624964915806848e-05, "loss": 2.4371, "step": 2909 }, { "epoch": 0.29, "learning_rate": 1.6622533767358798e-05, "loss": 2.3539, "step": 2910 }, { "epoch": 0.29, "learning_rate": 1.6620101921508275e-05, "loss": 2.3722, "step": 2911 }, { "epoch": 0.29, "learning_rate": 1.6617669378511374e-05, "loss": 2.4338, "step": 2912 }, { "epoch": 0.29, "learning_rate": 1.661523613862426e-05, "loss": 2.3893, "step": 2913 }, { "epoch": 0.29, "learning_rate": 1.661280220210316e-05, "loss": 2.3754, "step": 2914 }, { "epoch": 0.29, "learning_rate": 1.6610367569204398e-05, "loss": 2.3642, "step": 2915 }, { "epoch": 0.29, "learning_rate": 1.6607932240184356e-05, "loss": 2.3613, "step": 2916 }, { "epoch": 0.29, "learning_rate": 1.6605496215299493e-05, "loss": 2.4767, "step": 2917 }, { "epoch": 0.29, "learning_rate": 1.660305949480634e-05, "loss": 2.4633, "step": 2918 }, { "epoch": 0.29, "learning_rate": 1.66006220789615e-05, "loss": 2.4269, "step": 2919 }, { "epoch": 0.29, "learning_rate": 1.659818396802165e-05, "loss": 2.3777, "step": 2920 }, { "epoch": 0.29, "learning_rate": 1.6595745162243548e-05, "loss": 2.5145, "step": 2921 }, { "epoch": 0.29, "learning_rate": 1.6593305661884013e-05, "loss": 2.3127, "step": 2922 }, { "epoch": 0.29, "learning_rate": 1.6590865467199946e-05, "loss": 2.42, "step": 2923 }, { "epoch": 0.29, "learning_rate": 1.6588424578448314e-05, "loss": 2.4362, "step": 2924 }, { "epoch": 0.29, "learning_rate": 1.6585982995886165e-05, "loss": 2.4056, "step": 2925 }, { "epoch": 0.29, "learning_rate": 1.658354071977061e-05, "loss": 2.4067, "step": 2926 }, { "epoch": 0.29, "learning_rate": 1.658109775035885e-05, "loss": 2.3366, "step": 2927 }, { "epoch": 0.29, "learning_rate": 1.6578654087908134e-05, "loss": 2.3567, "step": 2928 }, { "epoch": 0.29, "learning_rate": 1.657620973267581e-05, "loss": 2.4075, "step": 2929 }, { "epoch": 0.29, "learning_rate": 1.657376468491928e-05, "loss": 2.4323, "step": 2930 }, { "epoch": 0.29, "learning_rate": 1.657131894489602e-05, "loss": 2.3238, "step": 2931 }, { "epoch": 0.29, "learning_rate": 1.6568872512863603e-05, "loss": 2.3889, "step": 2932 }, { "epoch": 0.29, "learning_rate": 1.6566425389079644e-05, "loss": 2.4288, "step": 2933 }, { "epoch": 0.29, "learning_rate": 1.6563977573801843e-05, "loss": 2.3249, "step": 2934 }, { "epoch": 0.29, "learning_rate": 1.6561529067287975e-05, "loss": 2.4026, "step": 2935 }, { "epoch": 0.29, "learning_rate": 1.655907986979589e-05, "loss": 2.4187, "step": 2936 }, { "epoch": 0.29, "learning_rate": 1.6556629981583503e-05, "loss": 2.3257, "step": 2937 }, { "epoch": 0.29, "learning_rate": 1.6554179402908803e-05, "loss": 2.4545, "step": 2938 }, { "epoch": 0.29, "learning_rate": 1.655172813402986e-05, "loss": 2.3962, "step": 2939 }, { "epoch": 0.29, "learning_rate": 1.6549276175204813e-05, "loss": 2.456, "step": 2940 }, { "epoch": 0.29, "learning_rate": 1.6546823526691868e-05, "loss": 2.3236, "step": 2941 }, { "epoch": 0.29, "learning_rate": 1.65443701887493e-05, "loss": 2.3914, "step": 2942 }, { "epoch": 0.29, "learning_rate": 1.654191616163547e-05, "loss": 2.4725, "step": 2943 }, { "epoch": 0.29, "learning_rate": 1.653946144560881e-05, "loss": 2.3545, "step": 2944 }, { "epoch": 0.3, "learning_rate": 1.653700604092782e-05, "loss": 2.3905, "step": 2945 }, { "epoch": 0.3, "learning_rate": 1.653454994785106e-05, "loss": 2.3304, "step": 2946 }, { "epoch": 0.3, "learning_rate": 1.653209316663719e-05, "loss": 2.4211, "step": 2947 }, { "epoch": 0.3, "learning_rate": 1.6529635697544918e-05, "loss": 2.3804, "step": 2948 }, { "epoch": 0.3, "learning_rate": 1.6527177540833038e-05, "loss": 2.3275, "step": 2949 }, { "epoch": 0.3, "learning_rate": 1.6524718696760412e-05, "loss": 2.4068, "step": 2950 }, { "epoch": 0.3, "learning_rate": 1.6522259165585973e-05, "loss": 2.4029, "step": 2951 }, { "epoch": 0.3, "learning_rate": 1.651979894756873e-05, "loss": 2.4539, "step": 2952 }, { "epoch": 0.3, "learning_rate": 1.6517338042967758e-05, "loss": 2.4104, "step": 2953 }, { "epoch": 0.3, "learning_rate": 1.6514876452042217e-05, "loss": 2.4022, "step": 2954 }, { "epoch": 0.3, "learning_rate": 1.6512414175051325e-05, "loss": 2.4128, "step": 2955 }, { "epoch": 0.3, "learning_rate": 1.6509951212254377e-05, "loss": 2.4645, "step": 2956 }, { "epoch": 0.3, "learning_rate": 1.6507487563910743e-05, "loss": 2.3758, "step": 2957 }, { "epoch": 0.3, "learning_rate": 1.650502323027987e-05, "loss": 2.3799, "step": 2958 }, { "epoch": 0.3, "learning_rate": 1.6502558211621263e-05, "loss": 2.4245, "step": 2959 }, { "epoch": 0.3, "learning_rate": 1.650009250819451e-05, "loss": 2.4035, "step": 2960 }, { "epoch": 0.3, "learning_rate": 1.6497626120259265e-05, "loss": 2.3904, "step": 2961 }, { "epoch": 0.3, "learning_rate": 1.649515904807526e-05, "loss": 2.3939, "step": 2962 }, { "epoch": 0.3, "learning_rate": 1.64926912919023e-05, "loss": 2.3716, "step": 2963 }, { "epoch": 0.3, "learning_rate": 1.649022285200025e-05, "loss": 2.4067, "step": 2964 }, { "epoch": 0.3, "learning_rate": 1.648775372862906e-05, "loss": 2.4018, "step": 2965 }, { "epoch": 0.3, "learning_rate": 1.6485283922048746e-05, "loss": 2.478, "step": 2966 }, { "epoch": 0.3, "learning_rate": 1.64828134325194e-05, "loss": 2.4558, "step": 2967 }, { "epoch": 0.3, "learning_rate": 1.648034226030118e-05, "loss": 2.4371, "step": 2968 }, { "epoch": 0.3, "learning_rate": 1.6477870405654316e-05, "loss": 2.2994, "step": 2969 }, { "epoch": 0.3, "learning_rate": 1.647539786883912e-05, "loss": 2.3937, "step": 2970 }, { "epoch": 0.3, "learning_rate": 1.6472924650115963e-05, "loss": 2.3805, "step": 2971 }, { "epoch": 0.3, "learning_rate": 1.64704507497453e-05, "loss": 2.4313, "step": 2972 }, { "epoch": 0.3, "learning_rate": 1.646797616798764e-05, "loss": 2.2525, "step": 2973 }, { "epoch": 0.3, "learning_rate": 1.6465500905103585e-05, "loss": 2.4364, "step": 2974 }, { "epoch": 0.3, "learning_rate": 1.6463024961353796e-05, "loss": 2.4768, "step": 2975 }, { "epoch": 0.3, "learning_rate": 1.6460548336999008e-05, "loss": 2.4718, "step": 2976 }, { "epoch": 0.3, "learning_rate": 1.645807103230003e-05, "loss": 2.4158, "step": 2977 }, { "epoch": 0.3, "learning_rate": 1.6455593047517738e-05, "loss": 2.3228, "step": 2978 }, { "epoch": 0.3, "learning_rate": 1.6453114382913084e-05, "loss": 2.3105, "step": 2979 }, { "epoch": 0.3, "learning_rate": 1.6450635038747086e-05, "loss": 2.3679, "step": 2980 }, { "epoch": 0.3, "learning_rate": 1.6448155015280843e-05, "loss": 2.3988, "step": 2981 }, { "epoch": 0.3, "learning_rate": 1.6445674312775518e-05, "loss": 2.3001, "step": 2982 }, { "epoch": 0.3, "learning_rate": 1.6443192931492347e-05, "loss": 2.4214, "step": 2983 }, { "epoch": 0.3, "learning_rate": 1.644071087169264e-05, "loss": 2.3984, "step": 2984 }, { "epoch": 0.3, "learning_rate": 1.6438228133637775e-05, "loss": 2.3278, "step": 2985 }, { "epoch": 0.3, "learning_rate": 1.6435744717589202e-05, "loss": 2.4002, "step": 2986 }, { "epoch": 0.3, "learning_rate": 1.6433260623808444e-05, "loss": 2.4414, "step": 2987 }, { "epoch": 0.3, "learning_rate": 1.6430775852557096e-05, "loss": 2.4793, "step": 2988 }, { "epoch": 0.3, "learning_rate": 1.642829040409682e-05, "loss": 2.3651, "step": 2989 }, { "epoch": 0.3, "learning_rate": 1.6425804278689356e-05, "loss": 2.4623, "step": 2990 }, { "epoch": 0.3, "learning_rate": 1.642331747659651e-05, "loss": 2.3399, "step": 2991 }, { "epoch": 0.3, "learning_rate": 1.642082999808016e-05, "loss": 2.3988, "step": 2992 }, { "epoch": 0.3, "learning_rate": 1.641834184340226e-05, "loss": 2.4176, "step": 2993 }, { "epoch": 0.3, "learning_rate": 1.641585301282483e-05, "loss": 2.4072, "step": 2994 }, { "epoch": 0.3, "learning_rate": 1.6413363506609955e-05, "loss": 2.4638, "step": 2995 }, { "epoch": 0.3, "learning_rate": 1.6410873325019808e-05, "loss": 2.3989, "step": 2996 }, { "epoch": 0.3, "learning_rate": 1.640838246831662e-05, "loss": 2.3954, "step": 2997 }, { "epoch": 0.3, "learning_rate": 1.64058909367627e-05, "loss": 2.3667, "step": 2998 }, { "epoch": 0.3, "learning_rate": 1.640339873062042e-05, "loss": 2.344, "step": 2999 }, { "epoch": 0.3, "learning_rate": 1.6400905850152225e-05, "loss": 2.4356, "step": 3000 }, { "epoch": 0.3, "learning_rate": 1.6398412295620646e-05, "loss": 2.4421, "step": 3001 }, { "epoch": 0.3, "learning_rate": 1.6395918067288266e-05, "loss": 2.3933, "step": 3002 }, { "epoch": 0.3, "learning_rate": 1.6393423165417746e-05, "loss": 2.3873, "step": 3003 }, { "epoch": 0.3, "learning_rate": 1.639092759027182e-05, "loss": 2.4264, "step": 3004 }, { "epoch": 0.3, "learning_rate": 1.6388431342113286e-05, "loss": 2.3539, "step": 3005 }, { "epoch": 0.3, "learning_rate": 1.6385934421205017e-05, "loss": 2.4429, "step": 3006 }, { "epoch": 0.3, "learning_rate": 1.6383436827809966e-05, "loss": 2.4236, "step": 3007 }, { "epoch": 0.3, "learning_rate": 1.6380938562191144e-05, "loss": 2.3227, "step": 3008 }, { "epoch": 0.3, "learning_rate": 1.6378439624611635e-05, "loss": 2.3669, "step": 3009 }, { "epoch": 0.3, "learning_rate": 1.6375940015334596e-05, "loss": 2.4202, "step": 3010 }, { "epoch": 0.3, "learning_rate": 1.637343973462326e-05, "loss": 2.3336, "step": 3011 }, { "epoch": 0.3, "learning_rate": 1.637093878274092e-05, "loss": 2.4663, "step": 3012 }, { "epoch": 0.3, "learning_rate": 1.6368437159950942e-05, "loss": 2.338, "step": 3013 }, { "epoch": 0.3, "learning_rate": 1.6365934866516773e-05, "loss": 2.3953, "step": 3014 }, { "epoch": 0.3, "learning_rate": 1.6363431902701922e-05, "loss": 2.36, "step": 3015 }, { "epoch": 0.3, "learning_rate": 1.6360928268769966e-05, "loss": 2.3802, "step": 3016 }, { "epoch": 0.3, "learning_rate": 1.635842396498456e-05, "loss": 2.3883, "step": 3017 }, { "epoch": 0.3, "learning_rate": 1.6355918991609423e-05, "loss": 2.4567, "step": 3018 }, { "epoch": 0.3, "learning_rate": 1.6353413348908352e-05, "loss": 2.3875, "step": 3019 }, { "epoch": 0.3, "learning_rate": 1.6350907037145202e-05, "loss": 2.4219, "step": 3020 }, { "epoch": 0.3, "learning_rate": 1.6348400056583916e-05, "loss": 2.2927, "step": 3021 }, { "epoch": 0.3, "learning_rate": 1.634589240748849e-05, "loss": 2.3579, "step": 3022 }, { "epoch": 0.3, "learning_rate": 1.6343384090123e-05, "loss": 2.4456, "step": 3023 }, { "epoch": 0.3, "learning_rate": 1.6340875104751595e-05, "loss": 2.2908, "step": 3024 }, { "epoch": 0.3, "learning_rate": 1.633836545163849e-05, "loss": 2.3997, "step": 3025 }, { "epoch": 0.3, "learning_rate": 1.633585513104796e-05, "loss": 2.455, "step": 3026 }, { "epoch": 0.3, "learning_rate": 1.6333344143244373e-05, "loss": 2.4051, "step": 3027 }, { "epoch": 0.3, "learning_rate": 1.6330832488492148e-05, "loss": 2.4848, "step": 3028 }, { "epoch": 0.3, "learning_rate": 1.6328320167055784e-05, "loss": 2.4064, "step": 3029 }, { "epoch": 0.3, "learning_rate": 1.632580717919985e-05, "loss": 2.3639, "step": 3030 }, { "epoch": 0.3, "learning_rate": 1.6323293525188973e-05, "loss": 2.3162, "step": 3031 }, { "epoch": 0.3, "learning_rate": 1.6320779205287865e-05, "loss": 2.4159, "step": 3032 }, { "epoch": 0.3, "learning_rate": 1.6318264219761303e-05, "loss": 2.3489, "step": 3033 }, { "epoch": 0.3, "learning_rate": 1.6315748568874136e-05, "loss": 2.4075, "step": 3034 }, { "epoch": 0.3, "learning_rate": 1.631323225289128e-05, "loss": 2.3872, "step": 3035 }, { "epoch": 0.3, "learning_rate": 1.6310715272077717e-05, "loss": 2.4171, "step": 3036 }, { "epoch": 0.3, "learning_rate": 1.630819762669851e-05, "loss": 2.4101, "step": 3037 }, { "epoch": 0.3, "learning_rate": 1.6305679317018785e-05, "loss": 2.3219, "step": 3038 }, { "epoch": 0.3, "learning_rate": 1.6303160343303735e-05, "loss": 2.5016, "step": 3039 }, { "epoch": 0.3, "learning_rate": 1.630064070581863e-05, "loss": 2.463, "step": 3040 }, { "epoch": 0.3, "learning_rate": 1.6298120404828806e-05, "loss": 2.4117, "step": 3041 }, { "epoch": 0.3, "learning_rate": 1.629559944059967e-05, "loss": 2.4166, "step": 3042 }, { "epoch": 0.3, "learning_rate": 1.62930778133967e-05, "loss": 2.3999, "step": 3043 }, { "epoch": 0.3, "learning_rate": 1.6290555523485436e-05, "loss": 2.3908, "step": 3044 }, { "epoch": 0.31, "learning_rate": 1.62880325711315e-05, "loss": 2.3322, "step": 3045 }, { "epoch": 0.31, "learning_rate": 1.6285508956600576e-05, "loss": 2.3993, "step": 3046 }, { "epoch": 0.31, "learning_rate": 1.6282984680158423e-05, "loss": 2.4144, "step": 3047 }, { "epoch": 0.31, "learning_rate": 1.628045974207086e-05, "loss": 2.3286, "step": 3048 }, { "epoch": 0.31, "learning_rate": 1.6277934142603785e-05, "loss": 2.3725, "step": 3049 }, { "epoch": 0.31, "learning_rate": 1.6275407882023163e-05, "loss": 2.3783, "step": 3050 }, { "epoch": 0.31, "learning_rate": 1.6272880960595027e-05, "loss": 2.449, "step": 3051 }, { "epoch": 0.31, "learning_rate": 1.627035337858548e-05, "loss": 2.3648, "step": 3052 }, { "epoch": 0.31, "learning_rate": 1.6267825136260698e-05, "loss": 2.447, "step": 3053 }, { "epoch": 0.31, "learning_rate": 1.626529623388692e-05, "loss": 2.449, "step": 3054 }, { "epoch": 0.31, "learning_rate": 1.6262766671730466e-05, "loss": 2.347, "step": 3055 }, { "epoch": 0.31, "learning_rate": 1.626023645005771e-05, "loss": 2.4224, "step": 3056 }, { "epoch": 0.31, "learning_rate": 1.6257705569135107e-05, "loss": 2.3801, "step": 3057 }, { "epoch": 0.31, "learning_rate": 1.6255174029229178e-05, "loss": 2.4066, "step": 3058 }, { "epoch": 0.31, "learning_rate": 1.6252641830606508e-05, "loss": 2.3807, "step": 3059 }, { "epoch": 0.31, "learning_rate": 1.6250108973533764e-05, "loss": 2.4613, "step": 3060 }, { "epoch": 0.31, "learning_rate": 1.6247575458277674e-05, "loss": 2.4715, "step": 3061 }, { "epoch": 0.31, "learning_rate": 1.624504128510503e-05, "loss": 2.3624, "step": 3062 }, { "epoch": 0.31, "learning_rate": 1.62425064542827e-05, "loss": 2.4836, "step": 3063 }, { "epoch": 0.31, "learning_rate": 1.623997096607763e-05, "loss": 2.2886, "step": 3064 }, { "epoch": 0.31, "learning_rate": 1.6237434820756814e-05, "loss": 2.3062, "step": 3065 }, { "epoch": 0.31, "learning_rate": 1.6234898018587336e-05, "loss": 2.4025, "step": 3066 }, { "epoch": 0.31, "learning_rate": 1.6232360559836338e-05, "loss": 2.3349, "step": 3067 }, { "epoch": 0.31, "learning_rate": 1.622982244477103e-05, "loss": 2.3359, "step": 3068 }, { "epoch": 0.31, "learning_rate": 1.62272836736587e-05, "loss": 2.3378, "step": 3069 }, { "epoch": 0.31, "learning_rate": 1.6224744246766692e-05, "loss": 2.3462, "step": 3070 }, { "epoch": 0.31, "learning_rate": 1.6222204164362433e-05, "loss": 2.3401, "step": 3071 }, { "epoch": 0.31, "learning_rate": 1.6219663426713412e-05, "loss": 2.4226, "step": 3072 }, { "epoch": 0.31, "learning_rate": 1.621712203408719e-05, "loss": 2.469, "step": 3073 }, { "epoch": 0.31, "learning_rate": 1.6214579986751386e-05, "loss": 2.395, "step": 3074 }, { "epoch": 0.31, "learning_rate": 1.6212037284973706e-05, "loss": 2.3161, "step": 3075 }, { "epoch": 0.31, "learning_rate": 1.620949392902191e-05, "loss": 2.434, "step": 3076 }, { "epoch": 0.31, "learning_rate": 1.6206949919163833e-05, "loss": 2.3807, "step": 3077 }, { "epoch": 0.31, "learning_rate": 1.6204405255667382e-05, "loss": 2.322, "step": 3078 }, { "epoch": 0.31, "learning_rate": 1.6201859938800527e-05, "loss": 2.3393, "step": 3079 }, { "epoch": 0.31, "learning_rate": 1.6199313968831306e-05, "loss": 2.4721, "step": 3080 }, { "epoch": 0.31, "learning_rate": 1.6196767346027833e-05, "loss": 2.3776, "step": 3081 }, { "epoch": 0.31, "learning_rate": 1.6194220070658285e-05, "loss": 2.3514, "step": 3082 }, { "epoch": 0.31, "learning_rate": 1.6191672142990908e-05, "loss": 2.4844, "step": 3083 }, { "epoch": 0.31, "learning_rate": 1.618912356329402e-05, "loss": 2.3487, "step": 3084 }, { "epoch": 0.31, "learning_rate": 1.6186574331836e-05, "loss": 2.3485, "step": 3085 }, { "epoch": 0.31, "learning_rate": 1.6184024448885312e-05, "loss": 2.4856, "step": 3086 }, { "epoch": 0.31, "learning_rate": 1.6181473914710467e-05, "loss": 2.3695, "step": 3087 }, { "epoch": 0.31, "learning_rate": 1.6178922729580064e-05, "loss": 2.3737, "step": 3088 }, { "epoch": 0.31, "learning_rate": 1.6176370893762757e-05, "loss": 2.3465, "step": 3089 }, { "epoch": 0.31, "learning_rate": 1.617381840752727e-05, "loss": 2.3835, "step": 3090 }, { "epoch": 0.31, "learning_rate": 1.6171265271142405e-05, "loss": 2.425, "step": 3091 }, { "epoch": 0.31, "learning_rate": 1.6168711484877028e-05, "loss": 2.4284, "step": 3092 }, { "epoch": 0.31, "learning_rate": 1.6166157049000067e-05, "loss": 2.43, "step": 3093 }, { "epoch": 0.31, "learning_rate": 1.6163601963780523e-05, "loss": 2.4626, "step": 3094 }, { "epoch": 0.31, "learning_rate": 1.6161046229487466e-05, "loss": 2.3212, "step": 3095 }, { "epoch": 0.31, "learning_rate": 1.615848984639004e-05, "loss": 2.4183, "step": 3096 }, { "epoch": 0.31, "learning_rate": 1.615593281475744e-05, "loss": 2.3793, "step": 3097 }, { "epoch": 0.31, "learning_rate": 1.6153375134858957e-05, "loss": 2.3209, "step": 3098 }, { "epoch": 0.31, "learning_rate": 1.6150816806963913e-05, "loss": 2.4456, "step": 3099 }, { "epoch": 0.31, "learning_rate": 1.6148257831341738e-05, "loss": 2.3412, "step": 3100 }, { "epoch": 0.31, "learning_rate": 1.61456982082619e-05, "loss": 2.4846, "step": 3101 }, { "epoch": 0.31, "learning_rate": 1.614313793799395e-05, "loss": 2.3521, "step": 3102 }, { "epoch": 0.31, "learning_rate": 1.6140577020807503e-05, "loss": 2.3772, "step": 3103 }, { "epoch": 0.31, "learning_rate": 1.6138015456972247e-05, "loss": 2.4242, "step": 3104 }, { "epoch": 0.31, "learning_rate": 1.613545324675793e-05, "loss": 2.3769, "step": 3105 }, { "epoch": 0.31, "learning_rate": 1.613289039043437e-05, "loss": 2.3459, "step": 3106 }, { "epoch": 0.31, "learning_rate": 1.6130326888271456e-05, "loss": 2.3487, "step": 3107 }, { "epoch": 0.31, "learning_rate": 1.612776274053915e-05, "loss": 2.4013, "step": 3108 }, { "epoch": 0.31, "learning_rate": 1.6125197947507468e-05, "loss": 2.3863, "step": 3109 }, { "epoch": 0.31, "learning_rate": 1.6122632509446504e-05, "loss": 2.4422, "step": 3110 }, { "epoch": 0.31, "learning_rate": 1.6120066426626425e-05, "loss": 2.3829, "step": 3111 }, { "epoch": 0.31, "learning_rate": 1.6117499699317445e-05, "loss": 2.4762, "step": 3112 }, { "epoch": 0.31, "learning_rate": 1.6114932327789873e-05, "loss": 2.4808, "step": 3113 }, { "epoch": 0.31, "learning_rate": 1.6112364312314065e-05, "loss": 2.3611, "step": 3114 }, { "epoch": 0.31, "learning_rate": 1.6109795653160457e-05, "loss": 2.388, "step": 3115 }, { "epoch": 0.31, "learning_rate": 1.6107226350599542e-05, "loss": 2.4605, "step": 3116 }, { "epoch": 0.31, "learning_rate": 1.610465640490189e-05, "loss": 2.4851, "step": 3117 }, { "epoch": 0.31, "learning_rate": 1.6102085816338135e-05, "loss": 2.4317, "step": 3118 }, { "epoch": 0.31, "learning_rate": 1.6099514585178982e-05, "loss": 2.3608, "step": 3119 }, { "epoch": 0.31, "learning_rate": 1.6096942711695202e-05, "loss": 2.3976, "step": 3120 }, { "epoch": 0.31, "learning_rate": 1.6094370196157622e-05, "loss": 2.4308, "step": 3121 }, { "epoch": 0.31, "learning_rate": 1.609179703883716e-05, "loss": 2.3873, "step": 3122 }, { "epoch": 0.31, "learning_rate": 1.6089223240004785e-05, "loss": 2.3968, "step": 3123 }, { "epoch": 0.31, "learning_rate": 1.6086648799931533e-05, "loss": 2.3847, "step": 3124 }, { "epoch": 0.31, "learning_rate": 1.6084073718888514e-05, "loss": 2.3894, "step": 3125 }, { "epoch": 0.31, "learning_rate": 1.60814979971469e-05, "loss": 2.3731, "step": 3126 }, { "epoch": 0.31, "learning_rate": 1.6078921634977948e-05, "loss": 2.4046, "step": 3127 }, { "epoch": 0.31, "learning_rate": 1.6076344632652948e-05, "loss": 2.3489, "step": 3128 }, { "epoch": 0.31, "learning_rate": 1.6073766990443295e-05, "loss": 2.3656, "step": 3129 }, { "epoch": 0.31, "learning_rate": 1.607118870862042e-05, "loss": 2.416, "step": 3130 }, { "epoch": 0.31, "learning_rate": 1.606860978745585e-05, "loss": 2.466, "step": 3131 }, { "epoch": 0.31, "learning_rate": 1.6066030227221152e-05, "loss": 2.4821, "step": 3132 }, { "epoch": 0.31, "learning_rate": 1.606345002818798e-05, "loss": 2.4127, "step": 3133 }, { "epoch": 0.31, "learning_rate": 1.606086919062804e-05, "loss": 2.4313, "step": 3134 }, { "epoch": 0.31, "learning_rate": 1.6058287714813126e-05, "loss": 2.3792, "step": 3135 }, { "epoch": 0.31, "learning_rate": 1.605570560101508e-05, "loss": 2.3468, "step": 3136 }, { "epoch": 0.31, "learning_rate": 1.6053122849505817e-05, "loss": 2.3829, "step": 3137 }, { "epoch": 0.31, "learning_rate": 1.6050539460557324e-05, "loss": 2.397, "step": 3138 }, { "epoch": 0.31, "learning_rate": 1.6047955434441647e-05, "loss": 2.3552, "step": 3139 }, { "epoch": 0.31, "learning_rate": 1.6045370771430905e-05, "loss": 2.3075, "step": 3140 }, { "epoch": 0.31, "learning_rate": 1.604278547179728e-05, "loss": 2.3552, "step": 3141 }, { "epoch": 0.31, "learning_rate": 1.604019953581303e-05, "loss": 2.3051, "step": 3142 }, { "epoch": 0.31, "learning_rate": 1.603761296375047e-05, "loss": 2.3575, "step": 3143 }, { "epoch": 0.31, "learning_rate": 1.603502575588198e-05, "loss": 2.4193, "step": 3144 }, { "epoch": 0.32, "learning_rate": 1.6032437912480022e-05, "loss": 2.3955, "step": 3145 }, { "epoch": 0.32, "learning_rate": 1.602984943381711e-05, "loss": 2.4063, "step": 3146 }, { "epoch": 0.32, "learning_rate": 1.602726032016583e-05, "loss": 2.4117, "step": 3147 }, { "epoch": 0.32, "learning_rate": 1.6024670571798834e-05, "loss": 2.3565, "step": 3148 }, { "epoch": 0.32, "learning_rate": 1.6022080188988845e-05, "loss": 2.4719, "step": 3149 }, { "epoch": 0.32, "learning_rate": 1.601948917200865e-05, "loss": 2.367, "step": 3150 }, { "epoch": 0.32, "learning_rate": 1.60168975211311e-05, "loss": 2.3529, "step": 3151 }, { "epoch": 0.32, "learning_rate": 1.6014305236629117e-05, "loss": 2.2694, "step": 3152 }, { "epoch": 0.32, "learning_rate": 1.6011712318775687e-05, "loss": 2.4514, "step": 3153 }, { "epoch": 0.32, "learning_rate": 1.6009118767843862e-05, "loss": 2.3935, "step": 3154 }, { "epoch": 0.32, "learning_rate": 1.6006524584106767e-05, "loss": 2.3315, "step": 3155 }, { "epoch": 0.32, "learning_rate": 1.6003929767837586e-05, "loss": 2.4789, "step": 3156 }, { "epoch": 0.32, "learning_rate": 1.6001334319309573e-05, "loss": 2.4955, "step": 3157 }, { "epoch": 0.32, "learning_rate": 1.5998738238796047e-05, "loss": 2.4076, "step": 3158 }, { "epoch": 0.32, "learning_rate": 1.5996141526570398e-05, "loss": 2.4612, "step": 3159 }, { "epoch": 0.32, "learning_rate": 1.5993544182906074e-05, "loss": 2.4277, "step": 3160 }, { "epoch": 0.32, "learning_rate": 1.59909462080766e-05, "loss": 2.3779, "step": 3161 }, { "epoch": 0.32, "learning_rate": 1.5988347602355564e-05, "loss": 2.4559, "step": 3162 }, { "epoch": 0.32, "learning_rate": 1.598574836601661e-05, "loss": 2.4747, "step": 3163 }, { "epoch": 0.32, "learning_rate": 1.5983148499333462e-05, "loss": 2.3752, "step": 3164 }, { "epoch": 0.32, "learning_rate": 1.598054800257991e-05, "loss": 2.2741, "step": 3165 }, { "epoch": 0.32, "learning_rate": 1.5977946876029796e-05, "loss": 2.3899, "step": 3166 }, { "epoch": 0.32, "learning_rate": 1.5975345119957046e-05, "loss": 2.4539, "step": 3167 }, { "epoch": 0.32, "learning_rate": 1.597274273463564e-05, "loss": 2.374, "step": 3168 }, { "epoch": 0.32, "learning_rate": 1.5970139720339632e-05, "loss": 2.4118, "step": 3169 }, { "epoch": 0.32, "learning_rate": 1.596753607734314e-05, "loss": 2.3347, "step": 3170 }, { "epoch": 0.32, "learning_rate": 1.596493180592034e-05, "loss": 2.4125, "step": 3171 }, { "epoch": 0.32, "learning_rate": 1.5962326906345487e-05, "loss": 2.3991, "step": 3172 }, { "epoch": 0.32, "learning_rate": 1.5959721378892897e-05, "loss": 2.3535, "step": 3173 }, { "epoch": 0.32, "learning_rate": 1.5957115223836948e-05, "loss": 2.3903, "step": 3174 }, { "epoch": 0.32, "learning_rate": 1.595450844145209e-05, "loss": 2.3353, "step": 3175 }, { "epoch": 0.32, "learning_rate": 1.5951901032012836e-05, "loss": 2.3457, "step": 3176 }, { "epoch": 0.32, "learning_rate": 1.5949292995793767e-05, "loss": 2.4783, "step": 3177 }, { "epoch": 0.32, "learning_rate": 1.594668433306953e-05, "loss": 2.4536, "step": 3178 }, { "epoch": 0.32, "learning_rate": 1.594407504411483e-05, "loss": 2.3823, "step": 3179 }, { "epoch": 0.32, "learning_rate": 1.594146512920445e-05, "loss": 2.4511, "step": 3180 }, { "epoch": 0.32, "learning_rate": 1.5938854588613236e-05, "loss": 2.4637, "step": 3181 }, { "epoch": 0.32, "learning_rate": 1.5936243422616097e-05, "loss": 2.3639, "step": 3182 }, { "epoch": 0.32, "learning_rate": 1.5933631631488e-05, "loss": 2.4033, "step": 3183 }, { "epoch": 0.32, "learning_rate": 1.5931019215503992e-05, "loss": 2.4138, "step": 3184 }, { "epoch": 0.32, "learning_rate": 1.5928406174939183e-05, "loss": 2.4079, "step": 3185 }, { "epoch": 0.32, "learning_rate": 1.5925792510068744e-05, "loss": 2.2866, "step": 3186 }, { "epoch": 0.32, "learning_rate": 1.592317822116791e-05, "loss": 2.3695, "step": 3187 }, { "epoch": 0.32, "learning_rate": 1.5920563308511985e-05, "loss": 2.4246, "step": 3188 }, { "epoch": 0.32, "learning_rate": 1.5917947772376345e-05, "loss": 2.4244, "step": 3189 }, { "epoch": 0.32, "learning_rate": 1.591533161303642e-05, "loss": 2.3725, "step": 3190 }, { "epoch": 0.32, "learning_rate": 1.5912714830767715e-05, "loss": 2.4566, "step": 3191 }, { "epoch": 0.32, "learning_rate": 1.5910097425845794e-05, "loss": 2.3717, "step": 3192 }, { "epoch": 0.32, "learning_rate": 1.5907479398546287e-05, "loss": 2.445, "step": 3193 }, { "epoch": 0.32, "learning_rate": 1.5904860749144902e-05, "loss": 2.4421, "step": 3194 }, { "epoch": 0.32, "learning_rate": 1.5902241477917392e-05, "loss": 2.433, "step": 3195 }, { "epoch": 0.32, "learning_rate": 1.589962158513959e-05, "loss": 2.3465, "step": 3196 }, { "epoch": 0.32, "learning_rate": 1.589700107108739e-05, "loss": 2.4649, "step": 3197 }, { "epoch": 0.32, "learning_rate": 1.589437993603675e-05, "loss": 2.404, "step": 3198 }, { "epoch": 0.32, "learning_rate": 1.58917581802637e-05, "loss": 2.3987, "step": 3199 }, { "epoch": 0.32, "learning_rate": 1.5889135804044327e-05, "loss": 2.4443, "step": 3200 }, { "epoch": 0.32, "learning_rate": 1.5886512807654786e-05, "loss": 2.3032, "step": 3201 }, { "epoch": 0.32, "learning_rate": 1.5883889191371298e-05, "loss": 2.4635, "step": 3202 }, { "epoch": 0.32, "learning_rate": 1.5881264955470154e-05, "loss": 2.4281, "step": 3203 }, { "epoch": 0.32, "learning_rate": 1.58786401002277e-05, "loss": 2.3481, "step": 3204 }, { "epoch": 0.32, "learning_rate": 1.5876014625920356e-05, "loss": 2.463, "step": 3205 }, { "epoch": 0.32, "learning_rate": 1.587338853282461e-05, "loss": 2.3719, "step": 3206 }, { "epoch": 0.32, "learning_rate": 1.5870761821216993e-05, "loss": 2.4371, "step": 3207 }, { "epoch": 0.32, "learning_rate": 1.5868134491374134e-05, "loss": 2.3681, "step": 3208 }, { "epoch": 0.32, "learning_rate": 1.5865506543572703e-05, "loss": 2.3491, "step": 3209 }, { "epoch": 0.32, "learning_rate": 1.5862877978089443e-05, "loss": 2.3999, "step": 3210 }, { "epoch": 0.32, "learning_rate": 1.586024879520116e-05, "loss": 2.3086, "step": 3211 }, { "epoch": 0.32, "learning_rate": 1.5857618995184734e-05, "loss": 2.4138, "step": 3212 }, { "epoch": 0.32, "learning_rate": 1.5854988578317095e-05, "loss": 2.4379, "step": 3213 }, { "epoch": 0.32, "learning_rate": 1.585235754487525e-05, "loss": 2.4436, "step": 3214 }, { "epoch": 0.32, "learning_rate": 1.584972589513626e-05, "loss": 2.4413, "step": 3215 }, { "epoch": 0.32, "learning_rate": 1.5847093629377268e-05, "loss": 2.2962, "step": 3216 }, { "epoch": 0.32, "learning_rate": 1.5844460747875463e-05, "loss": 2.5257, "step": 3217 }, { "epoch": 0.32, "learning_rate": 1.5841827250908112e-05, "loss": 2.4222, "step": 3218 }, { "epoch": 0.32, "learning_rate": 1.5839193138752538e-05, "loss": 2.3712, "step": 3219 }, { "epoch": 0.32, "learning_rate": 1.5836558411686132e-05, "loss": 2.4459, "step": 3220 }, { "epoch": 0.32, "learning_rate": 1.5833923069986355e-05, "loss": 2.4165, "step": 3221 }, { "epoch": 0.32, "learning_rate": 1.583128711393073e-05, "loss": 2.3676, "step": 3222 }, { "epoch": 0.32, "learning_rate": 1.5828650543796836e-05, "loss": 2.3023, "step": 3223 }, { "epoch": 0.32, "learning_rate": 1.5826013359862323e-05, "loss": 2.3647, "step": 3224 }, { "epoch": 0.32, "learning_rate": 1.5823375562404913e-05, "loss": 2.3753, "step": 3225 }, { "epoch": 0.32, "learning_rate": 1.5820737151702385e-05, "loss": 2.3147, "step": 3226 }, { "epoch": 0.32, "learning_rate": 1.5818098128032582e-05, "loss": 2.4229, "step": 3227 }, { "epoch": 0.32, "learning_rate": 1.5815458491673413e-05, "loss": 2.4835, "step": 3228 }, { "epoch": 0.32, "learning_rate": 1.5812818242902847e-05, "loss": 2.3763, "step": 3229 }, { "epoch": 0.32, "learning_rate": 1.5810177381998927e-05, "loss": 2.3571, "step": 3230 }, { "epoch": 0.32, "learning_rate": 1.580753590923975e-05, "loss": 2.3232, "step": 3231 }, { "epoch": 0.32, "learning_rate": 1.58048938249035e-05, "loss": 2.45, "step": 3232 }, { "epoch": 0.32, "learning_rate": 1.5802251129268384e-05, "loss": 2.3906, "step": 3233 }, { "epoch": 0.32, "learning_rate": 1.5799607822612712e-05, "loss": 2.3039, "step": 3234 }, { "epoch": 0.32, "learning_rate": 1.579696390521484e-05, "loss": 2.4007, "step": 3235 }, { "epoch": 0.32, "learning_rate": 1.57943193773532e-05, "loss": 2.3819, "step": 3236 }, { "epoch": 0.32, "learning_rate": 1.5791674239306268e-05, "loss": 2.3283, "step": 3237 }, { "epoch": 0.32, "learning_rate": 1.5789028491352602e-05, "loss": 2.4335, "step": 3238 }, { "epoch": 0.32, "learning_rate": 1.5786382133770825e-05, "loss": 2.3884, "step": 3239 }, { "epoch": 0.32, "learning_rate": 1.578373516683961e-05, "loss": 2.4655, "step": 3240 }, { "epoch": 0.32, "learning_rate": 1.578108759083771e-05, "loss": 2.4822, "step": 3241 }, { "epoch": 0.32, "learning_rate": 1.5778439406043923e-05, "loss": 2.2683, "step": 3242 }, { "epoch": 0.32, "learning_rate": 1.5775790612737134e-05, "loss": 2.3933, "step": 3243 }, { "epoch": 0.33, "learning_rate": 1.577314121119628e-05, "loss": 2.4585, "step": 3244 }, { "epoch": 0.33, "learning_rate": 1.5770491201700357e-05, "loss": 2.3383, "step": 3245 }, { "epoch": 0.33, "learning_rate": 1.5767840584528436e-05, "loss": 2.3447, "step": 3246 }, { "epoch": 0.33, "learning_rate": 1.576518935995964e-05, "loss": 2.4064, "step": 3247 }, { "epoch": 0.33, "learning_rate": 1.5762537528273173e-05, "loss": 2.3304, "step": 3248 }, { "epoch": 0.33, "learning_rate": 1.5759885089748284e-05, "loss": 2.415, "step": 3249 }, { "epoch": 0.33, "learning_rate": 1.5757232044664298e-05, "loss": 2.4767, "step": 3250 }, { "epoch": 0.33, "learning_rate": 1.57545783933006e-05, "loss": 2.3906, "step": 3251 }, { "epoch": 0.33, "learning_rate": 1.575192413593664e-05, "loss": 2.2869, "step": 3252 }, { "epoch": 0.33, "learning_rate": 1.5749269272851932e-05, "loss": 2.4561, "step": 3253 }, { "epoch": 0.33, "learning_rate": 1.5746613804326052e-05, "loss": 2.3823, "step": 3254 }, { "epoch": 0.33, "learning_rate": 1.5743957730638643e-05, "loss": 2.337, "step": 3255 }, { "epoch": 0.33, "learning_rate": 1.5741301052069403e-05, "loss": 2.3641, "step": 3256 }, { "epoch": 0.33, "learning_rate": 1.5738643768898108e-05, "loss": 2.4242, "step": 3257 }, { "epoch": 0.33, "learning_rate": 1.5735985881404584e-05, "loss": 2.3936, "step": 3258 }, { "epoch": 0.33, "learning_rate": 1.5733327389868728e-05, "loss": 2.42, "step": 3259 }, { "epoch": 0.33, "learning_rate": 1.57306682945705e-05, "loss": 2.5221, "step": 3260 }, { "epoch": 0.33, "learning_rate": 1.5728008595789925e-05, "loss": 2.4259, "step": 3261 }, { "epoch": 0.33, "learning_rate": 1.5725348293807084e-05, "loss": 2.4094, "step": 3262 }, { "epoch": 0.33, "learning_rate": 1.5722687388902132e-05, "loss": 2.415, "step": 3263 }, { "epoch": 0.33, "learning_rate": 1.5720025881355278e-05, "loss": 2.4715, "step": 3264 }, { "epoch": 0.33, "learning_rate": 1.5717363771446802e-05, "loss": 2.4341, "step": 3265 }, { "epoch": 0.33, "learning_rate": 1.5714701059457044e-05, "loss": 2.4146, "step": 3266 }, { "epoch": 0.33, "learning_rate": 1.5712037745666403e-05, "loss": 2.4049, "step": 3267 }, { "epoch": 0.33, "learning_rate": 1.570937383035535e-05, "loss": 2.4625, "step": 3268 }, { "epoch": 0.33, "learning_rate": 1.570670931380441e-05, "loss": 2.3907, "step": 3269 }, { "epoch": 0.33, "learning_rate": 1.5704044196294188e-05, "loss": 2.3696, "step": 3270 }, { "epoch": 0.33, "learning_rate": 1.570137847810533e-05, "loss": 2.3661, "step": 3271 }, { "epoch": 0.33, "learning_rate": 1.569871215951856e-05, "loss": 2.4208, "step": 3272 }, { "epoch": 0.33, "learning_rate": 1.5696045240814662e-05, "loss": 2.4477, "step": 3273 }, { "epoch": 0.33, "learning_rate": 1.5693377722274483e-05, "loss": 2.3604, "step": 3274 }, { "epoch": 0.33, "learning_rate": 1.5690709604178928e-05, "loss": 2.4456, "step": 3275 }, { "epoch": 0.33, "learning_rate": 1.5688040886808976e-05, "loss": 2.4511, "step": 3276 }, { "epoch": 0.33, "learning_rate": 1.568537157044566e-05, "loss": 2.287, "step": 3277 }, { "epoch": 0.33, "learning_rate": 1.5682701655370077e-05, "loss": 2.3075, "step": 3278 }, { "epoch": 0.33, "learning_rate": 1.5680031141863396e-05, "loss": 2.3938, "step": 3279 }, { "epoch": 0.33, "learning_rate": 1.5677360030206835e-05, "loss": 2.3978, "step": 3280 }, { "epoch": 0.33, "learning_rate": 1.5674688320681685e-05, "loss": 2.3998, "step": 3281 }, { "epoch": 0.33, "learning_rate": 1.5672016013569297e-05, "loss": 2.4213, "step": 3282 }, { "epoch": 0.33, "learning_rate": 1.566934310915108e-05, "loss": 2.3899, "step": 3283 }, { "epoch": 0.33, "learning_rate": 1.566666960770852e-05, "loss": 2.3148, "step": 3284 }, { "epoch": 0.33, "learning_rate": 1.566399550952315e-05, "loss": 2.4684, "step": 3285 }, { "epoch": 0.33, "learning_rate": 1.5661320814876578e-05, "loss": 2.3789, "step": 3286 }, { "epoch": 0.33, "learning_rate": 1.5658645524050464e-05, "loss": 2.3574, "step": 3287 }, { "epoch": 0.33, "learning_rate": 1.5655969637326542e-05, "loss": 2.4303, "step": 3288 }, { "epoch": 0.33, "learning_rate": 1.5653293154986594e-05, "loss": 2.502, "step": 3289 }, { "epoch": 0.33, "learning_rate": 1.565061607731248e-05, "loss": 2.3364, "step": 3290 }, { "epoch": 0.33, "learning_rate": 1.5647938404586118e-05, "loss": 2.359, "step": 3291 }, { "epoch": 0.33, "learning_rate": 1.5645260137089482e-05, "loss": 2.3546, "step": 3292 }, { "epoch": 0.33, "learning_rate": 1.5642581275104615e-05, "loss": 2.3545, "step": 3293 }, { "epoch": 0.33, "learning_rate": 1.5639901818913624e-05, "loss": 2.4289, "step": 3294 }, { "epoch": 0.33, "learning_rate": 1.5637221768798678e-05, "loss": 2.2805, "step": 3295 }, { "epoch": 0.33, "learning_rate": 1.5634541125041995e-05, "loss": 2.4197, "step": 3296 }, { "epoch": 0.33, "learning_rate": 1.5631859887925878e-05, "loss": 2.5115, "step": 3297 }, { "epoch": 0.33, "learning_rate": 1.562917805773268e-05, "loss": 2.3437, "step": 3298 }, { "epoch": 0.33, "learning_rate": 1.5626495634744813e-05, "loss": 2.3416, "step": 3299 }, { "epoch": 0.33, "learning_rate": 1.5623812619244758e-05, "loss": 2.4091, "step": 3300 }, { "epoch": 0.33, "learning_rate": 1.562112901151506e-05, "loss": 2.3459, "step": 3301 }, { "epoch": 0.33, "learning_rate": 1.5618444811838318e-05, "loss": 2.3491, "step": 3302 }, { "epoch": 0.33, "learning_rate": 1.5615760020497202e-05, "loss": 2.472, "step": 3303 }, { "epoch": 0.33, "learning_rate": 1.5613074637774444e-05, "loss": 2.4928, "step": 3304 }, { "epoch": 0.33, "learning_rate": 1.5610388663952826e-05, "loss": 2.4356, "step": 3305 }, { "epoch": 0.33, "learning_rate": 1.5607702099315204e-05, "loss": 2.2903, "step": 3306 }, { "epoch": 0.33, "learning_rate": 1.5605014944144498e-05, "loss": 2.355, "step": 3307 }, { "epoch": 0.33, "learning_rate": 1.5602327198723682e-05, "loss": 2.4137, "step": 3308 }, { "epoch": 0.33, "learning_rate": 1.5599638863335797e-05, "loss": 2.3836, "step": 3309 }, { "epoch": 0.33, "learning_rate": 1.5596949938263942e-05, "loss": 2.4653, "step": 3310 }, { "epoch": 0.33, "learning_rate": 1.5594260423791286e-05, "loss": 2.515, "step": 3311 }, { "epoch": 0.33, "learning_rate": 1.5591570320201052e-05, "loss": 2.441, "step": 3312 }, { "epoch": 0.33, "learning_rate": 1.558887962777653e-05, "loss": 2.4277, "step": 3313 }, { "epoch": 0.33, "learning_rate": 1.5586188346801063e-05, "loss": 2.4607, "step": 3314 }, { "epoch": 0.33, "learning_rate": 1.558349647755807e-05, "loss": 2.3832, "step": 3315 }, { "epoch": 0.33, "learning_rate": 1.558080402033103e-05, "loss": 2.3754, "step": 3316 }, { "epoch": 0.33, "learning_rate": 1.5578110975403467e-05, "loss": 2.4228, "step": 3317 }, { "epoch": 0.33, "learning_rate": 1.5575417343058986e-05, "loss": 2.4043, "step": 3318 }, { "epoch": 0.33, "learning_rate": 1.557272312358124e-05, "loss": 2.3848, "step": 3319 }, { "epoch": 0.33, "learning_rate": 1.5570028317253963e-05, "loss": 2.3467, "step": 3320 }, { "epoch": 0.33, "learning_rate": 1.5567332924360926e-05, "loss": 2.3737, "step": 3321 }, { "epoch": 0.33, "learning_rate": 1.5564636945185982e-05, "loss": 2.3799, "step": 3322 }, { "epoch": 0.33, "learning_rate": 1.556194038001303e-05, "loss": 2.3688, "step": 3323 }, { "epoch": 0.33, "learning_rate": 1.5559243229126047e-05, "loss": 2.2918, "step": 3324 }, { "epoch": 0.33, "learning_rate": 1.5556545492809063e-05, "loss": 2.4765, "step": 3325 }, { "epoch": 0.33, "learning_rate": 1.5553847171346165e-05, "loss": 2.3484, "step": 3326 }, { "epoch": 0.33, "learning_rate": 1.55511482650215e-05, "loss": 2.4394, "step": 3327 }, { "epoch": 0.33, "learning_rate": 1.55484487741193e-05, "loss": 2.3623, "step": 3328 }, { "epoch": 0.33, "learning_rate": 1.554574869892383e-05, "loss": 2.3872, "step": 3329 }, { "epoch": 0.33, "learning_rate": 1.554304803971943e-05, "loss": 2.2664, "step": 3330 }, { "epoch": 0.33, "learning_rate": 1.5540346796790497e-05, "loss": 2.3528, "step": 3331 }, { "epoch": 0.33, "learning_rate": 1.5537644970421503e-05, "loss": 2.3554, "step": 3332 }, { "epoch": 0.33, "learning_rate": 1.5534942560896958e-05, "loss": 2.3307, "step": 3333 }, { "epoch": 0.33, "learning_rate": 1.5532239568501453e-05, "loss": 2.3612, "step": 3334 }, { "epoch": 0.33, "learning_rate": 1.552953599351963e-05, "loss": 2.3981, "step": 3335 }, { "epoch": 0.33, "learning_rate": 1.5526831836236198e-05, "loss": 2.4052, "step": 3336 }, { "epoch": 0.33, "learning_rate": 1.5524127096935928e-05, "loss": 2.4052, "step": 3337 }, { "epoch": 0.33, "learning_rate": 1.552142177590364e-05, "loss": 2.3759, "step": 3338 }, { "epoch": 0.33, "learning_rate": 1.5518715873424233e-05, "loss": 2.4879, "step": 3339 }, { "epoch": 0.33, "learning_rate": 1.5516009389782654e-05, "loss": 2.442, "step": 3340 }, { "epoch": 0.33, "learning_rate": 1.5513302325263923e-05, "loss": 2.5068, "step": 3341 }, { "epoch": 0.33, "learning_rate": 1.55105946801531e-05, "loss": 2.4337, "step": 3342 }, { "epoch": 0.33, "learning_rate": 1.550788645473534e-05, "loss": 2.376, "step": 3343 }, { "epoch": 0.34, "learning_rate": 1.5505177649295825e-05, "loss": 2.3729, "step": 3344 }, { "epoch": 0.34, "learning_rate": 1.5502468264119813e-05, "loss": 2.2446, "step": 3345 }, { "epoch": 0.34, "learning_rate": 1.549975829949263e-05, "loss": 2.3174, "step": 3346 }, { "epoch": 0.34, "learning_rate": 1.549704775569965e-05, "loss": 2.3711, "step": 3347 }, { "epoch": 0.34, "learning_rate": 1.5494336633026316e-05, "loss": 2.4897, "step": 3348 }, { "epoch": 0.34, "learning_rate": 1.5491624931758127e-05, "loss": 2.3094, "step": 3349 }, { "epoch": 0.34, "learning_rate": 1.548891265218065e-05, "loss": 2.3568, "step": 3350 }, { "epoch": 0.34, "learning_rate": 1.548619979457951e-05, "loss": 2.3307, "step": 3351 }, { "epoch": 0.34, "learning_rate": 1.548348635924038e-05, "loss": 2.3552, "step": 3352 }, { "epoch": 0.34, "learning_rate": 1.5480772346449014e-05, "loss": 2.4045, "step": 3353 }, { "epoch": 0.34, "learning_rate": 1.547805775649122e-05, "loss": 2.4368, "step": 3354 }, { "epoch": 0.34, "learning_rate": 1.5475342589652854e-05, "loss": 2.3346, "step": 3355 }, { "epoch": 0.34, "learning_rate": 1.5472626846219853e-05, "loss": 2.3527, "step": 3356 }, { "epoch": 0.34, "learning_rate": 1.5469910526478204e-05, "loss": 2.3505, "step": 3357 }, { "epoch": 0.34, "learning_rate": 1.5467193630713954e-05, "loss": 2.3323, "step": 3358 }, { "epoch": 0.34, "learning_rate": 1.5464476159213207e-05, "loss": 2.4141, "step": 3359 }, { "epoch": 0.34, "learning_rate": 1.5461758112262145e-05, "loss": 2.413, "step": 3360 }, { "epoch": 0.34, "learning_rate": 1.545903949014699e-05, "loss": 2.3515, "step": 3361 }, { "epoch": 0.34, "learning_rate": 1.545632029315404e-05, "loss": 2.425, "step": 3362 }, { "epoch": 0.34, "learning_rate": 1.5453600521569635e-05, "loss": 2.4224, "step": 3363 }, { "epoch": 0.34, "learning_rate": 1.54508801756802e-05, "loss": 2.4696, "step": 3364 }, { "epoch": 0.34, "learning_rate": 1.54481592557722e-05, "loss": 2.4034, "step": 3365 }, { "epoch": 0.34, "learning_rate": 1.5445437762132173e-05, "loss": 2.3849, "step": 3366 }, { "epoch": 0.34, "learning_rate": 1.544271569504671e-05, "loss": 2.3911, "step": 3367 }, { "epoch": 0.34, "learning_rate": 1.5439993054802465e-05, "loss": 2.3127, "step": 3368 }, { "epoch": 0.34, "learning_rate": 1.5437269841686154e-05, "loss": 2.3234, "step": 3369 }, { "epoch": 0.34, "learning_rate": 1.5434546055984553e-05, "loss": 2.472, "step": 3370 }, { "epoch": 0.34, "learning_rate": 1.5431821697984494e-05, "loss": 2.381, "step": 3371 }, { "epoch": 0.34, "learning_rate": 1.542909676797287e-05, "loss": 2.2912, "step": 3372 }, { "epoch": 0.34, "learning_rate": 1.5426371266236647e-05, "loss": 2.387, "step": 3373 }, { "epoch": 0.34, "learning_rate": 1.5423645193062826e-05, "loss": 2.3741, "step": 3374 }, { "epoch": 0.34, "learning_rate": 1.5420918548738497e-05, "loss": 2.4545, "step": 3375 }, { "epoch": 0.34, "learning_rate": 1.5418191333550786e-05, "loss": 2.2775, "step": 3376 }, { "epoch": 0.34, "learning_rate": 1.5415463547786894e-05, "loss": 2.38, "step": 3377 }, { "epoch": 0.34, "learning_rate": 1.5412735191734074e-05, "loss": 2.438, "step": 3378 }, { "epoch": 0.34, "learning_rate": 1.5410006265679646e-05, "loss": 2.3675, "step": 3379 }, { "epoch": 0.34, "learning_rate": 1.540727676991099e-05, "loss": 2.3562, "step": 3380 }, { "epoch": 0.34, "learning_rate": 1.540454670471553e-05, "loss": 2.3008, "step": 3381 }, { "epoch": 0.34, "learning_rate": 1.5401816070380773e-05, "loss": 2.3595, "step": 3382 }, { "epoch": 0.34, "learning_rate": 1.5399084867194272e-05, "loss": 2.3783, "step": 3383 }, { "epoch": 0.34, "learning_rate": 1.5396353095443644e-05, "loss": 2.3706, "step": 3384 }, { "epoch": 0.34, "learning_rate": 1.5393620755416562e-05, "loss": 2.4497, "step": 3385 }, { "epoch": 0.34, "learning_rate": 1.5390887847400766e-05, "loss": 2.422, "step": 3386 }, { "epoch": 0.34, "learning_rate": 1.538815437168405e-05, "loss": 2.3039, "step": 3387 }, { "epoch": 0.34, "learning_rate": 1.538542032855427e-05, "loss": 2.3888, "step": 3388 }, { "epoch": 0.34, "learning_rate": 1.5382685718299338e-05, "loss": 2.4105, "step": 3389 }, { "epoch": 0.34, "learning_rate": 1.537995054120723e-05, "loss": 2.3216, "step": 3390 }, { "epoch": 0.34, "learning_rate": 1.537721479756599e-05, "loss": 2.4115, "step": 3391 }, { "epoch": 0.34, "learning_rate": 1.53744784876637e-05, "loss": 2.3318, "step": 3392 }, { "epoch": 0.34, "learning_rate": 1.5371741611788516e-05, "loss": 2.3759, "step": 3393 }, { "epoch": 0.34, "learning_rate": 1.5369004170228654e-05, "loss": 2.3755, "step": 3394 }, { "epoch": 0.34, "learning_rate": 1.5366266163272393e-05, "loss": 2.371, "step": 3395 }, { "epoch": 0.34, "learning_rate": 1.5363527591208055e-05, "loss": 2.3147, "step": 3396 }, { "epoch": 0.34, "learning_rate": 1.5360788454324042e-05, "loss": 2.3801, "step": 3397 }, { "epoch": 0.34, "learning_rate": 1.5358048752908795e-05, "loss": 2.4076, "step": 3398 }, { "epoch": 0.34, "learning_rate": 1.535530848725083e-05, "loss": 2.4955, "step": 3399 }, { "epoch": 0.34, "learning_rate": 1.5352567657638724e-05, "loss": 2.4621, "step": 3400 }, { "epoch": 0.34, "learning_rate": 1.5349826264361095e-05, "loss": 2.4268, "step": 3401 }, { "epoch": 0.34, "learning_rate": 1.5347084307706643e-05, "loss": 2.4798, "step": 3402 }, { "epoch": 0.34, "learning_rate": 1.534434178796411e-05, "loss": 2.3986, "step": 3403 }, { "epoch": 0.34, "learning_rate": 1.5341598705422307e-05, "loss": 2.4147, "step": 3404 }, { "epoch": 0.34, "learning_rate": 1.5338855060370098e-05, "loss": 2.349, "step": 3405 }, { "epoch": 0.34, "learning_rate": 1.5336110853096417e-05, "loss": 2.3698, "step": 3406 }, { "epoch": 0.34, "learning_rate": 1.533336608389024e-05, "loss": 2.3751, "step": 3407 }, { "epoch": 0.34, "learning_rate": 1.5330620753040618e-05, "loss": 2.4723, "step": 3408 }, { "epoch": 0.34, "learning_rate": 1.5327874860836652e-05, "loss": 2.3826, "step": 3409 }, { "epoch": 0.34, "learning_rate": 1.5325128407567504e-05, "loss": 2.4539, "step": 3410 }, { "epoch": 0.34, "learning_rate": 1.5322381393522402e-05, "loss": 2.3439, "step": 3411 }, { "epoch": 0.34, "learning_rate": 1.5319633818990616e-05, "loss": 2.3211, "step": 3412 }, { "epoch": 0.34, "learning_rate": 1.53168856842615e-05, "loss": 2.3617, "step": 3413 }, { "epoch": 0.34, "learning_rate": 1.5314136989624447e-05, "loss": 2.3734, "step": 3414 }, { "epoch": 0.34, "learning_rate": 1.531138773536891e-05, "loss": 2.4399, "step": 3415 }, { "epoch": 0.34, "learning_rate": 1.5308637921784414e-05, "loss": 2.3534, "step": 3416 }, { "epoch": 0.34, "learning_rate": 1.5305887549160533e-05, "loss": 2.3945, "step": 3417 }, { "epoch": 0.34, "learning_rate": 1.5303136617786896e-05, "loss": 2.4129, "step": 3418 }, { "epoch": 0.34, "learning_rate": 1.530038512795321e-05, "loss": 2.4085, "step": 3419 }, { "epoch": 0.34, "learning_rate": 1.529763307994921e-05, "loss": 2.2968, "step": 3420 }, { "epoch": 0.34, "learning_rate": 1.529488047406472e-05, "loss": 2.4196, "step": 3421 }, { "epoch": 0.34, "learning_rate": 1.5292127310589603e-05, "loss": 2.3042, "step": 3422 }, { "epoch": 0.34, "learning_rate": 1.5289373589813794e-05, "loss": 2.4355, "step": 3423 }, { "epoch": 0.34, "learning_rate": 1.528661931202728e-05, "loss": 2.3423, "step": 3424 }, { "epoch": 0.34, "learning_rate": 1.5283864477520102e-05, "loss": 2.2703, "step": 3425 }, { "epoch": 0.34, "learning_rate": 1.5281109086582366e-05, "loss": 2.3926, "step": 3426 }, { "epoch": 0.34, "learning_rate": 1.527835313950424e-05, "loss": 2.3512, "step": 3427 }, { "epoch": 0.34, "learning_rate": 1.5275596636575942e-05, "loss": 2.4376, "step": 3428 }, { "epoch": 0.34, "learning_rate": 1.527283957808775e-05, "loss": 2.348, "step": 3429 }, { "epoch": 0.34, "learning_rate": 1.5270081964330005e-05, "loss": 2.3313, "step": 3430 }, { "epoch": 0.34, "learning_rate": 1.526732379559311e-05, "loss": 2.5136, "step": 3431 }, { "epoch": 0.34, "learning_rate": 1.5264565072167516e-05, "loss": 2.3642, "step": 3432 }, { "epoch": 0.34, "learning_rate": 1.5261805794343734e-05, "loss": 2.4077, "step": 3433 }, { "epoch": 0.34, "learning_rate": 1.525904596241234e-05, "loss": 2.43, "step": 3434 }, { "epoch": 0.34, "learning_rate": 1.5256285576663965e-05, "loss": 2.3207, "step": 3435 }, { "epoch": 0.34, "learning_rate": 1.5253524637389302e-05, "loss": 2.2264, "step": 3436 }, { "epoch": 0.34, "learning_rate": 1.5250763144879096e-05, "loss": 2.4866, "step": 3437 }, { "epoch": 0.34, "learning_rate": 1.5248001099424148e-05, "loss": 2.3555, "step": 3438 }, { "epoch": 0.34, "learning_rate": 1.5245238501315327e-05, "loss": 2.4262, "step": 3439 }, { "epoch": 0.34, "learning_rate": 1.5242475350843556e-05, "loss": 2.3929, "step": 3440 }, { "epoch": 0.34, "learning_rate": 1.5239711648299811e-05, "loss": 2.3616, "step": 3441 }, { "epoch": 0.34, "learning_rate": 1.5236947393975134e-05, "loss": 2.3197, "step": 3442 }, { "epoch": 0.34, "learning_rate": 1.523418258816062e-05, "loss": 2.3843, "step": 3443 }, { "epoch": 0.35, "learning_rate": 1.5231417231147427e-05, "loss": 2.3474, "step": 3444 }, { "epoch": 0.35, "learning_rate": 1.5228651323226766e-05, "loss": 2.4908, "step": 3445 }, { "epoch": 0.35, "learning_rate": 1.5225884864689909e-05, "loss": 2.2984, "step": 3446 }, { "epoch": 0.35, "learning_rate": 1.522311785582818e-05, "loss": 2.4174, "step": 3447 }, { "epoch": 0.35, "learning_rate": 1.522035029693297e-05, "loss": 2.3384, "step": 3448 }, { "epoch": 0.35, "learning_rate": 1.5217582188295725e-05, "loss": 2.4199, "step": 3449 }, { "epoch": 0.35, "learning_rate": 1.5214813530207943e-05, "loss": 2.3845, "step": 3450 }, { "epoch": 0.35, "learning_rate": 1.521204432296119e-05, "loss": 2.3797, "step": 3451 }, { "epoch": 0.35, "learning_rate": 1.5209274566847077e-05, "loss": 2.4626, "step": 3452 }, { "epoch": 0.35, "learning_rate": 1.5206504262157285e-05, "loss": 2.3996, "step": 3453 }, { "epoch": 0.35, "learning_rate": 1.520373340918355e-05, "loss": 2.3868, "step": 3454 }, { "epoch": 0.35, "learning_rate": 1.5200962008217661e-05, "loss": 2.3453, "step": 3455 }, { "epoch": 0.35, "learning_rate": 1.5198190059551463e-05, "loss": 2.4106, "step": 3456 }, { "epoch": 0.35, "learning_rate": 1.519541756347687e-05, "loss": 2.363, "step": 3457 }, { "epoch": 0.35, "learning_rate": 1.5192644520285842e-05, "loss": 2.4482, "step": 3458 }, { "epoch": 0.35, "learning_rate": 1.5189870930270407e-05, "loss": 2.2988, "step": 3459 }, { "epoch": 0.35, "learning_rate": 1.5187096793722638e-05, "loss": 2.3681, "step": 3460 }, { "epoch": 0.35, "learning_rate": 1.5184322110934675e-05, "loss": 2.3642, "step": 3461 }, { "epoch": 0.35, "learning_rate": 1.5181546882198712e-05, "loss": 2.3324, "step": 3462 }, { "epoch": 0.35, "learning_rate": 1.5178771107807004e-05, "loss": 2.3792, "step": 3463 }, { "epoch": 0.35, "learning_rate": 1.517599478805186e-05, "loss": 2.2641, "step": 3464 }, { "epoch": 0.35, "learning_rate": 1.5173217923225645e-05, "loss": 2.3967, "step": 3465 }, { "epoch": 0.35, "learning_rate": 1.5170440513620785e-05, "loss": 2.3612, "step": 3466 }, { "epoch": 0.35, "learning_rate": 1.5167662559529763e-05, "loss": 2.4438, "step": 3467 }, { "epoch": 0.35, "learning_rate": 1.516488406124512e-05, "loss": 2.3817, "step": 3468 }, { "epoch": 0.35, "learning_rate": 1.516210501905945e-05, "loss": 2.3552, "step": 3469 }, { "epoch": 0.35, "learning_rate": 1.5159325433265407e-05, "loss": 2.4741, "step": 3470 }, { "epoch": 0.35, "learning_rate": 1.5156545304155699e-05, "loss": 2.2721, "step": 3471 }, { "epoch": 0.35, "learning_rate": 1.5153764632023102e-05, "loss": 2.4274, "step": 3472 }, { "epoch": 0.35, "learning_rate": 1.5150983417160436e-05, "loss": 2.3995, "step": 3473 }, { "epoch": 0.35, "learning_rate": 1.5148201659860587e-05, "loss": 2.3291, "step": 3474 }, { "epoch": 0.35, "learning_rate": 1.5145419360416491e-05, "loss": 2.4388, "step": 3475 }, { "epoch": 0.35, "learning_rate": 1.514263651912115e-05, "loss": 2.347, "step": 3476 }, { "epoch": 0.35, "learning_rate": 1.5139853136267615e-05, "loss": 2.4206, "step": 3477 }, { "epoch": 0.35, "learning_rate": 1.5137069212148998e-05, "loss": 2.4329, "step": 3478 }, { "epoch": 0.35, "learning_rate": 1.5134284747058465e-05, "loss": 2.372, "step": 3479 }, { "epoch": 0.35, "learning_rate": 1.5131499741289245e-05, "loss": 2.3793, "step": 3480 }, { "epoch": 0.35, "learning_rate": 1.5128714195134617e-05, "loss": 2.3276, "step": 3481 }, { "epoch": 0.35, "learning_rate": 1.512592810888792e-05, "loss": 2.3963, "step": 3482 }, { "epoch": 0.35, "learning_rate": 1.5123141482842551e-05, "loss": 2.2574, "step": 3483 }, { "epoch": 0.35, "learning_rate": 1.5120354317291962e-05, "loss": 2.3647, "step": 3484 }, { "epoch": 0.35, "learning_rate": 1.5117566612529661e-05, "loss": 2.3742, "step": 3485 }, { "epoch": 0.35, "learning_rate": 1.5114778368849217e-05, "loss": 2.399, "step": 3486 }, { "epoch": 0.35, "learning_rate": 1.5111989586544251e-05, "loss": 2.4335, "step": 3487 }, { "epoch": 0.35, "learning_rate": 1.5109200265908444e-05, "loss": 2.3723, "step": 3488 }, { "epoch": 0.35, "learning_rate": 1.5106410407235532e-05, "loss": 2.4773, "step": 3489 }, { "epoch": 0.35, "learning_rate": 1.5103620010819306e-05, "loss": 2.3845, "step": 3490 }, { "epoch": 0.35, "learning_rate": 1.5100829076953623e-05, "loss": 2.3615, "step": 3491 }, { "epoch": 0.35, "learning_rate": 1.5098037605932376e-05, "loss": 2.2796, "step": 3492 }, { "epoch": 0.35, "learning_rate": 1.5095245598049539e-05, "loss": 2.3251, "step": 3493 }, { "epoch": 0.35, "learning_rate": 1.509245305359913e-05, "loss": 2.3982, "step": 3494 }, { "epoch": 0.35, "learning_rate": 1.5089659972875221e-05, "loss": 2.3419, "step": 3495 }, { "epoch": 0.35, "learning_rate": 1.5086866356171945e-05, "loss": 2.3878, "step": 3496 }, { "epoch": 0.35, "learning_rate": 1.5084072203783493e-05, "loss": 2.424, "step": 3497 }, { "epoch": 0.35, "learning_rate": 1.5081277516004109e-05, "loss": 2.4363, "step": 3498 }, { "epoch": 0.35, "learning_rate": 1.5078482293128093e-05, "loss": 2.3935, "step": 3499 }, { "epoch": 0.35, "learning_rate": 1.507568653544981e-05, "loss": 2.3877, "step": 3500 }, { "epoch": 0.35, "learning_rate": 1.5072890243263665e-05, "loss": 2.4626, "step": 3501 }, { "epoch": 0.35, "learning_rate": 1.5070093416864132e-05, "loss": 2.3627, "step": 3502 }, { "epoch": 0.35, "learning_rate": 1.5067296056545739e-05, "loss": 2.3281, "step": 3503 }, { "epoch": 0.35, "learning_rate": 1.5064498162603069e-05, "loss": 2.3997, "step": 3504 }, { "epoch": 0.35, "learning_rate": 1.506169973533076e-05, "loss": 2.3829, "step": 3505 }, { "epoch": 0.35, "learning_rate": 1.5058900775023506e-05, "loss": 2.3243, "step": 3506 }, { "epoch": 0.35, "learning_rate": 1.5056101281976063e-05, "loss": 2.4813, "step": 3507 }, { "epoch": 0.35, "learning_rate": 1.5053301256483235e-05, "loss": 2.3448, "step": 3508 }, { "epoch": 0.35, "learning_rate": 1.5050500698839887e-05, "loss": 2.3439, "step": 3509 }, { "epoch": 0.35, "learning_rate": 1.5047699609340937e-05, "loss": 2.3886, "step": 3510 }, { "epoch": 0.35, "learning_rate": 1.5044897988281365e-05, "loss": 2.3163, "step": 3511 }, { "epoch": 0.35, "learning_rate": 1.5042095835956198e-05, "loss": 2.3705, "step": 3512 }, { "epoch": 0.35, "learning_rate": 1.5039293152660525e-05, "loss": 2.4274, "step": 3513 }, { "epoch": 0.35, "learning_rate": 1.5036489938689492e-05, "loss": 2.4672, "step": 3514 }, { "epoch": 0.35, "learning_rate": 1.5033686194338293e-05, "loss": 2.4012, "step": 3515 }, { "epoch": 0.35, "learning_rate": 1.5030881919902189e-05, "loss": 2.4217, "step": 3516 }, { "epoch": 0.35, "learning_rate": 1.5028077115676487e-05, "loss": 2.2993, "step": 3517 }, { "epoch": 0.35, "learning_rate": 1.5025271781956559e-05, "loss": 2.322, "step": 3518 }, { "epoch": 0.35, "learning_rate": 1.502246591903782e-05, "loss": 2.4018, "step": 3519 }, { "epoch": 0.35, "learning_rate": 1.5019659527215757e-05, "loss": 2.3876, "step": 3520 }, { "epoch": 0.35, "learning_rate": 1.5016852606785901e-05, "loss": 2.4514, "step": 3521 }, { "epoch": 0.35, "learning_rate": 1.5014045158043838e-05, "loss": 2.3822, "step": 3522 }, { "epoch": 0.35, "learning_rate": 1.501123718128522e-05, "loss": 2.5222, "step": 3523 }, { "epoch": 0.35, "learning_rate": 1.500842867680574e-05, "loss": 2.3716, "step": 3524 }, { "epoch": 0.35, "learning_rate": 1.5005619644901161e-05, "loss": 2.2592, "step": 3525 }, { "epoch": 0.35, "learning_rate": 1.5002810085867291e-05, "loss": 2.4146, "step": 3526 }, { "epoch": 0.35, "learning_rate": 1.5000000000000002e-05, "loss": 2.4048, "step": 3527 }, { "epoch": 0.35, "learning_rate": 1.4997189387595212e-05, "loss": 2.4171, "step": 3528 }, { "epoch": 0.35, "learning_rate": 1.4994378248948904e-05, "loss": 2.5063, "step": 3529 }, { "epoch": 0.35, "learning_rate": 1.4991566584357111e-05, "loss": 2.3754, "step": 3530 }, { "epoch": 0.35, "learning_rate": 1.4988754394115921e-05, "loss": 2.3126, "step": 3531 }, { "epoch": 0.35, "learning_rate": 1.4985941678521479e-05, "loss": 2.4313, "step": 3532 }, { "epoch": 0.35, "learning_rate": 1.4983128437869984e-05, "loss": 2.4669, "step": 3533 }, { "epoch": 0.35, "learning_rate": 1.4980314672457696e-05, "loss": 2.2462, "step": 3534 }, { "epoch": 0.35, "learning_rate": 1.497750038258092e-05, "loss": 2.4592, "step": 3535 }, { "epoch": 0.35, "learning_rate": 1.4974685568536025e-05, "loss": 2.4263, "step": 3536 }, { "epoch": 0.35, "learning_rate": 1.497187023061943e-05, "loss": 2.4033, "step": 3537 }, { "epoch": 0.35, "learning_rate": 1.4969054369127613e-05, "loss": 2.4743, "step": 3538 }, { "epoch": 0.35, "learning_rate": 1.4966237984357105e-05, "loss": 2.4004, "step": 3539 }, { "epoch": 0.35, "learning_rate": 1.4963421076604495e-05, "loss": 2.3632, "step": 3540 }, { "epoch": 0.35, "learning_rate": 1.4960603646166416e-05, "loss": 2.3694, "step": 3541 }, { "epoch": 0.35, "learning_rate": 1.4957785693339573e-05, "loss": 2.3576, "step": 3542 }, { "epoch": 0.35, "learning_rate": 1.4954967218420718e-05, "loss": 2.3778, "step": 3543 }, { "epoch": 0.36, "learning_rate": 1.4952148221706649e-05, "loss": 2.4729, "step": 3544 }, { "epoch": 0.36, "learning_rate": 1.4949328703494237e-05, "loss": 2.4078, "step": 3545 }, { "epoch": 0.36, "learning_rate": 1.4946508664080389e-05, "loss": 2.407, "step": 3546 }, { "epoch": 0.36, "learning_rate": 1.4943688103762086e-05, "loss": 2.3556, "step": 3547 }, { "epoch": 0.36, "learning_rate": 1.4940867022836348e-05, "loss": 2.3679, "step": 3548 }, { "epoch": 0.36, "learning_rate": 1.4938045421600258e-05, "loss": 2.4273, "step": 3549 }, { "epoch": 0.36, "learning_rate": 1.4935223300350951e-05, "loss": 2.3568, "step": 3550 }, { "epoch": 0.36, "learning_rate": 1.4932400659385618e-05, "loss": 2.3485, "step": 3551 }, { "epoch": 0.36, "learning_rate": 1.4929577499001506e-05, "loss": 2.3912, "step": 3552 }, { "epoch": 0.36, "learning_rate": 1.4926753819495912e-05, "loss": 2.3954, "step": 3553 }, { "epoch": 0.36, "learning_rate": 1.4923929621166191e-05, "loss": 2.2538, "step": 3554 }, { "epoch": 0.36, "learning_rate": 1.4921104904309755e-05, "loss": 2.4746, "step": 3555 }, { "epoch": 0.36, "learning_rate": 1.4918279669224065e-05, "loss": 2.3565, "step": 3556 }, { "epoch": 0.36, "learning_rate": 1.4915453916206641e-05, "loss": 2.363, "step": 3557 }, { "epoch": 0.36, "learning_rate": 1.4912627645555055e-05, "loss": 2.4443, "step": 3558 }, { "epoch": 0.36, "learning_rate": 1.4909800857566934e-05, "loss": 2.3257, "step": 3559 }, { "epoch": 0.36, "learning_rate": 1.490697355253996e-05, "loss": 2.3169, "step": 3560 }, { "epoch": 0.36, "learning_rate": 1.4904145730771873e-05, "loss": 2.4033, "step": 3561 }, { "epoch": 0.36, "learning_rate": 1.490131739256046e-05, "loss": 2.2746, "step": 3562 }, { "epoch": 0.36, "learning_rate": 1.4898488538203568e-05, "loss": 2.3009, "step": 3563 }, { "epoch": 0.36, "learning_rate": 1.4895659167999095e-05, "loss": 2.3224, "step": 3564 }, { "epoch": 0.36, "learning_rate": 1.4892829282244997e-05, "loss": 2.3767, "step": 3565 }, { "epoch": 0.36, "learning_rate": 1.4889998881239281e-05, "loss": 2.4362, "step": 3566 }, { "epoch": 0.36, "learning_rate": 1.4887167965280007e-05, "loss": 2.3184, "step": 3567 }, { "epoch": 0.36, "learning_rate": 1.4884336534665295e-05, "loss": 2.4051, "step": 3568 }, { "epoch": 0.36, "learning_rate": 1.4881504589693317e-05, "loss": 2.3925, "step": 3569 }, { "epoch": 0.36, "learning_rate": 1.4878672130662295e-05, "loss": 2.4979, "step": 3570 }, { "epoch": 0.36, "learning_rate": 1.4875839157870508e-05, "loss": 2.3141, "step": 3571 }, { "epoch": 0.36, "learning_rate": 1.4873005671616292e-05, "loss": 2.3944, "step": 3572 }, { "epoch": 0.36, "learning_rate": 1.4870171672198033e-05, "loss": 2.3988, "step": 3573 }, { "epoch": 0.36, "learning_rate": 1.4867337159914171e-05, "loss": 2.4739, "step": 3574 }, { "epoch": 0.36, "learning_rate": 1.4864502135063205e-05, "loss": 2.4037, "step": 3575 }, { "epoch": 0.36, "learning_rate": 1.486166659794368e-05, "loss": 2.3988, "step": 3576 }, { "epoch": 0.36, "learning_rate": 1.4858830548854202e-05, "loss": 2.3871, "step": 3577 }, { "epoch": 0.36, "learning_rate": 1.4855993988093427e-05, "loss": 2.3685, "step": 3578 }, { "epoch": 0.36, "learning_rate": 1.4853156915960067e-05, "loss": 2.3813, "step": 3579 }, { "epoch": 0.36, "learning_rate": 1.485031933275289e-05, "loss": 2.3414, "step": 3580 }, { "epoch": 0.36, "learning_rate": 1.484748123877071e-05, "loss": 2.4011, "step": 3581 }, { "epoch": 0.36, "learning_rate": 1.4844642634312396e-05, "loss": 2.3821, "step": 3582 }, { "epoch": 0.36, "learning_rate": 1.4841803519676882e-05, "loss": 2.2948, "step": 3583 }, { "epoch": 0.36, "learning_rate": 1.483896389516315e-05, "loss": 2.346, "step": 3584 }, { "epoch": 0.36, "learning_rate": 1.4836123761070224e-05, "loss": 2.3692, "step": 3585 }, { "epoch": 0.36, "learning_rate": 1.4833283117697201e-05, "loss": 2.3854, "step": 3586 }, { "epoch": 0.36, "learning_rate": 1.4830441965343214e-05, "loss": 2.4264, "step": 3587 }, { "epoch": 0.36, "learning_rate": 1.4827600304307464e-05, "loss": 2.433, "step": 3588 }, { "epoch": 0.36, "learning_rate": 1.4824758134889196e-05, "loss": 2.393, "step": 3589 }, { "epoch": 0.36, "learning_rate": 1.4821915457387712e-05, "loss": 2.4389, "step": 3590 }, { "epoch": 0.36, "learning_rate": 1.4819072272102367e-05, "loss": 2.3514, "step": 3591 }, { "epoch": 0.36, "learning_rate": 1.481622857933257e-05, "loss": 2.3455, "step": 3592 }, { "epoch": 0.36, "learning_rate": 1.4813384379377784e-05, "loss": 2.4271, "step": 3593 }, { "epoch": 0.36, "learning_rate": 1.4810539672537524e-05, "loss": 2.3586, "step": 3594 }, { "epoch": 0.36, "learning_rate": 1.4807694459111362e-05, "loss": 2.3664, "step": 3595 }, { "epoch": 0.36, "learning_rate": 1.4804848739398914e-05, "loss": 2.4191, "step": 3596 }, { "epoch": 0.36, "learning_rate": 1.480200251369986e-05, "loss": 2.3492, "step": 3597 }, { "epoch": 0.36, "learning_rate": 1.4799155782313927e-05, "loss": 2.4197, "step": 3598 }, { "epoch": 0.36, "learning_rate": 1.47963085455409e-05, "loss": 2.3245, "step": 3599 }, { "epoch": 0.36, "learning_rate": 1.479346080368061e-05, "loss": 2.3924, "step": 3600 }, { "epoch": 0.36, "learning_rate": 1.479061255703295e-05, "loss": 2.3522, "step": 3601 }, { "epoch": 0.36, "learning_rate": 1.478776380589786e-05, "loss": 2.4138, "step": 3602 }, { "epoch": 0.36, "learning_rate": 1.4784914550575334e-05, "loss": 2.3937, "step": 3603 }, { "epoch": 0.36, "learning_rate": 1.4782064791365419e-05, "loss": 2.3869, "step": 3604 }, { "epoch": 0.36, "learning_rate": 1.477921452856822e-05, "loss": 2.4273, "step": 3605 }, { "epoch": 0.36, "learning_rate": 1.4776363762483887e-05, "loss": 2.395, "step": 3606 }, { "epoch": 0.36, "learning_rate": 1.4773512493412633e-05, "loss": 2.3299, "step": 3607 }, { "epoch": 0.36, "learning_rate": 1.4770660721654708e-05, "loss": 2.3653, "step": 3608 }, { "epoch": 0.36, "learning_rate": 1.4767808447510432e-05, "loss": 2.4134, "step": 3609 }, { "epoch": 0.36, "learning_rate": 1.4764955671280172e-05, "loss": 2.4192, "step": 3610 }, { "epoch": 0.36, "learning_rate": 1.4762102393264344e-05, "loss": 2.3705, "step": 3611 }, { "epoch": 0.36, "learning_rate": 1.4759248613763417e-05, "loss": 2.3247, "step": 3612 }, { "epoch": 0.36, "learning_rate": 1.4756394333077919e-05, "loss": 2.3472, "step": 3613 }, { "epoch": 0.36, "learning_rate": 1.4753539551508428e-05, "loss": 2.3964, "step": 3614 }, { "epoch": 0.36, "learning_rate": 1.4750684269355571e-05, "loss": 2.3292, "step": 3615 }, { "epoch": 0.36, "learning_rate": 1.4747828486920033e-05, "loss": 2.3555, "step": 3616 }, { "epoch": 0.36, "learning_rate": 1.4744972204502548e-05, "loss": 2.3547, "step": 3617 }, { "epoch": 0.36, "learning_rate": 1.4742115422403904e-05, "loss": 2.415, "step": 3618 }, { "epoch": 0.36, "learning_rate": 1.4739258140924942e-05, "loss": 2.3654, "step": 3619 }, { "epoch": 0.36, "learning_rate": 1.4736400360366554e-05, "loss": 2.3239, "step": 3620 }, { "epoch": 0.36, "learning_rate": 1.4733542081029688e-05, "loss": 2.4466, "step": 3621 }, { "epoch": 0.36, "learning_rate": 1.4730683303215338e-05, "loss": 2.3883, "step": 3622 }, { "epoch": 0.36, "learning_rate": 1.472782402722456e-05, "loss": 2.3084, "step": 3623 }, { "epoch": 0.36, "learning_rate": 1.4724964253358456e-05, "loss": 2.3397, "step": 3624 }, { "epoch": 0.36, "learning_rate": 1.472210398191818e-05, "loss": 2.3082, "step": 3625 }, { "epoch": 0.36, "learning_rate": 1.471924321320494e-05, "loss": 2.4213, "step": 3626 }, { "epoch": 0.36, "learning_rate": 1.4716381947519996e-05, "loss": 2.3015, "step": 3627 }, { "epoch": 0.36, "learning_rate": 1.4713520185164662e-05, "loss": 2.3906, "step": 3628 }, { "epoch": 0.36, "learning_rate": 1.4710657926440304e-05, "loss": 2.4324, "step": 3629 }, { "epoch": 0.36, "learning_rate": 1.4707795171648338e-05, "loss": 2.3798, "step": 3630 }, { "epoch": 0.36, "learning_rate": 1.470493192109023e-05, "loss": 2.4588, "step": 3631 }, { "epoch": 0.36, "learning_rate": 1.4702068175067509e-05, "loss": 2.4782, "step": 3632 }, { "epoch": 0.36, "learning_rate": 1.4699203933881746e-05, "loss": 2.3527, "step": 3633 }, { "epoch": 0.36, "learning_rate": 1.4696339197834564e-05, "loss": 2.3989, "step": 3634 }, { "epoch": 0.36, "learning_rate": 1.4693473967227644e-05, "loss": 2.2999, "step": 3635 }, { "epoch": 0.36, "learning_rate": 1.4690608242362714e-05, "loss": 2.3798, "step": 3636 }, { "epoch": 0.36, "learning_rate": 1.468774202354156e-05, "loss": 2.5047, "step": 3637 }, { "epoch": 0.36, "learning_rate": 1.4684875311066017e-05, "loss": 2.4243, "step": 3638 }, { "epoch": 0.36, "learning_rate": 1.4682008105237967e-05, "loss": 2.3338, "step": 3639 }, { "epoch": 0.36, "learning_rate": 1.4679140406359346e-05, "loss": 2.4122, "step": 3640 }, { "epoch": 0.36, "learning_rate": 1.4676272214732153e-05, "loss": 2.3377, "step": 3641 }, { "epoch": 0.36, "learning_rate": 1.4673403530658426e-05, "loss": 2.3181, "step": 3642 }, { "epoch": 0.36, "learning_rate": 1.4670534354440255e-05, "loss": 2.3642, "step": 3643 }, { "epoch": 0.37, "learning_rate": 1.466766468637979e-05, "loss": 2.4194, "step": 3644 }, { "epoch": 0.37, "learning_rate": 1.4664794526779227e-05, "loss": 2.4604, "step": 3645 }, { "epoch": 0.37, "learning_rate": 1.4661923875940819e-05, "loss": 2.4457, "step": 3646 }, { "epoch": 0.37, "learning_rate": 1.4659052734166861e-05, "loss": 2.3865, "step": 3647 }, { "epoch": 0.37, "learning_rate": 1.465618110175971e-05, "loss": 2.428, "step": 3648 }, { "epoch": 0.37, "learning_rate": 1.465330897902177e-05, "loss": 2.2807, "step": 3649 }, { "epoch": 0.37, "learning_rate": 1.4650436366255494e-05, "loss": 2.3718, "step": 3650 }, { "epoch": 0.37, "learning_rate": 1.4647563263763394e-05, "loss": 2.3485, "step": 3651 }, { "epoch": 0.37, "learning_rate": 1.4644689671848027e-05, "loss": 2.4384, "step": 3652 }, { "epoch": 0.37, "learning_rate": 1.4641815590812003e-05, "loss": 2.3273, "step": 3653 }, { "epoch": 0.37, "learning_rate": 1.4638941020957984e-05, "loss": 2.402, "step": 3654 }, { "epoch": 0.37, "learning_rate": 1.4636065962588687e-05, "loss": 2.4148, "step": 3655 }, { "epoch": 0.37, "learning_rate": 1.4633190416006874e-05, "loss": 2.5017, "step": 3656 }, { "epoch": 0.37, "learning_rate": 1.4630314381515365e-05, "loss": 2.3907, "step": 3657 }, { "epoch": 0.37, "learning_rate": 1.4627437859417024e-05, "loss": 2.453, "step": 3658 }, { "epoch": 0.37, "learning_rate": 1.4624560850014774e-05, "loss": 2.3811, "step": 3659 }, { "epoch": 0.37, "learning_rate": 1.4621683353611583e-05, "loss": 2.5021, "step": 3660 }, { "epoch": 0.37, "learning_rate": 1.4618805370510473e-05, "loss": 2.3589, "step": 3661 }, { "epoch": 0.37, "learning_rate": 1.4615926901014516e-05, "loss": 2.3253, "step": 3662 }, { "epoch": 0.37, "learning_rate": 1.4613047945426841e-05, "loss": 2.3521, "step": 3663 }, { "epoch": 0.37, "learning_rate": 1.4610168504050623e-05, "loss": 2.51, "step": 3664 }, { "epoch": 0.37, "learning_rate": 1.4607288577189084e-05, "loss": 2.5034, "step": 3665 }, { "epoch": 0.37, "learning_rate": 1.4604408165145504e-05, "loss": 2.3595, "step": 3666 }, { "epoch": 0.37, "learning_rate": 1.4601527268223214e-05, "loss": 2.4356, "step": 3667 }, { "epoch": 0.37, "learning_rate": 1.4598645886725593e-05, "loss": 2.2624, "step": 3668 }, { "epoch": 0.37, "learning_rate": 1.4595764020956073e-05, "loss": 2.2833, "step": 3669 }, { "epoch": 0.37, "learning_rate": 1.4592881671218134e-05, "loss": 2.4065, "step": 3670 }, { "epoch": 0.37, "learning_rate": 1.4589998837815312e-05, "loss": 2.4101, "step": 3671 }, { "epoch": 0.37, "learning_rate": 1.4587115521051185e-05, "loss": 2.3949, "step": 3672 }, { "epoch": 0.37, "learning_rate": 1.4584231721229395e-05, "loss": 2.4073, "step": 3673 }, { "epoch": 0.37, "learning_rate": 1.4581347438653624e-05, "loss": 2.4084, "step": 3674 }, { "epoch": 0.37, "learning_rate": 1.4578462673627607e-05, "loss": 2.3853, "step": 3675 }, { "epoch": 0.37, "learning_rate": 1.4575577426455134e-05, "loss": 2.4491, "step": 3676 }, { "epoch": 0.37, "learning_rate": 1.4572691697440045e-05, "loss": 2.2853, "step": 3677 }, { "epoch": 0.37, "learning_rate": 1.4569805486886223e-05, "loss": 2.37, "step": 3678 }, { "epoch": 0.37, "learning_rate": 1.4566918795097615e-05, "loss": 2.3907, "step": 3679 }, { "epoch": 0.37, "learning_rate": 1.4564031622378205e-05, "loss": 2.4445, "step": 3680 }, { "epoch": 0.37, "learning_rate": 1.4561143969032039e-05, "loss": 2.4007, "step": 3681 }, { "epoch": 0.37, "learning_rate": 1.4558255835363206e-05, "loss": 2.3797, "step": 3682 }, { "epoch": 0.37, "learning_rate": 1.4555367221675847e-05, "loss": 2.3162, "step": 3683 }, { "epoch": 0.37, "learning_rate": 1.4552478128274154e-05, "loss": 2.3577, "step": 3684 }, { "epoch": 0.37, "learning_rate": 1.4549588555462373e-05, "loss": 2.3054, "step": 3685 }, { "epoch": 0.37, "learning_rate": 1.4546698503544799e-05, "loss": 2.4848, "step": 3686 }, { "epoch": 0.37, "learning_rate": 1.4543807972825772e-05, "loss": 2.3886, "step": 3687 }, { "epoch": 0.37, "learning_rate": 1.4540916963609687e-05, "loss": 2.3151, "step": 3688 }, { "epoch": 0.37, "learning_rate": 1.4538025476200992e-05, "loss": 2.4467, "step": 3689 }, { "epoch": 0.37, "learning_rate": 1.4535133510904183e-05, "loss": 2.3552, "step": 3690 }, { "epoch": 0.37, "learning_rate": 1.4532241068023803e-05, "loss": 2.4111, "step": 3691 }, { "epoch": 0.37, "learning_rate": 1.4529348147864446e-05, "loss": 2.3754, "step": 3692 }, { "epoch": 0.37, "learning_rate": 1.4526454750730761e-05, "loss": 2.4188, "step": 3693 }, { "epoch": 0.37, "learning_rate": 1.4523560876927444e-05, "loss": 2.3628, "step": 3694 }, { "epoch": 0.37, "learning_rate": 1.452066652675924e-05, "loss": 2.3397, "step": 3695 }, { "epoch": 0.37, "learning_rate": 1.451777170053095e-05, "loss": 2.3392, "step": 3696 }, { "epoch": 0.37, "learning_rate": 1.4514876398547414e-05, "loss": 2.3681, "step": 3697 }, { "epoch": 0.37, "learning_rate": 1.4511980621113537e-05, "loss": 2.4531, "step": 3698 }, { "epoch": 0.37, "learning_rate": 1.4509084368534262e-05, "loss": 2.4249, "step": 3699 }, { "epoch": 0.37, "learning_rate": 1.4506187641114584e-05, "loss": 2.3175, "step": 3700 }, { "epoch": 0.37, "learning_rate": 1.4503290439159554e-05, "loss": 2.3252, "step": 3701 }, { "epoch": 0.37, "learning_rate": 1.4500392762974269e-05, "loss": 2.4745, "step": 3702 }, { "epoch": 0.37, "learning_rate": 1.4497494612863874e-05, "loss": 2.4772, "step": 3703 }, { "epoch": 0.37, "learning_rate": 1.4494595989133566e-05, "loss": 2.4214, "step": 3704 }, { "epoch": 0.37, "learning_rate": 1.4491696892088594e-05, "loss": 2.3326, "step": 3705 }, { "epoch": 0.37, "learning_rate": 1.4488797322034252e-05, "loss": 2.2997, "step": 3706 }, { "epoch": 0.37, "learning_rate": 1.4485897279275885e-05, "loss": 2.2989, "step": 3707 }, { "epoch": 0.37, "learning_rate": 1.4482996764118894e-05, "loss": 2.2936, "step": 3708 }, { "epoch": 0.37, "learning_rate": 1.4480095776868724e-05, "loss": 2.4096, "step": 3709 }, { "epoch": 0.37, "learning_rate": 1.4477194317830868e-05, "loss": 2.4348, "step": 3710 }, { "epoch": 0.37, "learning_rate": 1.4474292387310873e-05, "loss": 2.398, "step": 3711 }, { "epoch": 0.37, "learning_rate": 1.4471389985614334e-05, "loss": 2.3477, "step": 3712 }, { "epoch": 0.37, "learning_rate": 1.4468487113046896e-05, "loss": 2.3782, "step": 3713 }, { "epoch": 0.37, "learning_rate": 1.4465583769914253e-05, "loss": 2.3886, "step": 3714 }, { "epoch": 0.37, "learning_rate": 1.4462679956522148e-05, "loss": 2.2886, "step": 3715 }, { "epoch": 0.37, "learning_rate": 1.4459775673176375e-05, "loss": 2.2773, "step": 3716 }, { "epoch": 0.37, "learning_rate": 1.4456870920182777e-05, "loss": 2.3783, "step": 3717 }, { "epoch": 0.37, "learning_rate": 1.4453965697847245e-05, "loss": 2.364, "step": 3718 }, { "epoch": 0.37, "learning_rate": 1.4451060006475723e-05, "loss": 2.3435, "step": 3719 }, { "epoch": 0.37, "learning_rate": 1.4448153846374203e-05, "loss": 2.3785, "step": 3720 }, { "epoch": 0.37, "learning_rate": 1.444524721784872e-05, "loss": 2.4439, "step": 3721 }, { "epoch": 0.37, "learning_rate": 1.444234012120537e-05, "loss": 2.43, "step": 3722 }, { "epoch": 0.37, "learning_rate": 1.4439432556750288e-05, "loss": 2.4443, "step": 3723 }, { "epoch": 0.37, "learning_rate": 1.4436524524789663e-05, "loss": 2.3653, "step": 3724 }, { "epoch": 0.37, "learning_rate": 1.4433616025629734e-05, "loss": 2.3833, "step": 3725 }, { "epoch": 0.37, "learning_rate": 1.4430707059576782e-05, "loss": 2.3127, "step": 3726 }, { "epoch": 0.37, "learning_rate": 1.4427797626937155e-05, "loss": 2.4703, "step": 3727 }, { "epoch": 0.37, "learning_rate": 1.4424887728017228e-05, "loss": 2.3573, "step": 3728 }, { "epoch": 0.37, "learning_rate": 1.4421977363123438e-05, "loss": 2.3926, "step": 3729 }, { "epoch": 0.37, "learning_rate": 1.4419066532562266e-05, "loss": 2.3957, "step": 3730 }, { "epoch": 0.37, "learning_rate": 1.4416155236640251e-05, "loss": 2.3867, "step": 3731 }, { "epoch": 0.37, "learning_rate": 1.4413243475663968e-05, "loss": 2.3889, "step": 3732 }, { "epoch": 0.37, "learning_rate": 1.4410331249940049e-05, "loss": 2.3859, "step": 3733 }, { "epoch": 0.37, "learning_rate": 1.4407418559775172e-05, "loss": 2.3757, "step": 3734 }, { "epoch": 0.37, "learning_rate": 1.440450540547607e-05, "loss": 2.4291, "step": 3735 }, { "epoch": 0.37, "learning_rate": 1.4401591787349513e-05, "loss": 2.3521, "step": 3736 }, { "epoch": 0.37, "learning_rate": 1.4398677705702332e-05, "loss": 2.338, "step": 3737 }, { "epoch": 0.37, "learning_rate": 1.43957631608414e-05, "loss": 2.3381, "step": 3738 }, { "epoch": 0.37, "learning_rate": 1.439284815307364e-05, "loss": 2.297, "step": 3739 }, { "epoch": 0.37, "learning_rate": 1.4389932682706025e-05, "loss": 2.3396, "step": 3740 }, { "epoch": 0.37, "learning_rate": 1.4387016750045578e-05, "loss": 2.4118, "step": 3741 }, { "epoch": 0.37, "learning_rate": 1.4384100355399361e-05, "loss": 2.3822, "step": 3742 }, { "epoch": 0.38, "learning_rate": 1.43811834990745e-05, "loss": 2.4048, "step": 3743 }, { "epoch": 0.38, "learning_rate": 1.437826618137816e-05, "loss": 2.372, "step": 3744 }, { "epoch": 0.38, "learning_rate": 1.4375348402617554e-05, "loss": 2.4095, "step": 3745 }, { "epoch": 0.38, "learning_rate": 1.4372430163099948e-05, "loss": 2.3314, "step": 3746 }, { "epoch": 0.38, "learning_rate": 1.4369511463132656e-05, "loss": 2.3058, "step": 3747 }, { "epoch": 0.38, "learning_rate": 1.4366592303023035e-05, "loss": 2.3192, "step": 3748 }, { "epoch": 0.38, "learning_rate": 1.4363672683078495e-05, "loss": 2.392, "step": 3749 }, { "epoch": 0.38, "learning_rate": 1.4360752603606498e-05, "loss": 2.4697, "step": 3750 }, { "epoch": 0.38, "learning_rate": 1.4357832064914548e-05, "loss": 2.3331, "step": 3751 }, { "epoch": 0.38, "learning_rate": 1.4354911067310197e-05, "loss": 2.3843, "step": 3752 }, { "epoch": 0.38, "learning_rate": 1.4351989611101052e-05, "loss": 2.5028, "step": 3753 }, { "epoch": 0.38, "learning_rate": 1.4349067696594765e-05, "loss": 2.4196, "step": 3754 }, { "epoch": 0.38, "learning_rate": 1.434614532409903e-05, "loss": 2.3801, "step": 3755 }, { "epoch": 0.38, "learning_rate": 1.4343222493921595e-05, "loss": 2.3669, "step": 3756 }, { "epoch": 0.38, "learning_rate": 1.4340299206370263e-05, "loss": 2.3827, "step": 3757 }, { "epoch": 0.38, "learning_rate": 1.4337375461752872e-05, "loss": 2.3532, "step": 3758 }, { "epoch": 0.38, "learning_rate": 1.4334451260377317e-05, "loss": 2.3661, "step": 3759 }, { "epoch": 0.38, "learning_rate": 1.4331526602551538e-05, "loss": 2.3794, "step": 3760 }, { "epoch": 0.38, "learning_rate": 1.432860148858352e-05, "loss": 2.3013, "step": 3761 }, { "epoch": 0.38, "learning_rate": 1.4325675918781304e-05, "loss": 2.4512, "step": 3762 }, { "epoch": 0.38, "learning_rate": 1.4322749893452972e-05, "loss": 2.3559, "step": 3763 }, { "epoch": 0.38, "learning_rate": 1.4319823412906657e-05, "loss": 2.3981, "step": 3764 }, { "epoch": 0.38, "learning_rate": 1.4316896477450542e-05, "loss": 2.1445, "step": 3765 }, { "epoch": 0.38, "learning_rate": 1.4313969087392852e-05, "loss": 2.4004, "step": 3766 }, { "epoch": 0.38, "learning_rate": 1.4311041243041862e-05, "loss": 2.3515, "step": 3767 }, { "epoch": 0.38, "learning_rate": 1.43081129447059e-05, "loss": 2.4598, "step": 3768 }, { "epoch": 0.38, "learning_rate": 1.4305184192693334e-05, "loss": 2.3722, "step": 3769 }, { "epoch": 0.38, "learning_rate": 1.4302254987312582e-05, "loss": 2.3313, "step": 3770 }, { "epoch": 0.38, "learning_rate": 1.4299325328872118e-05, "loss": 2.4085, "step": 3771 }, { "epoch": 0.38, "learning_rate": 1.4296395217680453e-05, "loss": 2.4181, "step": 3772 }, { "epoch": 0.38, "learning_rate": 1.429346465404615e-05, "loss": 2.2955, "step": 3773 }, { "epoch": 0.38, "learning_rate": 1.429053363827782e-05, "loss": 2.4412, "step": 3774 }, { "epoch": 0.38, "learning_rate": 1.4287602170684119e-05, "loss": 2.3102, "step": 3775 }, { "epoch": 0.38, "learning_rate": 1.4284670251573754e-05, "loss": 2.4258, "step": 3776 }, { "epoch": 0.38, "learning_rate": 1.428173788125548e-05, "loss": 2.3541, "step": 3777 }, { "epoch": 0.38, "learning_rate": 1.4278805060038092e-05, "loss": 2.2582, "step": 3778 }, { "epoch": 0.38, "learning_rate": 1.4275871788230443e-05, "loss": 2.3643, "step": 3779 }, { "epoch": 0.38, "learning_rate": 1.4272938066141429e-05, "loss": 2.3978, "step": 3780 }, { "epoch": 0.38, "learning_rate": 1.4270003894079988e-05, "loss": 2.3461, "step": 3781 }, { "epoch": 0.38, "learning_rate": 1.4267069272355116e-05, "loss": 2.4202, "step": 3782 }, { "epoch": 0.38, "learning_rate": 1.4264134201275846e-05, "loss": 2.4215, "step": 3783 }, { "epoch": 0.38, "learning_rate": 1.4261198681151266e-05, "loss": 2.4719, "step": 3784 }, { "epoch": 0.38, "learning_rate": 1.4258262712290507e-05, "loss": 2.3438, "step": 3785 }, { "epoch": 0.38, "learning_rate": 1.4255326295002754e-05, "loss": 2.2096, "step": 3786 }, { "epoch": 0.38, "learning_rate": 1.4252389429597224e-05, "loss": 2.5092, "step": 3787 }, { "epoch": 0.38, "learning_rate": 1.4249452116383193e-05, "loss": 2.4468, "step": 3788 }, { "epoch": 0.38, "learning_rate": 1.424651435566999e-05, "loss": 2.4372, "step": 3789 }, { "epoch": 0.38, "learning_rate": 1.4243576147766973e-05, "loss": 2.332, "step": 3790 }, { "epoch": 0.38, "learning_rate": 1.4240637492983567e-05, "loss": 2.3861, "step": 3791 }, { "epoch": 0.38, "learning_rate": 1.4237698391629224e-05, "loss": 2.3868, "step": 3792 }, { "epoch": 0.38, "learning_rate": 1.4234758844013463e-05, "loss": 2.4646, "step": 3793 }, { "epoch": 0.38, "learning_rate": 1.4231818850445835e-05, "loss": 2.3797, "step": 3794 }, { "epoch": 0.38, "learning_rate": 1.4228878411235946e-05, "loss": 2.4058, "step": 3795 }, { "epoch": 0.38, "learning_rate": 1.4225937526693445e-05, "loss": 2.4065, "step": 3796 }, { "epoch": 0.38, "learning_rate": 1.4222996197128031e-05, "loss": 2.4202, "step": 3797 }, { "epoch": 0.38, "learning_rate": 1.4220054422849442e-05, "loss": 2.3483, "step": 3798 }, { "epoch": 0.38, "learning_rate": 1.4217112204167477e-05, "loss": 2.5016, "step": 3799 }, { "epoch": 0.38, "learning_rate": 1.4214169541391971e-05, "loss": 2.3553, "step": 3800 }, { "epoch": 0.38, "learning_rate": 1.4211226434832803e-05, "loss": 2.3715, "step": 3801 }, { "epoch": 0.38, "learning_rate": 1.4208282884799912e-05, "loss": 2.3718, "step": 3802 }, { "epoch": 0.38, "learning_rate": 1.420533889160327e-05, "loss": 2.2479, "step": 3803 }, { "epoch": 0.38, "learning_rate": 1.4202394455552908e-05, "loss": 2.3026, "step": 3804 }, { "epoch": 0.38, "learning_rate": 1.419944957695889e-05, "loss": 2.2528, "step": 3805 }, { "epoch": 0.38, "learning_rate": 1.4196504256131338e-05, "loss": 2.4073, "step": 3806 }, { "epoch": 0.38, "learning_rate": 1.4193558493380418e-05, "loss": 2.4036, "step": 3807 }, { "epoch": 0.38, "learning_rate": 1.4190612289016334e-05, "loss": 2.3735, "step": 3808 }, { "epoch": 0.38, "learning_rate": 1.418766564334935e-05, "loss": 2.3308, "step": 3809 }, { "epoch": 0.38, "learning_rate": 1.4184718556689768e-05, "loss": 2.4978, "step": 3810 }, { "epoch": 0.38, "learning_rate": 1.4181771029347938e-05, "loss": 2.3876, "step": 3811 }, { "epoch": 0.38, "learning_rate": 1.4178823061634254e-05, "loss": 2.3271, "step": 3812 }, { "epoch": 0.38, "learning_rate": 1.4175874653859165e-05, "loss": 2.3237, "step": 3813 }, { "epoch": 0.38, "learning_rate": 1.4172925806333158e-05, "loss": 2.3285, "step": 3814 }, { "epoch": 0.38, "learning_rate": 1.4169976519366763e-05, "loss": 2.402, "step": 3815 }, { "epoch": 0.38, "learning_rate": 1.4167026793270573e-05, "loss": 2.335, "step": 3816 }, { "epoch": 0.38, "learning_rate": 1.4164076628355208e-05, "loss": 2.3814, "step": 3817 }, { "epoch": 0.38, "learning_rate": 1.4161126024931346e-05, "loss": 2.3843, "step": 3818 }, { "epoch": 0.38, "learning_rate": 1.4158174983309705e-05, "loss": 2.5024, "step": 3819 }, { "epoch": 0.38, "learning_rate": 1.4155223503801052e-05, "loss": 2.4274, "step": 3820 }, { "epoch": 0.38, "learning_rate": 1.4152271586716205e-05, "loss": 2.3524, "step": 3821 }, { "epoch": 0.38, "learning_rate": 1.4149319232366017e-05, "loss": 2.3785, "step": 3822 }, { "epoch": 0.38, "learning_rate": 1.4146366441061397e-05, "loss": 2.4439, "step": 3823 }, { "epoch": 0.38, "learning_rate": 1.4143413213113291e-05, "loss": 2.4089, "step": 3824 }, { "epoch": 0.38, "learning_rate": 1.4140459548832702e-05, "loss": 2.2755, "step": 3825 }, { "epoch": 0.38, "learning_rate": 1.4137505448530671e-05, "loss": 2.2666, "step": 3826 }, { "epoch": 0.38, "learning_rate": 1.4134550912518286e-05, "loss": 2.4572, "step": 3827 }, { "epoch": 0.38, "learning_rate": 1.4131595941106681e-05, "loss": 2.4354, "step": 3828 }, { "epoch": 0.38, "learning_rate": 1.4128640534607038e-05, "loss": 2.404, "step": 3829 }, { "epoch": 0.38, "learning_rate": 1.4125684693330586e-05, "loss": 2.3172, "step": 3830 }, { "epoch": 0.38, "learning_rate": 1.4122728417588591e-05, "loss": 2.279, "step": 3831 }, { "epoch": 0.38, "learning_rate": 1.4119771707692374e-05, "loss": 2.4705, "step": 3832 }, { "epoch": 0.38, "learning_rate": 1.4116814563953303e-05, "loss": 2.3012, "step": 3833 }, { "epoch": 0.38, "learning_rate": 1.4113856986682782e-05, "loss": 2.4355, "step": 3834 }, { "epoch": 0.38, "learning_rate": 1.4110898976192267e-05, "loss": 2.3666, "step": 3835 }, { "epoch": 0.38, "learning_rate": 1.410794053279326e-05, "loss": 2.3572, "step": 3836 }, { "epoch": 0.38, "learning_rate": 1.4104981656797307e-05, "loss": 2.2822, "step": 3837 }, { "epoch": 0.38, "learning_rate": 1.4102022348516002e-05, "loss": 2.3622, "step": 3838 }, { "epoch": 0.38, "learning_rate": 1.4099062608260976e-05, "loss": 2.4178, "step": 3839 }, { "epoch": 0.38, "learning_rate": 1.409610243634392e-05, "loss": 2.3251, "step": 3840 }, { "epoch": 0.38, "learning_rate": 1.409314183307655e-05, "loss": 2.4114, "step": 3841 }, { "epoch": 0.38, "learning_rate": 1.4090180798770656e-05, "loss": 2.4234, "step": 3842 }, { "epoch": 0.39, "learning_rate": 1.4087219333738047e-05, "loss": 2.44, "step": 3843 }, { "epoch": 0.39, "learning_rate": 1.4084257438290587e-05, "loss": 2.3251, "step": 3844 }, { "epoch": 0.39, "learning_rate": 1.4081295112740192e-05, "loss": 2.3481, "step": 3845 }, { "epoch": 0.39, "learning_rate": 1.407833235739881e-05, "loss": 2.3415, "step": 3846 }, { "epoch": 0.39, "learning_rate": 1.4075369172578444e-05, "loss": 2.3246, "step": 3847 }, { "epoch": 0.39, "learning_rate": 1.4072405558591142e-05, "loss": 2.3085, "step": 3848 }, { "epoch": 0.39, "learning_rate": 1.4069441515748993e-05, "loss": 2.3596, "step": 3849 }, { "epoch": 0.39, "learning_rate": 1.4066477044364135e-05, "loss": 2.2642, "step": 3850 }, { "epoch": 0.39, "learning_rate": 1.4063512144748745e-05, "loss": 2.3952, "step": 3851 }, { "epoch": 0.39, "learning_rate": 1.4060546817215053e-05, "loss": 2.3586, "step": 3852 }, { "epoch": 0.39, "learning_rate": 1.4057581062075325e-05, "loss": 2.3517, "step": 3853 }, { "epoch": 0.39, "learning_rate": 1.4054614879641884e-05, "loss": 2.3655, "step": 3854 }, { "epoch": 0.39, "learning_rate": 1.4051648270227082e-05, "loss": 2.4057, "step": 3855 }, { "epoch": 0.39, "learning_rate": 1.4048681234143337e-05, "loss": 2.3392, "step": 3856 }, { "epoch": 0.39, "learning_rate": 1.4045713771703093e-05, "loss": 2.3552, "step": 3857 }, { "epoch": 0.39, "learning_rate": 1.4042745883218847e-05, "loss": 2.2811, "step": 3858 }, { "epoch": 0.39, "learning_rate": 1.4039777569003142e-05, "loss": 2.3576, "step": 3859 }, { "epoch": 0.39, "learning_rate": 1.403680882936856e-05, "loss": 2.4899, "step": 3860 }, { "epoch": 0.39, "learning_rate": 1.4033839664627735e-05, "loss": 2.3488, "step": 3861 }, { "epoch": 0.39, "learning_rate": 1.403087007509334e-05, "loss": 2.3887, "step": 3862 }, { "epoch": 0.39, "learning_rate": 1.4027900061078097e-05, "loss": 2.4791, "step": 3863 }, { "epoch": 0.39, "learning_rate": 1.4024929622894768e-05, "loss": 2.4064, "step": 3864 }, { "epoch": 0.39, "learning_rate": 1.4021958760856163e-05, "loss": 2.4609, "step": 3865 }, { "epoch": 0.39, "learning_rate": 1.4018987475275139e-05, "loss": 2.387, "step": 3866 }, { "epoch": 0.39, "learning_rate": 1.4016015766464595e-05, "loss": 2.3451, "step": 3867 }, { "epoch": 0.39, "learning_rate": 1.4013043634737467e-05, "loss": 2.3671, "step": 3868 }, { "epoch": 0.39, "learning_rate": 1.4010071080406751e-05, "loss": 2.4018, "step": 3869 }, { "epoch": 0.39, "learning_rate": 1.4007098103785476e-05, "loss": 2.3506, "step": 3870 }, { "epoch": 0.39, "learning_rate": 1.4004124705186719e-05, "loss": 2.3928, "step": 3871 }, { "epoch": 0.39, "learning_rate": 1.4001150884923601e-05, "loss": 2.3944, "step": 3872 }, { "epoch": 0.39, "learning_rate": 1.3998176643309287e-05, "loss": 2.3981, "step": 3873 }, { "epoch": 0.39, "learning_rate": 1.3995201980656988e-05, "loss": 2.3404, "step": 3874 }, { "epoch": 0.39, "learning_rate": 1.3992226897279957e-05, "loss": 2.3419, "step": 3875 }, { "epoch": 0.39, "learning_rate": 1.3989251393491494e-05, "loss": 2.3021, "step": 3876 }, { "epoch": 0.39, "learning_rate": 1.3986275469604937e-05, "loss": 2.3344, "step": 3877 }, { "epoch": 0.39, "learning_rate": 1.3983299125933683e-05, "loss": 2.4767, "step": 3878 }, { "epoch": 0.39, "learning_rate": 1.3980322362791156e-05, "loss": 2.3217, "step": 3879 }, { "epoch": 0.39, "learning_rate": 1.3977345180490833e-05, "loss": 2.4757, "step": 3880 }, { "epoch": 0.39, "learning_rate": 1.3974367579346236e-05, "loss": 2.3677, "step": 3881 }, { "epoch": 0.39, "learning_rate": 1.3971389559670923e-05, "loss": 2.2842, "step": 3882 }, { "epoch": 0.39, "learning_rate": 1.3968411121778506e-05, "loss": 2.3363, "step": 3883 }, { "epoch": 0.39, "learning_rate": 1.3965432265982638e-05, "loss": 2.4139, "step": 3884 }, { "epoch": 0.39, "learning_rate": 1.396245299259701e-05, "loss": 2.3764, "step": 3885 }, { "epoch": 0.39, "learning_rate": 1.3959473301935367e-05, "loss": 2.3799, "step": 3886 }, { "epoch": 0.39, "learning_rate": 1.395649319431149e-05, "loss": 2.315, "step": 3887 }, { "epoch": 0.39, "learning_rate": 1.3953512670039207e-05, "loss": 2.4736, "step": 3888 }, { "epoch": 0.39, "learning_rate": 1.395053172943239e-05, "loss": 2.2619, "step": 3889 }, { "epoch": 0.39, "learning_rate": 1.3947550372804957e-05, "loss": 2.4256, "step": 3890 }, { "epoch": 0.39, "learning_rate": 1.394456860047086e-05, "loss": 2.3759, "step": 3891 }, { "epoch": 0.39, "learning_rate": 1.394158641274411e-05, "loss": 2.4085, "step": 3892 }, { "epoch": 0.39, "learning_rate": 1.393860380993875e-05, "loss": 2.3505, "step": 3893 }, { "epoch": 0.39, "learning_rate": 1.3935620792368869e-05, "loss": 2.4562, "step": 3894 }, { "epoch": 0.39, "learning_rate": 1.3932637360348603e-05, "loss": 2.4144, "step": 3895 }, { "epoch": 0.39, "learning_rate": 1.3929653514192128e-05, "loss": 2.254, "step": 3896 }, { "epoch": 0.39, "learning_rate": 1.392666925421367e-05, "loss": 2.2893, "step": 3897 }, { "epoch": 0.39, "learning_rate": 1.3923684580727488e-05, "loss": 2.241, "step": 3898 }, { "epoch": 0.39, "learning_rate": 1.3920699494047895e-05, "loss": 2.3592, "step": 3899 }, { "epoch": 0.39, "learning_rate": 1.391771399448924e-05, "loss": 2.2694, "step": 3900 }, { "epoch": 0.39, "learning_rate": 1.391472808236592e-05, "loss": 2.3258, "step": 3901 }, { "epoch": 0.39, "learning_rate": 1.3911741757992378e-05, "loss": 2.4092, "step": 3902 }, { "epoch": 0.39, "learning_rate": 1.390875502168309e-05, "loss": 2.419, "step": 3903 }, { "epoch": 0.39, "learning_rate": 1.3905767873752581e-05, "loss": 2.3251, "step": 3904 }, { "epoch": 0.39, "learning_rate": 1.3902780314515424e-05, "loss": 2.3105, "step": 3905 }, { "epoch": 0.39, "learning_rate": 1.3899792344286232e-05, "loss": 2.3666, "step": 3906 }, { "epoch": 0.39, "learning_rate": 1.3896803963379659e-05, "loss": 2.1883, "step": 3907 }, { "epoch": 0.39, "learning_rate": 1.3893815172110403e-05, "loss": 2.4948, "step": 3908 }, { "epoch": 0.39, "learning_rate": 1.3890825970793205e-05, "loss": 2.3276, "step": 3909 }, { "epoch": 0.39, "learning_rate": 1.3887836359742854e-05, "loss": 2.5387, "step": 3910 }, { "epoch": 0.39, "learning_rate": 1.3884846339274179e-05, "loss": 2.4184, "step": 3911 }, { "epoch": 0.39, "learning_rate": 1.3881855909702049e-05, "loss": 2.293, "step": 3912 }, { "epoch": 0.39, "learning_rate": 1.3878865071341378e-05, "loss": 2.4228, "step": 3913 }, { "epoch": 0.39, "learning_rate": 1.3875873824507124e-05, "loss": 2.3881, "step": 3914 }, { "epoch": 0.39, "learning_rate": 1.387288216951429e-05, "loss": 2.3219, "step": 3915 }, { "epoch": 0.39, "learning_rate": 1.386989010667792e-05, "loss": 2.3576, "step": 3916 }, { "epoch": 0.39, "learning_rate": 1.3866897636313093e-05, "loss": 2.309, "step": 3917 }, { "epoch": 0.39, "learning_rate": 1.386390475873495e-05, "loss": 2.3671, "step": 3918 }, { "epoch": 0.39, "learning_rate": 1.3860911474258653e-05, "loss": 2.4389, "step": 3919 }, { "epoch": 0.39, "learning_rate": 1.3857917783199426e-05, "loss": 2.3433, "step": 3920 }, { "epoch": 0.39, "learning_rate": 1.3854923685872523e-05, "loss": 2.4126, "step": 3921 }, { "epoch": 0.39, "learning_rate": 1.3851929182593247e-05, "loss": 2.4028, "step": 3922 }, { "epoch": 0.39, "learning_rate": 1.3848934273676937e-05, "loss": 2.3069, "step": 3923 }, { "epoch": 0.39, "learning_rate": 1.3845938959438984e-05, "loss": 2.3873, "step": 3924 }, { "epoch": 0.39, "learning_rate": 1.3842943240194815e-05, "loss": 2.364, "step": 3925 }, { "epoch": 0.39, "learning_rate": 1.38399471162599e-05, "loss": 2.2951, "step": 3926 }, { "epoch": 0.39, "learning_rate": 1.3836950587949756e-05, "loss": 2.4084, "step": 3927 }, { "epoch": 0.39, "learning_rate": 1.3833953655579942e-05, "loss": 2.3782, "step": 3928 }, { "epoch": 0.39, "learning_rate": 1.3830956319466053e-05, "loss": 2.4012, "step": 3929 }, { "epoch": 0.39, "learning_rate": 1.3827958579923732e-05, "loss": 2.3351, "step": 3930 }, { "epoch": 0.39, "learning_rate": 1.3824960437268665e-05, "loss": 2.513, "step": 3931 }, { "epoch": 0.39, "learning_rate": 1.3821961891816576e-05, "loss": 2.4048, "step": 3932 }, { "epoch": 0.39, "learning_rate": 1.3818962943883239e-05, "loss": 2.3473, "step": 3933 }, { "epoch": 0.39, "learning_rate": 1.3815963593784463e-05, "loss": 2.4173, "step": 3934 }, { "epoch": 0.39, "learning_rate": 1.38129638418361e-05, "loss": 2.3823, "step": 3935 }, { "epoch": 0.39, "learning_rate": 1.380996368835405e-05, "loss": 2.4371, "step": 3936 }, { "epoch": 0.39, "learning_rate": 1.3806963133654253e-05, "loss": 2.3715, "step": 3937 }, { "epoch": 0.39, "learning_rate": 1.3803962178052683e-05, "loss": 2.2821, "step": 3938 }, { "epoch": 0.39, "learning_rate": 1.3800960821865368e-05, "loss": 2.3266, "step": 3939 }, { "epoch": 0.39, "learning_rate": 1.3797959065408372e-05, "loss": 2.4092, "step": 3940 }, { "epoch": 0.39, "learning_rate": 1.3794956908997806e-05, "loss": 2.3896, "step": 3941 }, { "epoch": 0.39, "learning_rate": 1.3791954352949812e-05, "loss": 2.4567, "step": 3942 }, { "epoch": 0.4, "learning_rate": 1.378895139758059e-05, "loss": 2.3377, "step": 3943 }, { "epoch": 0.4, "learning_rate": 1.3785948043206369e-05, "loss": 2.3939, "step": 3944 }, { "epoch": 0.4, "learning_rate": 1.3782944290143427e-05, "loss": 2.3152, "step": 3945 }, { "epoch": 0.4, "learning_rate": 1.3779940138708079e-05, "loss": 2.4372, "step": 3946 }, { "epoch": 0.4, "learning_rate": 1.3776935589216687e-05, "loss": 2.3783, "step": 3947 }, { "epoch": 0.4, "learning_rate": 1.3773930641985652e-05, "loss": 2.4412, "step": 3948 }, { "epoch": 0.4, "learning_rate": 1.3770925297331413e-05, "loss": 2.3719, "step": 3949 }, { "epoch": 0.4, "learning_rate": 1.3767919555570463e-05, "loss": 2.3852, "step": 3950 }, { "epoch": 0.4, "learning_rate": 1.3764913417019326e-05, "loss": 2.4067, "step": 3951 }, { "epoch": 0.4, "learning_rate": 1.3761906881994568e-05, "loss": 2.3282, "step": 3952 }, { "epoch": 0.4, "learning_rate": 1.3758899950812805e-05, "loss": 2.3848, "step": 3953 }, { "epoch": 0.4, "learning_rate": 1.3755892623790688e-05, "loss": 2.4476, "step": 3954 }, { "epoch": 0.4, "learning_rate": 1.3752884901244907e-05, "loss": 2.433, "step": 3955 }, { "epoch": 0.4, "learning_rate": 1.3749876783492203e-05, "loss": 2.3929, "step": 3956 }, { "epoch": 0.4, "learning_rate": 1.3746868270849349e-05, "loss": 2.3788, "step": 3957 }, { "epoch": 0.4, "learning_rate": 1.3743859363633165e-05, "loss": 2.3032, "step": 3958 }, { "epoch": 0.4, "learning_rate": 1.3740850062160513e-05, "loss": 2.3601, "step": 3959 }, { "epoch": 0.4, "learning_rate": 1.3737840366748297e-05, "loss": 2.3268, "step": 3960 }, { "epoch": 0.4, "learning_rate": 1.3734830277713457e-05, "loss": 2.4333, "step": 3961 }, { "epoch": 0.4, "learning_rate": 1.3731819795372973e-05, "loss": 2.2907, "step": 3962 }, { "epoch": 0.4, "learning_rate": 1.372880892004388e-05, "loss": 2.3253, "step": 3963 }, { "epoch": 0.4, "learning_rate": 1.3725797652043247e-05, "loss": 2.4262, "step": 3964 }, { "epoch": 0.4, "learning_rate": 1.3722785991688176e-05, "loss": 2.3388, "step": 3965 }, { "epoch": 0.4, "learning_rate": 1.3719773939295824e-05, "loss": 2.4468, "step": 3966 }, { "epoch": 0.4, "learning_rate": 1.3716761495183374e-05, "loss": 2.4442, "step": 3967 }, { "epoch": 0.4, "learning_rate": 1.3713748659668067e-05, "loss": 2.2725, "step": 3968 }, { "epoch": 0.4, "learning_rate": 1.3710735433067175e-05, "loss": 2.3648, "step": 3969 }, { "epoch": 0.4, "learning_rate": 1.3707721815698012e-05, "loss": 2.3444, "step": 3970 }, { "epoch": 0.4, "learning_rate": 1.3704707807877933e-05, "loss": 2.3978, "step": 3971 }, { "epoch": 0.4, "learning_rate": 1.370169340992434e-05, "loss": 2.2636, "step": 3972 }, { "epoch": 0.4, "learning_rate": 1.3698678622154668e-05, "loss": 2.417, "step": 3973 }, { "epoch": 0.4, "learning_rate": 1.3695663444886397e-05, "loss": 2.3834, "step": 3974 }, { "epoch": 0.4, "learning_rate": 1.3692647878437053e-05, "loss": 2.4061, "step": 3975 }, { "epoch": 0.4, "learning_rate": 1.3689631923124194e-05, "loss": 2.3869, "step": 3976 }, { "epoch": 0.4, "learning_rate": 1.3686615579265419e-05, "loss": 2.3822, "step": 3977 }, { "epoch": 0.4, "learning_rate": 1.3683598847178376e-05, "loss": 2.3874, "step": 3978 }, { "epoch": 0.4, "learning_rate": 1.368058172718075e-05, "loss": 2.4537, "step": 3979 }, { "epoch": 0.4, "learning_rate": 1.3677564219590262e-05, "loss": 2.3747, "step": 3980 }, { "epoch": 0.4, "learning_rate": 1.3674546324724685e-05, "loss": 2.4273, "step": 3981 }, { "epoch": 0.4, "learning_rate": 1.367152804290182e-05, "loss": 2.4326, "step": 3982 }, { "epoch": 0.4, "learning_rate": 1.3668509374439518e-05, "loss": 2.4397, "step": 3983 }, { "epoch": 0.4, "learning_rate": 1.3665490319655666e-05, "loss": 2.3551, "step": 3984 }, { "epoch": 0.4, "learning_rate": 1.3662470878868192e-05, "loss": 2.3425, "step": 3985 }, { "epoch": 0.4, "learning_rate": 1.3659451052395069e-05, "loss": 2.311, "step": 3986 }, { "epoch": 0.4, "learning_rate": 1.3656430840554306e-05, "loss": 2.3904, "step": 3987 }, { "epoch": 0.4, "learning_rate": 1.3653410243663953e-05, "loss": 2.396, "step": 3988 }, { "epoch": 0.4, "learning_rate": 1.3650389262042101e-05, "loss": 2.3607, "step": 3989 }, { "epoch": 0.4, "learning_rate": 1.3647367896006882e-05, "loss": 2.2791, "step": 3990 }, { "epoch": 0.4, "learning_rate": 1.3644346145876473e-05, "loss": 2.3573, "step": 3991 }, { "epoch": 0.4, "learning_rate": 1.3641324011969079e-05, "loss": 2.3433, "step": 3992 }, { "epoch": 0.4, "learning_rate": 1.3638301494602964e-05, "loss": 2.4726, "step": 3993 }, { "epoch": 0.4, "learning_rate": 1.3635278594096408e-05, "loss": 2.4577, "step": 3994 }, { "epoch": 0.4, "learning_rate": 1.3632255310767757e-05, "loss": 2.4177, "step": 3995 }, { "epoch": 0.4, "learning_rate": 1.3629231644935382e-05, "loss": 2.3449, "step": 3996 }, { "epoch": 0.4, "learning_rate": 1.3626207596917695e-05, "loss": 2.4124, "step": 3997 }, { "epoch": 0.4, "learning_rate": 1.3623183167033154e-05, "loss": 2.4608, "step": 3998 }, { "epoch": 0.4, "learning_rate": 1.3620158355600253e-05, "loss": 2.5012, "step": 3999 }, { "epoch": 0.4, "learning_rate": 1.3617133162937525e-05, "loss": 2.3768, "step": 4000 }, { "epoch": 0.4, "learning_rate": 1.361410758936355e-05, "loss": 2.3699, "step": 4001 }, { "epoch": 0.4, "learning_rate": 1.3611081635196938e-05, "loss": 2.4146, "step": 4002 }, { "epoch": 0.4, "learning_rate": 1.360805530075635e-05, "loss": 2.3384, "step": 4003 }, { "epoch": 0.4, "learning_rate": 1.360502858636048e-05, "loss": 2.4701, "step": 4004 }, { "epoch": 0.4, "learning_rate": 1.3602001492328065e-05, "loss": 2.4201, "step": 4005 }, { "epoch": 0.4, "learning_rate": 1.3598974018977877e-05, "loss": 2.3019, "step": 4006 }, { "epoch": 0.4, "learning_rate": 1.3595946166628735e-05, "loss": 2.4657, "step": 4007 }, { "epoch": 0.4, "learning_rate": 1.3592917935599493e-05, "loss": 2.3927, "step": 4008 }, { "epoch": 0.4, "learning_rate": 1.3589889326209044e-05, "loss": 2.3668, "step": 4009 }, { "epoch": 0.4, "learning_rate": 1.3586860338776329e-05, "loss": 2.3884, "step": 4010 }, { "epoch": 0.4, "learning_rate": 1.3583830973620318e-05, "loss": 2.3849, "step": 4011 }, { "epoch": 0.4, "learning_rate": 1.358080123106003e-05, "loss": 2.3895, "step": 4012 }, { "epoch": 0.4, "learning_rate": 1.3577771111414517e-05, "loss": 2.3881, "step": 4013 }, { "epoch": 0.4, "learning_rate": 1.3574740615002874e-05, "loss": 2.4572, "step": 4014 }, { "epoch": 0.4, "learning_rate": 1.3571709742144234e-05, "loss": 2.2854, "step": 4015 }, { "epoch": 0.4, "learning_rate": 1.3568678493157772e-05, "loss": 2.4107, "step": 4016 }, { "epoch": 0.4, "learning_rate": 1.35656468683627e-05, "loss": 2.3418, "step": 4017 }, { "epoch": 0.4, "learning_rate": 1.3562614868078275e-05, "loss": 2.3832, "step": 4018 }, { "epoch": 0.4, "learning_rate": 1.3559582492623783e-05, "loss": 2.3351, "step": 4019 }, { "epoch": 0.4, "learning_rate": 1.3556549742318559e-05, "loss": 2.3802, "step": 4020 }, { "epoch": 0.4, "learning_rate": 1.3553516617481974e-05, "loss": 2.3868, "step": 4021 }, { "epoch": 0.4, "learning_rate": 1.355048311843344e-05, "loss": 2.3548, "step": 4022 }, { "epoch": 0.4, "learning_rate": 1.3547449245492406e-05, "loss": 2.3362, "step": 4023 }, { "epoch": 0.4, "learning_rate": 1.3544414998978361e-05, "loss": 2.378, "step": 4024 }, { "epoch": 0.4, "learning_rate": 1.3541380379210836e-05, "loss": 2.3689, "step": 4025 }, { "epoch": 0.4, "learning_rate": 1.3538345386509394e-05, "loss": 2.3112, "step": 4026 }, { "epoch": 0.4, "learning_rate": 1.3535310021193653e-05, "loss": 2.3218, "step": 4027 }, { "epoch": 0.4, "learning_rate": 1.3532274283583249e-05, "loss": 2.3308, "step": 4028 }, { "epoch": 0.4, "learning_rate": 1.3529238173997874e-05, "loss": 2.3255, "step": 4029 }, { "epoch": 0.4, "learning_rate": 1.352620169275725e-05, "loss": 2.4729, "step": 4030 }, { "epoch": 0.4, "learning_rate": 1.3523164840181143e-05, "loss": 2.406, "step": 4031 }, { "epoch": 0.4, "learning_rate": 1.3520127616589355e-05, "loss": 2.3593, "step": 4032 }, { "epoch": 0.4, "learning_rate": 1.3517090022301731e-05, "loss": 2.4197, "step": 4033 }, { "epoch": 0.4, "learning_rate": 1.3514052057638148e-05, "loss": 2.2956, "step": 4034 }, { "epoch": 0.4, "learning_rate": 1.351101372291853e-05, "loss": 2.3868, "step": 4035 }, { "epoch": 0.4, "learning_rate": 1.3507975018462835e-05, "loss": 2.3837, "step": 4036 }, { "epoch": 0.4, "learning_rate": 1.3504935944591064e-05, "loss": 2.4299, "step": 4037 }, { "epoch": 0.4, "learning_rate": 1.3501896501623253e-05, "loss": 2.4113, "step": 4038 }, { "epoch": 0.4, "learning_rate": 1.3498856689879474e-05, "loss": 2.3154, "step": 4039 }, { "epoch": 0.4, "learning_rate": 1.3495816509679847e-05, "loss": 2.398, "step": 4040 }, { "epoch": 0.4, "learning_rate": 1.3492775961344525e-05, "loss": 2.3682, "step": 4041 }, { "epoch": 0.4, "learning_rate": 1.34897350451937e-05, "loss": 2.3784, "step": 4042 }, { "epoch": 0.41, "learning_rate": 1.3486693761547597e-05, "loss": 2.2899, "step": 4043 }, { "epoch": 0.41, "learning_rate": 1.3483652110726498e-05, "loss": 2.2811, "step": 4044 }, { "epoch": 0.41, "learning_rate": 1.3480610093050703e-05, "loss": 2.3958, "step": 4045 }, { "epoch": 0.41, "learning_rate": 1.3477567708840565e-05, "loss": 2.3283, "step": 4046 }, { "epoch": 0.41, "learning_rate": 1.3474524958416462e-05, "loss": 2.3358, "step": 4047 }, { "epoch": 0.41, "learning_rate": 1.3471481842098826e-05, "loss": 2.356, "step": 4048 }, { "epoch": 0.41, "learning_rate": 1.3468438360208117e-05, "loss": 2.3574, "step": 4049 }, { "epoch": 0.41, "learning_rate": 1.3465394513064838e-05, "loss": 2.367, "step": 4050 }, { "epoch": 0.41, "learning_rate": 1.3462350300989526e-05, "loss": 2.3439, "step": 4051 }, { "epoch": 0.41, "learning_rate": 1.3459305724302758e-05, "loss": 2.3963, "step": 4052 }, { "epoch": 0.41, "learning_rate": 1.3456260783325157e-05, "loss": 2.435, "step": 4053 }, { "epoch": 0.41, "learning_rate": 1.3453215478377374e-05, "loss": 2.2345, "step": 4054 }, { "epoch": 0.41, "learning_rate": 1.3450169809780105e-05, "loss": 2.348, "step": 4055 }, { "epoch": 0.41, "learning_rate": 1.3447123777854074e-05, "loss": 2.4249, "step": 4056 }, { "epoch": 0.41, "learning_rate": 1.3444077382920063e-05, "loss": 2.4014, "step": 4057 }, { "epoch": 0.41, "learning_rate": 1.3441030625298872e-05, "loss": 2.2786, "step": 4058 }, { "epoch": 0.41, "learning_rate": 1.343798350531135e-05, "loss": 2.3582, "step": 4059 }, { "epoch": 0.41, "learning_rate": 1.3434936023278382e-05, "loss": 2.2972, "step": 4060 }, { "epoch": 0.41, "learning_rate": 1.343188817952089e-05, "loss": 2.4367, "step": 4061 }, { "epoch": 0.41, "learning_rate": 1.3428839974359834e-05, "loss": 2.3217, "step": 4062 }, { "epoch": 0.41, "learning_rate": 1.3425791408116213e-05, "loss": 2.3618, "step": 4063 }, { "epoch": 0.41, "learning_rate": 1.3422742481111064e-05, "loss": 2.3376, "step": 4064 }, { "epoch": 0.41, "learning_rate": 1.3419693193665461e-05, "loss": 2.4563, "step": 4065 }, { "epoch": 0.41, "learning_rate": 1.341664354610052e-05, "loss": 2.3278, "step": 4066 }, { "epoch": 0.41, "learning_rate": 1.341359353873739e-05, "loss": 2.3797, "step": 4067 }, { "epoch": 0.41, "learning_rate": 1.3410543171897262e-05, "loss": 2.3743, "step": 4068 }, { "epoch": 0.41, "learning_rate": 1.3407492445901357e-05, "loss": 2.3914, "step": 4069 }, { "epoch": 0.41, "learning_rate": 1.3404441361070944e-05, "loss": 2.4058, "step": 4070 }, { "epoch": 0.41, "learning_rate": 1.3401389917727323e-05, "loss": 2.3967, "step": 4071 }, { "epoch": 0.41, "learning_rate": 1.3398338116191833e-05, "loss": 2.4047, "step": 4072 }, { "epoch": 0.41, "learning_rate": 1.3395285956785855e-05, "loss": 2.4277, "step": 4073 }, { "epoch": 0.41, "learning_rate": 1.33922334398308e-05, "loss": 2.3237, "step": 4074 }, { "epoch": 0.41, "learning_rate": 1.3389180565648125e-05, "loss": 2.385, "step": 4075 }, { "epoch": 0.41, "learning_rate": 1.3386127334559318e-05, "loss": 2.3675, "step": 4076 }, { "epoch": 0.41, "learning_rate": 1.3383073746885908e-05, "loss": 2.3882, "step": 4077 }, { "epoch": 0.41, "learning_rate": 1.3380019802949462e-05, "loss": 2.3969, "step": 4078 }, { "epoch": 0.41, "learning_rate": 1.337696550307158e-05, "loss": 2.4032, "step": 4079 }, { "epoch": 0.41, "learning_rate": 1.3373910847573903e-05, "loss": 2.2919, "step": 4080 }, { "epoch": 0.41, "learning_rate": 1.3370855836778114e-05, "loss": 2.2913, "step": 4081 }, { "epoch": 0.41, "learning_rate": 1.3367800471005926e-05, "loss": 2.385, "step": 4082 }, { "epoch": 0.41, "learning_rate": 1.3364744750579086e-05, "loss": 2.3461, "step": 4083 }, { "epoch": 0.41, "learning_rate": 1.3361688675819393e-05, "loss": 2.3466, "step": 4084 }, { "epoch": 0.41, "learning_rate": 1.335863224704867e-05, "loss": 2.222, "step": 4085 }, { "epoch": 0.41, "learning_rate": 1.3355575464588784e-05, "loss": 2.3897, "step": 4086 }, { "epoch": 0.41, "learning_rate": 1.3352518328761633e-05, "loss": 2.3698, "step": 4087 }, { "epoch": 0.41, "learning_rate": 1.3349460839889158e-05, "loss": 2.3872, "step": 4088 }, { "epoch": 0.41, "learning_rate": 1.3346402998293342e-05, "loss": 2.4641, "step": 4089 }, { "epoch": 0.41, "learning_rate": 1.334334480429619e-05, "loss": 2.3787, "step": 4090 }, { "epoch": 0.41, "learning_rate": 1.334028625821976e-05, "loss": 2.4383, "step": 4091 }, { "epoch": 0.41, "learning_rate": 1.3337227360386131e-05, "loss": 2.3588, "step": 4092 }, { "epoch": 0.41, "learning_rate": 1.3334168111117435e-05, "loss": 2.4365, "step": 4093 }, { "epoch": 0.41, "learning_rate": 1.3331108510735833e-05, "loss": 2.3187, "step": 4094 }, { "epoch": 0.41, "learning_rate": 1.3328048559563522e-05, "loss": 2.4634, "step": 4095 }, { "epoch": 0.41, "learning_rate": 1.3324988257922734e-05, "loss": 2.3585, "step": 4096 }, { "epoch": 0.41, "learning_rate": 1.3321927606135755e-05, "loss": 2.3659, "step": 4097 }, { "epoch": 0.41, "learning_rate": 1.3318866604524878e-05, "loss": 2.4377, "step": 4098 }, { "epoch": 0.41, "learning_rate": 1.3315805253412462e-05, "loss": 2.3813, "step": 4099 }, { "epoch": 0.41, "learning_rate": 1.3312743553120883e-05, "loss": 2.4264, "step": 4100 }, { "epoch": 0.41, "learning_rate": 1.3309681503972564e-05, "loss": 2.3759, "step": 4101 }, { "epoch": 0.41, "learning_rate": 1.3306619106289963e-05, "loss": 2.3075, "step": 4102 }, { "epoch": 0.41, "learning_rate": 1.3303556360395569e-05, "loss": 2.3038, "step": 4103 }, { "epoch": 0.41, "learning_rate": 1.3300493266611914e-05, "loss": 2.3171, "step": 4104 }, { "epoch": 0.41, "learning_rate": 1.3297429825261565e-05, "loss": 2.459, "step": 4105 }, { "epoch": 0.41, "learning_rate": 1.3294366036667128e-05, "loss": 2.3709, "step": 4106 }, { "epoch": 0.41, "learning_rate": 1.3291301901151241e-05, "loss": 2.4054, "step": 4107 }, { "epoch": 0.41, "learning_rate": 1.328823741903658e-05, "loss": 2.4041, "step": 4108 }, { "epoch": 0.41, "learning_rate": 1.3285172590645859e-05, "loss": 2.3708, "step": 4109 }, { "epoch": 0.41, "learning_rate": 1.3282107416301822e-05, "loss": 2.3499, "step": 4110 }, { "epoch": 0.41, "learning_rate": 1.3279041896327263e-05, "loss": 2.4823, "step": 4111 }, { "epoch": 0.41, "learning_rate": 1.3275976031045002e-05, "loss": 2.4643, "step": 4112 }, { "epoch": 0.41, "learning_rate": 1.3272909820777893e-05, "loss": 2.2614, "step": 4113 }, { "epoch": 0.41, "learning_rate": 1.3269843265848836e-05, "loss": 2.3244, "step": 4114 }, { "epoch": 0.41, "learning_rate": 1.326677636658076e-05, "loss": 2.3223, "step": 4115 }, { "epoch": 0.41, "learning_rate": 1.3263709123296633e-05, "loss": 2.3199, "step": 4116 }, { "epoch": 0.41, "learning_rate": 1.3260641536319458e-05, "loss": 2.397, "step": 4117 }, { "epoch": 0.41, "learning_rate": 1.3257573605972276e-05, "loss": 2.4196, "step": 4118 }, { "epoch": 0.41, "learning_rate": 1.3254505332578163e-05, "loss": 2.3328, "step": 4119 }, { "epoch": 0.41, "learning_rate": 1.3251436716460228e-05, "loss": 2.379, "step": 4120 }, { "epoch": 0.41, "learning_rate": 1.3248367757941627e-05, "loss": 2.3808, "step": 4121 }, { "epoch": 0.41, "learning_rate": 1.3245298457345536e-05, "loss": 2.4827, "step": 4122 }, { "epoch": 0.41, "learning_rate": 1.324222881499518e-05, "loss": 2.398, "step": 4123 }, { "epoch": 0.41, "learning_rate": 1.3239158831213814e-05, "loss": 2.2767, "step": 4124 }, { "epoch": 0.41, "learning_rate": 1.3236088506324731e-05, "loss": 2.298, "step": 4125 }, { "epoch": 0.41, "learning_rate": 1.3233017840651259e-05, "loss": 2.247, "step": 4126 }, { "epoch": 0.41, "learning_rate": 1.322994683451676e-05, "loss": 2.4116, "step": 4127 }, { "epoch": 0.41, "learning_rate": 1.3226875488244635e-05, "loss": 2.3441, "step": 4128 }, { "epoch": 0.41, "learning_rate": 1.3223803802158324e-05, "loss": 2.3316, "step": 4129 }, { "epoch": 0.41, "learning_rate": 1.3220731776581292e-05, "loss": 2.4456, "step": 4130 }, { "epoch": 0.41, "learning_rate": 1.3217659411837053e-05, "loss": 2.4262, "step": 4131 }, { "epoch": 0.41, "learning_rate": 1.3214586708249142e-05, "loss": 2.3113, "step": 4132 }, { "epoch": 0.41, "learning_rate": 1.3211513666141148e-05, "loss": 2.2934, "step": 4133 }, { "epoch": 0.41, "learning_rate": 1.3208440285836677e-05, "loss": 2.2901, "step": 4134 }, { "epoch": 0.41, "learning_rate": 1.3205366567659381e-05, "loss": 2.4312, "step": 4135 }, { "epoch": 0.41, "learning_rate": 1.3202292511932948e-05, "loss": 2.307, "step": 4136 }, { "epoch": 0.41, "learning_rate": 1.3199218118981093e-05, "loss": 2.2603, "step": 4137 }, { "epoch": 0.41, "learning_rate": 1.319614338912758e-05, "loss": 2.3488, "step": 4138 }, { "epoch": 0.41, "learning_rate": 1.31930683226962e-05, "loss": 2.3408, "step": 4139 }, { "epoch": 0.41, "learning_rate": 1.3189992920010777e-05, "loss": 2.3295, "step": 4140 }, { "epoch": 0.41, "learning_rate": 1.3186917181395174e-05, "loss": 2.4158, "step": 4141 }, { "epoch": 0.41, "learning_rate": 1.3183841107173291e-05, "loss": 2.3272, "step": 4142 }, { "epoch": 0.42, "learning_rate": 1.3180764697669066e-05, "loss": 2.3775, "step": 4143 }, { "epoch": 0.42, "learning_rate": 1.3177687953206459e-05, "loss": 2.3447, "step": 4144 }, { "epoch": 0.42, "learning_rate": 1.3174610874109484e-05, "loss": 2.4043, "step": 4145 }, { "epoch": 0.42, "learning_rate": 1.3171533460702173e-05, "loss": 2.4183, "step": 4146 }, { "epoch": 0.42, "learning_rate": 1.3168455713308601e-05, "loss": 2.2882, "step": 4147 }, { "epoch": 0.42, "learning_rate": 1.3165377632252883e-05, "loss": 2.3875, "step": 4148 }, { "epoch": 0.42, "learning_rate": 1.3162299217859161e-05, "loss": 2.407, "step": 4149 }, { "epoch": 0.42, "learning_rate": 1.315922047045161e-05, "loss": 2.3784, "step": 4150 }, { "epoch": 0.42, "learning_rate": 1.3156141390354456e-05, "loss": 2.3389, "step": 4151 }, { "epoch": 0.42, "learning_rate": 1.3153061977891941e-05, "loss": 2.3394, "step": 4152 }, { "epoch": 0.42, "learning_rate": 1.3149982233388355e-05, "loss": 2.3557, "step": 4153 }, { "epoch": 0.42, "learning_rate": 1.3146902157168015e-05, "loss": 2.3841, "step": 4154 }, { "epoch": 0.42, "learning_rate": 1.3143821749555276e-05, "loss": 2.3254, "step": 4155 }, { "epoch": 0.42, "learning_rate": 1.314074101087453e-05, "loss": 2.4405, "step": 4156 }, { "epoch": 0.42, "learning_rate": 1.3137659941450203e-05, "loss": 2.3585, "step": 4157 }, { "epoch": 0.42, "learning_rate": 1.313457854160675e-05, "loss": 2.4839, "step": 4158 }, { "epoch": 0.42, "learning_rate": 1.313149681166867e-05, "loss": 2.3751, "step": 4159 }, { "epoch": 0.42, "learning_rate": 1.312841475196049e-05, "loss": 2.3408, "step": 4160 }, { "epoch": 0.42, "learning_rate": 1.3125332362806773e-05, "loss": 2.3202, "step": 4161 }, { "epoch": 0.42, "learning_rate": 1.3122249644532122e-05, "loss": 2.23, "step": 4162 }, { "epoch": 0.42, "learning_rate": 1.3119166597461166e-05, "loss": 2.3616, "step": 4163 }, { "epoch": 0.42, "learning_rate": 1.3116083221918575e-05, "loss": 2.3531, "step": 4164 }, { "epoch": 0.42, "learning_rate": 1.3112999518229052e-05, "loss": 2.3727, "step": 4165 }, { "epoch": 0.42, "learning_rate": 1.3109915486717333e-05, "loss": 2.3761, "step": 4166 }, { "epoch": 0.42, "learning_rate": 1.310683112770819e-05, "loss": 2.3011, "step": 4167 }, { "epoch": 0.42, "learning_rate": 1.3103746441526426e-05, "loss": 2.4357, "step": 4168 }, { "epoch": 0.42, "learning_rate": 1.3100661428496888e-05, "loss": 2.2726, "step": 4169 }, { "epoch": 0.42, "learning_rate": 1.3097576088944445e-05, "loss": 2.3958, "step": 4170 }, { "epoch": 0.42, "learning_rate": 1.3094490423194012e-05, "loss": 2.3491, "step": 4171 }, { "epoch": 0.42, "learning_rate": 1.3091404431570526e-05, "loss": 2.2743, "step": 4172 }, { "epoch": 0.42, "learning_rate": 1.3088318114398973e-05, "loss": 2.364, "step": 4173 }, { "epoch": 0.42, "learning_rate": 1.3085231472004361e-05, "loss": 2.3736, "step": 4174 }, { "epoch": 0.42, "learning_rate": 1.3082144504711736e-05, "loss": 2.4022, "step": 4175 }, { "epoch": 0.42, "learning_rate": 1.3079057212846178e-05, "loss": 2.3203, "step": 4176 }, { "epoch": 0.42, "learning_rate": 1.3075969596732807e-05, "loss": 2.4033, "step": 4177 }, { "epoch": 0.42, "learning_rate": 1.3072881656696766e-05, "loss": 2.4144, "step": 4178 }, { "epoch": 0.42, "learning_rate": 1.3069793393063241e-05, "loss": 2.4278, "step": 4179 }, { "epoch": 0.42, "learning_rate": 1.306670480615745e-05, "loss": 2.3553, "step": 4180 }, { "epoch": 0.42, "learning_rate": 1.3063615896304643e-05, "loss": 2.4225, "step": 4181 }, { "epoch": 0.42, "learning_rate": 1.3060526663830106e-05, "loss": 2.3609, "step": 4182 }, { "epoch": 0.42, "learning_rate": 1.305743710905916e-05, "loss": 2.3709, "step": 4183 }, { "epoch": 0.42, "learning_rate": 1.3054347232317154e-05, "loss": 2.3139, "step": 4184 }, { "epoch": 0.42, "learning_rate": 1.3051257033929482e-05, "loss": 2.3907, "step": 4185 }, { "epoch": 0.42, "learning_rate": 1.304816651422156e-05, "loss": 2.2965, "step": 4186 }, { "epoch": 0.42, "learning_rate": 1.304507567351884e-05, "loss": 2.3702, "step": 4187 }, { "epoch": 0.42, "learning_rate": 1.3041984512146819e-05, "loss": 2.3665, "step": 4188 }, { "epoch": 0.42, "learning_rate": 1.3038893030431013e-05, "loss": 2.4155, "step": 4189 }, { "epoch": 0.42, "learning_rate": 1.3035801228696979e-05, "loss": 2.4449, "step": 4190 }, { "epoch": 0.42, "learning_rate": 1.303270910727031e-05, "loss": 2.3542, "step": 4191 }, { "epoch": 0.42, "learning_rate": 1.3029616666476626e-05, "loss": 2.3018, "step": 4192 }, { "epoch": 0.42, "learning_rate": 1.3026523906641586e-05, "loss": 2.4166, "step": 4193 }, { "epoch": 0.42, "learning_rate": 1.3023430828090883e-05, "loss": 2.2831, "step": 4194 }, { "epoch": 0.42, "learning_rate": 1.3020337431150237e-05, "loss": 2.4054, "step": 4195 }, { "epoch": 0.42, "learning_rate": 1.3017243716145407e-05, "loss": 2.3648, "step": 4196 }, { "epoch": 0.42, "learning_rate": 1.3014149683402191e-05, "loss": 2.4293, "step": 4197 }, { "epoch": 0.42, "learning_rate": 1.3011055333246406e-05, "loss": 2.427, "step": 4198 }, { "epoch": 0.42, "learning_rate": 1.3007960666003907e-05, "loss": 2.2793, "step": 4199 }, { "epoch": 0.42, "learning_rate": 1.3004865682000596e-05, "loss": 2.3996, "step": 4200 }, { "epoch": 0.42, "learning_rate": 1.3001770381562392e-05, "loss": 2.4545, "step": 4201 }, { "epoch": 0.42, "learning_rate": 1.2998674765015255e-05, "loss": 2.3881, "step": 4202 }, { "epoch": 0.42, "learning_rate": 1.2995578832685176e-05, "loss": 2.4206, "step": 4203 }, { "epoch": 0.42, "learning_rate": 1.299248258489818e-05, "loss": 2.4548, "step": 4204 }, { "epoch": 0.42, "learning_rate": 1.2989386021980325e-05, "loss": 2.4049, "step": 4205 }, { "epoch": 0.42, "learning_rate": 1.2986289144257705e-05, "loss": 2.3413, "step": 4206 }, { "epoch": 0.42, "learning_rate": 1.298319195205644e-05, "loss": 2.3199, "step": 4207 }, { "epoch": 0.42, "learning_rate": 1.2980094445702689e-05, "loss": 2.4139, "step": 4208 }, { "epoch": 0.42, "learning_rate": 1.2976996625522644e-05, "loss": 2.4033, "step": 4209 }, { "epoch": 0.42, "learning_rate": 1.2973898491842528e-05, "loss": 2.3496, "step": 4210 }, { "epoch": 0.42, "learning_rate": 1.2970800044988598e-05, "loss": 2.2641, "step": 4211 }, { "epoch": 0.42, "learning_rate": 1.2967701285287141e-05, "loss": 2.2654, "step": 4212 }, { "epoch": 0.42, "learning_rate": 1.2964602213064482e-05, "loss": 2.5034, "step": 4213 }, { "epoch": 0.42, "learning_rate": 1.2961502828646979e-05, "loss": 2.3549, "step": 4214 }, { "epoch": 0.42, "learning_rate": 1.2958403132361017e-05, "loss": 2.3299, "step": 4215 }, { "epoch": 0.42, "learning_rate": 1.2955303124533018e-05, "loss": 2.4054, "step": 4216 }, { "epoch": 0.42, "learning_rate": 1.2952202805489435e-05, "loss": 2.4536, "step": 4217 }, { "epoch": 0.42, "learning_rate": 1.2949102175556758e-05, "loss": 2.4748, "step": 4218 }, { "epoch": 0.42, "learning_rate": 1.2946001235061504e-05, "loss": 2.3697, "step": 4219 }, { "epoch": 0.42, "learning_rate": 1.2942899984330225e-05, "loss": 2.3337, "step": 4220 }, { "epoch": 0.42, "learning_rate": 1.293979842368951e-05, "loss": 2.3319, "step": 4221 }, { "epoch": 0.42, "learning_rate": 1.2936696553465968e-05, "loss": 2.3522, "step": 4222 }, { "epoch": 0.42, "learning_rate": 1.2933594373986257e-05, "loss": 2.3833, "step": 4223 }, { "epoch": 0.42, "learning_rate": 1.293049188557706e-05, "loss": 2.3693, "step": 4224 }, { "epoch": 0.42, "learning_rate": 1.2927389088565088e-05, "loss": 2.3954, "step": 4225 }, { "epoch": 0.42, "learning_rate": 1.2924285983277089e-05, "loss": 2.3482, "step": 4226 }, { "epoch": 0.42, "learning_rate": 1.2921182570039848e-05, "loss": 2.3935, "step": 4227 }, { "epoch": 0.42, "learning_rate": 1.2918078849180171e-05, "loss": 2.4044, "step": 4228 }, { "epoch": 0.42, "learning_rate": 1.2914974821024912e-05, "loss": 2.4702, "step": 4229 }, { "epoch": 0.42, "learning_rate": 1.2911870485900939e-05, "loss": 2.3397, "step": 4230 }, { "epoch": 0.42, "learning_rate": 1.2908765844135165e-05, "loss": 2.3646, "step": 4231 }, { "epoch": 0.42, "learning_rate": 1.2905660896054535e-05, "loss": 2.303, "step": 4232 }, { "epoch": 0.42, "learning_rate": 1.2902555641986021e-05, "loss": 2.3531, "step": 4233 }, { "epoch": 0.42, "learning_rate": 1.2899450082256629e-05, "loss": 2.405, "step": 4234 }, { "epoch": 0.42, "learning_rate": 1.2896344217193396e-05, "loss": 2.2888, "step": 4235 }, { "epoch": 0.42, "learning_rate": 1.28932380471234e-05, "loss": 2.3558, "step": 4236 }, { "epoch": 0.42, "learning_rate": 1.2890131572373736e-05, "loss": 2.3261, "step": 4237 }, { "epoch": 0.42, "learning_rate": 1.2887024793271544e-05, "loss": 2.2832, "step": 4238 }, { "epoch": 0.42, "learning_rate": 1.288391771014399e-05, "loss": 2.3639, "step": 4239 }, { "epoch": 0.42, "learning_rate": 1.288081032331827e-05, "loss": 2.3696, "step": 4240 }, { "epoch": 0.42, "learning_rate": 1.2877702633121623e-05, "loss": 2.3894, "step": 4241 }, { "epoch": 0.43, "learning_rate": 1.2874594639881303e-05, "loss": 2.2666, "step": 4242 }, { "epoch": 0.43, "learning_rate": 1.2871486343924611e-05, "loss": 2.3322, "step": 4243 }, { "epoch": 0.43, "learning_rate": 1.2868377745578869e-05, "loss": 2.3712, "step": 4244 }, { "epoch": 0.43, "learning_rate": 1.286526884517144e-05, "loss": 2.3406, "step": 4245 }, { "epoch": 0.43, "learning_rate": 1.2862159643029712e-05, "loss": 2.4078, "step": 4246 }, { "epoch": 0.43, "learning_rate": 1.285905013948111e-05, "loss": 2.351, "step": 4247 }, { "epoch": 0.43, "learning_rate": 1.2855940334853086e-05, "loss": 2.3043, "step": 4248 }, { "epoch": 0.43, "learning_rate": 1.2852830229473128e-05, "loss": 2.3916, "step": 4249 }, { "epoch": 0.43, "learning_rate": 1.284971982366875e-05, "loss": 2.2808, "step": 4250 }, { "epoch": 0.43, "learning_rate": 1.2846609117767502e-05, "loss": 2.4038, "step": 4251 }, { "epoch": 0.43, "learning_rate": 1.2843498112096967e-05, "loss": 2.365, "step": 4252 }, { "epoch": 0.43, "learning_rate": 1.284038680698475e-05, "loss": 2.2314, "step": 4253 }, { "epoch": 0.43, "learning_rate": 1.2837275202758507e-05, "loss": 2.4214, "step": 4254 }, { "epoch": 0.43, "learning_rate": 1.2834163299745904e-05, "loss": 2.4338, "step": 4255 }, { "epoch": 0.43, "learning_rate": 1.2831051098274649e-05, "loss": 2.2959, "step": 4256 }, { "epoch": 0.43, "learning_rate": 1.282793859867248e-05, "loss": 2.4012, "step": 4257 }, { "epoch": 0.43, "learning_rate": 1.282482580126717e-05, "loss": 2.2985, "step": 4258 }, { "epoch": 0.43, "learning_rate": 1.282171270638652e-05, "loss": 2.3932, "step": 4259 }, { "epoch": 0.43, "learning_rate": 1.281859931435836e-05, "loss": 2.3503, "step": 4260 }, { "epoch": 0.43, "learning_rate": 1.2815485625510555e-05, "loss": 2.4223, "step": 4261 }, { "epoch": 0.43, "learning_rate": 1.2812371640170993e-05, "loss": 2.3456, "step": 4262 }, { "epoch": 0.43, "learning_rate": 1.2809257358667608e-05, "loss": 2.3652, "step": 4263 }, { "epoch": 0.43, "learning_rate": 1.2806142781328357e-05, "loss": 2.3624, "step": 4264 }, { "epoch": 0.43, "learning_rate": 1.2803027908481225e-05, "loss": 2.3578, "step": 4265 }, { "epoch": 0.43, "learning_rate": 1.2799912740454227e-05, "loss": 2.2716, "step": 4266 }, { "epoch": 0.43, "learning_rate": 1.2796797277575425e-05, "loss": 2.3605, "step": 4267 }, { "epoch": 0.43, "learning_rate": 1.2793681520172893e-05, "loss": 2.3712, "step": 4268 }, { "epoch": 0.43, "learning_rate": 1.2790565468574747e-05, "loss": 2.3365, "step": 4269 }, { "epoch": 0.43, "learning_rate": 1.2787449123109129e-05, "loss": 2.4423, "step": 4270 }, { "epoch": 0.43, "learning_rate": 1.278433248410421e-05, "loss": 2.3171, "step": 4271 }, { "epoch": 0.43, "learning_rate": 1.27812155518882e-05, "loss": 2.3726, "step": 4272 }, { "epoch": 0.43, "learning_rate": 1.2778098326789335e-05, "loss": 2.3318, "step": 4273 }, { "epoch": 0.43, "learning_rate": 1.2774980809135883e-05, "loss": 2.418, "step": 4274 }, { "epoch": 0.43, "learning_rate": 1.2771862999256137e-05, "loss": 2.3392, "step": 4275 }, { "epoch": 0.43, "learning_rate": 1.276874489747843e-05, "loss": 2.4178, "step": 4276 }, { "epoch": 0.43, "learning_rate": 1.2765626504131121e-05, "loss": 2.3149, "step": 4277 }, { "epoch": 0.43, "learning_rate": 1.2762507819542602e-05, "loss": 2.3721, "step": 4278 }, { "epoch": 0.43, "learning_rate": 1.2759388844041289e-05, "loss": 2.3315, "step": 4279 }, { "epoch": 0.43, "learning_rate": 1.2756269577955636e-05, "loss": 2.4239, "step": 4280 }, { "epoch": 0.43, "learning_rate": 1.275315002161413e-05, "loss": 2.2707, "step": 4281 }, { "epoch": 0.43, "learning_rate": 1.2750030175345277e-05, "loss": 2.3516, "step": 4282 }, { "epoch": 0.43, "learning_rate": 1.274691003947762e-05, "loss": 2.365, "step": 4283 }, { "epoch": 0.43, "learning_rate": 1.2743789614339734e-05, "loss": 2.2892, "step": 4284 }, { "epoch": 0.43, "learning_rate": 1.2740668900260227e-05, "loss": 2.4178, "step": 4285 }, { "epoch": 0.43, "learning_rate": 1.2737547897567727e-05, "loss": 2.2239, "step": 4286 }, { "epoch": 0.43, "learning_rate": 1.2734426606590908e-05, "loss": 2.306, "step": 4287 }, { "epoch": 0.43, "learning_rate": 1.2731305027658456e-05, "loss": 2.3478, "step": 4288 }, { "epoch": 0.43, "learning_rate": 1.2728183161099102e-05, "loss": 2.3334, "step": 4289 }, { "epoch": 0.43, "learning_rate": 1.2725061007241601e-05, "loss": 2.4545, "step": 4290 }, { "epoch": 0.43, "learning_rate": 1.272193856641474e-05, "loss": 2.3822, "step": 4291 }, { "epoch": 0.43, "learning_rate": 1.2718815838947332e-05, "loss": 2.3749, "step": 4292 }, { "epoch": 0.43, "learning_rate": 1.2715692825168229e-05, "loss": 2.3151, "step": 4293 }, { "epoch": 0.43, "learning_rate": 1.2712569525406302e-05, "loss": 2.3779, "step": 4294 }, { "epoch": 0.43, "learning_rate": 1.2709445939990462e-05, "loss": 2.4268, "step": 4295 }, { "epoch": 0.43, "learning_rate": 1.2706322069249644e-05, "loss": 2.4006, "step": 4296 }, { "epoch": 0.43, "learning_rate": 1.2703197913512817e-05, "loss": 2.2815, "step": 4297 }, { "epoch": 0.43, "learning_rate": 1.2700073473108972e-05, "loss": 2.4683, "step": 4298 }, { "epoch": 0.43, "learning_rate": 1.2696948748367146e-05, "loss": 2.3552, "step": 4299 }, { "epoch": 0.43, "learning_rate": 1.269382373961639e-05, "loss": 2.3342, "step": 4300 }, { "epoch": 0.43, "learning_rate": 1.2690698447185788e-05, "loss": 2.3586, "step": 4301 }, { "epoch": 0.43, "learning_rate": 1.2687572871404464e-05, "loss": 2.3369, "step": 4302 }, { "epoch": 0.43, "learning_rate": 1.268444701260156e-05, "loss": 2.2049, "step": 4303 }, { "epoch": 0.43, "learning_rate": 1.268132087110625e-05, "loss": 2.4094, "step": 4304 }, { "epoch": 0.43, "learning_rate": 1.2678194447247747e-05, "loss": 2.3687, "step": 4305 }, { "epoch": 0.43, "learning_rate": 1.2675067741355282e-05, "loss": 2.2922, "step": 4306 }, { "epoch": 0.43, "learning_rate": 1.2671940753758119e-05, "loss": 2.3791, "step": 4307 }, { "epoch": 0.43, "learning_rate": 1.2668813484785559e-05, "loss": 2.4055, "step": 4308 }, { "epoch": 0.43, "learning_rate": 1.2665685934766923e-05, "loss": 2.4872, "step": 4309 }, { "epoch": 0.43, "learning_rate": 1.2662558104031568e-05, "loss": 2.3435, "step": 4310 }, { "epoch": 0.43, "learning_rate": 1.2659429992908872e-05, "loss": 2.29, "step": 4311 }, { "epoch": 0.43, "learning_rate": 1.2656301601728256e-05, "loss": 2.3349, "step": 4312 }, { "epoch": 0.43, "learning_rate": 1.2653172930819162e-05, "loss": 2.3433, "step": 4313 }, { "epoch": 0.43, "learning_rate": 1.265004398051106e-05, "loss": 2.437, "step": 4314 }, { "epoch": 0.43, "learning_rate": 1.264691475113345e-05, "loss": 2.3931, "step": 4315 }, { "epoch": 0.43, "learning_rate": 1.2643785243015865e-05, "loss": 2.3606, "step": 4316 }, { "epoch": 0.43, "learning_rate": 1.2640655456487867e-05, "loss": 2.3757, "step": 4317 }, { "epoch": 0.43, "learning_rate": 1.2637525391879048e-05, "loss": 2.3274, "step": 4318 }, { "epoch": 0.43, "learning_rate": 1.2634395049519024e-05, "loss": 2.4872, "step": 4319 }, { "epoch": 0.43, "learning_rate": 1.2631264429737441e-05, "loss": 2.3863, "step": 4320 }, { "epoch": 0.43, "learning_rate": 1.2628133532863982e-05, "loss": 2.4487, "step": 4321 }, { "epoch": 0.43, "learning_rate": 1.2625002359228352e-05, "loss": 2.3981, "step": 4322 }, { "epoch": 0.43, "learning_rate": 1.2621870909160288e-05, "loss": 2.3543, "step": 4323 }, { "epoch": 0.43, "learning_rate": 1.2618739182989554e-05, "loss": 2.4192, "step": 4324 }, { "epoch": 0.43, "learning_rate": 1.2615607181045943e-05, "loss": 2.4142, "step": 4325 }, { "epoch": 0.43, "learning_rate": 1.261247490365928e-05, "loss": 2.3529, "step": 4326 }, { "epoch": 0.43, "learning_rate": 1.2609342351159419e-05, "loss": 2.3931, "step": 4327 }, { "epoch": 0.43, "learning_rate": 1.2606209523876238e-05, "loss": 2.4053, "step": 4328 }, { "epoch": 0.43, "learning_rate": 1.2603076422139646e-05, "loss": 2.3434, "step": 4329 }, { "epoch": 0.43, "learning_rate": 1.2599943046279585e-05, "loss": 2.3909, "step": 4330 }, { "epoch": 0.43, "learning_rate": 1.2596809396626026e-05, "loss": 2.395, "step": 4331 }, { "epoch": 0.43, "learning_rate": 1.2593675473508959e-05, "loss": 2.3532, "step": 4332 }, { "epoch": 0.43, "learning_rate": 1.2590541277258417e-05, "loss": 2.3401, "step": 4333 }, { "epoch": 0.43, "learning_rate": 1.2587406808204448e-05, "loss": 2.4431, "step": 4334 }, { "epoch": 0.43, "learning_rate": 1.2584272066677137e-05, "loss": 2.2952, "step": 4335 }, { "epoch": 0.43, "learning_rate": 1.2581137053006595e-05, "loss": 2.4194, "step": 4336 }, { "epoch": 0.43, "learning_rate": 1.2578001767522967e-05, "loss": 2.447, "step": 4337 }, { "epoch": 0.43, "learning_rate": 1.2574866210556413e-05, "loss": 2.3784, "step": 4338 }, { "epoch": 0.43, "learning_rate": 1.2571730382437142e-05, "loss": 2.374, "step": 4339 }, { "epoch": 0.43, "learning_rate": 1.2568594283495372e-05, "loss": 2.3453, "step": 4340 }, { "epoch": 0.43, "learning_rate": 1.2565457914061362e-05, "loss": 2.203, "step": 4341 }, { "epoch": 0.44, "learning_rate": 1.2562321274465393e-05, "loss": 2.3653, "step": 4342 }, { "epoch": 0.44, "learning_rate": 1.2559184365037776e-05, "loss": 2.3626, "step": 4343 }, { "epoch": 0.44, "learning_rate": 1.2556047186108853e-05, "loss": 2.4689, "step": 4344 }, { "epoch": 0.44, "learning_rate": 1.2552909738008996e-05, "loss": 2.3995, "step": 4345 }, { "epoch": 0.44, "learning_rate": 1.2549772021068594e-05, "loss": 2.326, "step": 4346 }, { "epoch": 0.44, "learning_rate": 1.2546634035618073e-05, "loss": 2.423, "step": 4347 }, { "epoch": 0.44, "learning_rate": 1.2543495781987894e-05, "loss": 2.4434, "step": 4348 }, { "epoch": 0.44, "learning_rate": 1.2540357260508529e-05, "loss": 2.5165, "step": 4349 }, { "epoch": 0.44, "learning_rate": 1.2537218471510497e-05, "loss": 2.3937, "step": 4350 }, { "epoch": 0.44, "learning_rate": 1.2534079415324327e-05, "loss": 2.3564, "step": 4351 }, { "epoch": 0.44, "learning_rate": 1.2530940092280592e-05, "loss": 2.3177, "step": 4352 }, { "epoch": 0.44, "learning_rate": 1.2527800502709887e-05, "loss": 2.3659, "step": 4353 }, { "epoch": 0.44, "learning_rate": 1.252466064694283e-05, "loss": 2.3928, "step": 4354 }, { "epoch": 0.44, "learning_rate": 1.2521520525310071e-05, "loss": 2.5005, "step": 4355 }, { "epoch": 0.44, "learning_rate": 1.2518380138142292e-05, "loss": 2.2498, "step": 4356 }, { "epoch": 0.44, "learning_rate": 1.2515239485770199e-05, "loss": 2.3825, "step": 4357 }, { "epoch": 0.44, "learning_rate": 1.2512098568524519e-05, "loss": 2.3663, "step": 4358 }, { "epoch": 0.44, "learning_rate": 1.2508957386736025e-05, "loss": 2.4541, "step": 4359 }, { "epoch": 0.44, "learning_rate": 1.25058159407355e-05, "loss": 2.2982, "step": 4360 }, { "epoch": 0.44, "learning_rate": 1.2502674230853761e-05, "loss": 2.3573, "step": 4361 }, { "epoch": 0.44, "learning_rate": 1.249953225742166e-05, "loss": 2.3668, "step": 4362 }, { "epoch": 0.44, "learning_rate": 1.2496390020770068e-05, "loss": 2.3385, "step": 4363 }, { "epoch": 0.44, "learning_rate": 1.249324752122988e-05, "loss": 2.2623, "step": 4364 }, { "epoch": 0.44, "learning_rate": 1.2490104759132034e-05, "loss": 2.3043, "step": 4365 }, { "epoch": 0.44, "learning_rate": 1.2486961734807481e-05, "loss": 2.3918, "step": 4366 }, { "epoch": 0.44, "learning_rate": 1.2483818448587204e-05, "loss": 2.3077, "step": 4367 }, { "epoch": 0.44, "learning_rate": 1.2480674900802219e-05, "loss": 2.4193, "step": 4368 }, { "epoch": 0.44, "learning_rate": 1.2477531091783559e-05, "loss": 2.4481, "step": 4369 }, { "epoch": 0.44, "learning_rate": 1.2474387021862295e-05, "loss": 2.4292, "step": 4370 }, { "epoch": 0.44, "learning_rate": 1.2471242691369523e-05, "loss": 2.3556, "step": 4371 }, { "epoch": 0.44, "learning_rate": 1.2468098100636364e-05, "loss": 2.3921, "step": 4372 }, { "epoch": 0.44, "learning_rate": 1.2464953249993961e-05, "loss": 2.3208, "step": 4373 }, { "epoch": 0.44, "learning_rate": 1.2461808139773494e-05, "loss": 2.3686, "step": 4374 }, { "epoch": 0.44, "learning_rate": 1.245866277030617e-05, "loss": 2.3637, "step": 4375 }, { "epoch": 0.44, "learning_rate": 1.2455517141923217e-05, "loss": 2.3037, "step": 4376 }, { "epoch": 0.44, "learning_rate": 1.2452371254955892e-05, "loss": 2.3762, "step": 4377 }, { "epoch": 0.44, "learning_rate": 1.2449225109735483e-05, "loss": 2.4112, "step": 4378 }, { "epoch": 0.44, "learning_rate": 1.2446078706593301e-05, "loss": 2.3298, "step": 4379 }, { "epoch": 0.44, "learning_rate": 1.2442932045860688e-05, "loss": 2.3668, "step": 4380 }, { "epoch": 0.44, "learning_rate": 1.2439785127869007e-05, "loss": 2.4205, "step": 4381 }, { "epoch": 0.44, "learning_rate": 1.2436637952949655e-05, "loss": 2.3999, "step": 4382 }, { "epoch": 0.44, "learning_rate": 1.2433490521434051e-05, "loss": 2.2918, "step": 4383 }, { "epoch": 0.44, "learning_rate": 1.2430342833653649e-05, "loss": 2.4358, "step": 4384 }, { "epoch": 0.44, "learning_rate": 1.2427194889939918e-05, "loss": 2.3056, "step": 4385 }, { "epoch": 0.44, "learning_rate": 1.242404669062436e-05, "loss": 2.3526, "step": 4386 }, { "epoch": 0.44, "learning_rate": 1.2420898236038509e-05, "loss": 2.442, "step": 4387 }, { "epoch": 0.44, "learning_rate": 1.2417749526513915e-05, "loss": 2.3508, "step": 4388 }, { "epoch": 0.44, "learning_rate": 1.2414600562382167e-05, "loss": 2.4292, "step": 4389 }, { "epoch": 0.44, "learning_rate": 1.2411451343974868e-05, "loss": 2.2822, "step": 4390 }, { "epoch": 0.44, "learning_rate": 1.2408301871623658e-05, "loss": 2.4053, "step": 4391 }, { "epoch": 0.44, "learning_rate": 1.24051521456602e-05, "loss": 2.3587, "step": 4392 }, { "epoch": 0.44, "learning_rate": 1.2402002166416183e-05, "loss": 2.3325, "step": 4393 }, { "epoch": 0.44, "learning_rate": 1.2398851934223324e-05, "loss": 2.3692, "step": 4394 }, { "epoch": 0.44, "learning_rate": 1.2395701449413364e-05, "loss": 2.3587, "step": 4395 }, { "epoch": 0.44, "learning_rate": 1.2392550712318077e-05, "loss": 2.3354, "step": 4396 }, { "epoch": 0.44, "learning_rate": 1.2389399723269258e-05, "loss": 2.5222, "step": 4397 }, { "epoch": 0.44, "learning_rate": 1.2386248482598726e-05, "loss": 2.4027, "step": 4398 }, { "epoch": 0.44, "learning_rate": 1.2383096990638333e-05, "loss": 2.3644, "step": 4399 }, { "epoch": 0.44, "learning_rate": 1.2379945247719954e-05, "loss": 2.4431, "step": 4400 }, { "epoch": 0.44, "learning_rate": 1.237679325417549e-05, "loss": 2.3661, "step": 4401 }, { "epoch": 0.44, "learning_rate": 1.2373641010336875e-05, "loss": 2.2851, "step": 4402 }, { "epoch": 0.44, "learning_rate": 1.2370488516536056e-05, "loss": 2.3634, "step": 4403 }, { "epoch": 0.44, "learning_rate": 1.2367335773105023e-05, "loss": 2.4393, "step": 4404 }, { "epoch": 0.44, "learning_rate": 1.2364182780375776e-05, "loss": 2.3232, "step": 4405 }, { "epoch": 0.44, "learning_rate": 1.2361029538680352e-05, "loss": 2.3797, "step": 4406 }, { "epoch": 0.44, "learning_rate": 1.2357876048350809e-05, "loss": 2.4832, "step": 4407 }, { "epoch": 0.44, "learning_rate": 1.2354722309719238e-05, "loss": 2.4773, "step": 4408 }, { "epoch": 0.44, "learning_rate": 1.2351568323117748e-05, "loss": 2.4244, "step": 4409 }, { "epoch": 0.44, "learning_rate": 1.2348414088878476e-05, "loss": 2.4146, "step": 4410 }, { "epoch": 0.44, "learning_rate": 1.2345259607333589e-05, "loss": 2.3638, "step": 4411 }, { "epoch": 0.44, "learning_rate": 1.2342104878815278e-05, "loss": 2.3175, "step": 4412 }, { "epoch": 0.44, "learning_rate": 1.2338949903655755e-05, "loss": 2.4012, "step": 4413 }, { "epoch": 0.44, "learning_rate": 1.2335794682187266e-05, "loss": 2.4784, "step": 4414 }, { "epoch": 0.44, "learning_rate": 1.2332639214742081e-05, "loss": 2.22, "step": 4415 }, { "epoch": 0.44, "learning_rate": 1.2329483501652493e-05, "loss": 2.4107, "step": 4416 }, { "epoch": 0.44, "learning_rate": 1.2326327543250823e-05, "loss": 2.4237, "step": 4417 }, { "epoch": 0.44, "learning_rate": 1.2323171339869414e-05, "loss": 2.465, "step": 4418 }, { "epoch": 0.44, "learning_rate": 1.232001489184064e-05, "loss": 2.3514, "step": 4419 }, { "epoch": 0.44, "learning_rate": 1.2316858199496899e-05, "loss": 2.4141, "step": 4420 }, { "epoch": 0.44, "learning_rate": 1.2313701263170614e-05, "loss": 2.4717, "step": 4421 }, { "epoch": 0.44, "learning_rate": 1.2310544083194233e-05, "loss": 2.4026, "step": 4422 }, { "epoch": 0.44, "learning_rate": 1.2307386659900233e-05, "loss": 2.4037, "step": 4423 }, { "epoch": 0.44, "learning_rate": 1.2304228993621113e-05, "loss": 2.3319, "step": 4424 }, { "epoch": 0.44, "learning_rate": 1.2301071084689397e-05, "loss": 2.4037, "step": 4425 }, { "epoch": 0.44, "learning_rate": 1.229791293343764e-05, "loss": 2.4439, "step": 4426 }, { "epoch": 0.44, "learning_rate": 1.2294754540198417e-05, "loss": 2.4312, "step": 4427 }, { "epoch": 0.44, "learning_rate": 1.2291595905304332e-05, "loss": 2.2679, "step": 4428 }, { "epoch": 0.44, "learning_rate": 1.2288437029088016e-05, "loss": 2.3768, "step": 4429 }, { "epoch": 0.44, "learning_rate": 1.2285277911882114e-05, "loss": 2.3998, "step": 4430 }, { "epoch": 0.44, "learning_rate": 1.2282118554019309e-05, "loss": 2.3742, "step": 4431 }, { "epoch": 0.44, "learning_rate": 1.2278958955832306e-05, "loss": 2.3774, "step": 4432 }, { "epoch": 0.44, "learning_rate": 1.2275799117653833e-05, "loss": 2.4226, "step": 4433 }, { "epoch": 0.44, "learning_rate": 1.2272639039816646e-05, "loss": 2.3523, "step": 4434 }, { "epoch": 0.44, "learning_rate": 1.2269478722653521e-05, "loss": 2.4364, "step": 4435 }, { "epoch": 0.44, "learning_rate": 1.2266318166497266e-05, "loss": 2.3071, "step": 4436 }, { "epoch": 0.44, "learning_rate": 1.2263157371680716e-05, "loss": 2.3314, "step": 4437 }, { "epoch": 0.44, "learning_rate": 1.225999633853672e-05, "loss": 2.4045, "step": 4438 }, { "epoch": 0.44, "learning_rate": 1.2256835067398161e-05, "loss": 2.4682, "step": 4439 }, { "epoch": 0.44, "learning_rate": 1.2253673558597943e-05, "loss": 2.3774, "step": 4440 }, { "epoch": 0.44, "learning_rate": 1.2250511812468998e-05, "loss": 2.4367, "step": 4441 }, { "epoch": 0.45, "learning_rate": 1.224734982934428e-05, "loss": 2.4094, "step": 4442 }, { "epoch": 0.45, "learning_rate": 1.2244187609556772e-05, "loss": 2.3434, "step": 4443 }, { "epoch": 0.45, "learning_rate": 1.2241025153439477e-05, "loss": 2.3343, "step": 4444 }, { "epoch": 0.45, "learning_rate": 1.2237862461325425e-05, "loss": 2.3259, "step": 4445 }, { "epoch": 0.45, "learning_rate": 1.2234699533547674e-05, "loss": 2.3918, "step": 4446 }, { "epoch": 0.45, "learning_rate": 1.2231536370439305e-05, "loss": 2.2773, "step": 4447 }, { "epoch": 0.45, "learning_rate": 1.2228372972333418e-05, "loss": 2.3526, "step": 4448 }, { "epoch": 0.45, "learning_rate": 1.2225209339563144e-05, "loss": 2.2763, "step": 4449 }, { "epoch": 0.45, "learning_rate": 1.2222045472461641e-05, "loss": 2.3039, "step": 4450 }, { "epoch": 0.45, "learning_rate": 1.2218881371362086e-05, "loss": 2.3893, "step": 4451 }, { "epoch": 0.45, "learning_rate": 1.2215717036597678e-05, "loss": 2.3015, "step": 4452 }, { "epoch": 0.45, "learning_rate": 1.221255246850165e-05, "loss": 2.3527, "step": 4453 }, { "epoch": 0.45, "learning_rate": 1.2209387667407252e-05, "loss": 2.3011, "step": 4454 }, { "epoch": 0.45, "learning_rate": 1.2206222633647765e-05, "loss": 2.3267, "step": 4455 }, { "epoch": 0.45, "learning_rate": 1.2203057367556492e-05, "loss": 2.1966, "step": 4456 }, { "epoch": 0.45, "learning_rate": 1.219989186946675e-05, "loss": 2.4471, "step": 4457 }, { "epoch": 0.45, "learning_rate": 1.21967261397119e-05, "loss": 2.3261, "step": 4458 }, { "epoch": 0.45, "learning_rate": 1.219356017862531e-05, "loss": 2.4115, "step": 4459 }, { "epoch": 0.45, "learning_rate": 1.2190393986540385e-05, "loss": 2.4068, "step": 4460 }, { "epoch": 0.45, "learning_rate": 1.2187227563790547e-05, "loss": 2.4672, "step": 4461 }, { "epoch": 0.45, "learning_rate": 1.2184060910709242e-05, "loss": 2.314, "step": 4462 }, { "epoch": 0.45, "learning_rate": 1.218089402762994e-05, "loss": 2.1889, "step": 4463 }, { "epoch": 0.45, "learning_rate": 1.2177726914886142e-05, "loss": 2.3695, "step": 4464 }, { "epoch": 0.45, "learning_rate": 1.2174559572811368e-05, "loss": 2.3973, "step": 4465 }, { "epoch": 0.45, "learning_rate": 1.2171392001739163e-05, "loss": 2.2909, "step": 4466 }, { "epoch": 0.45, "learning_rate": 1.2168224202003098e-05, "loss": 2.2621, "step": 4467 }, { "epoch": 0.45, "learning_rate": 1.216505617393676e-05, "loss": 2.3224, "step": 4468 }, { "epoch": 0.45, "learning_rate": 1.2161887917873771e-05, "loss": 2.3154, "step": 4469 }, { "epoch": 0.45, "learning_rate": 1.215871943414777e-05, "loss": 2.405, "step": 4470 }, { "epoch": 0.45, "learning_rate": 1.2155550723092424e-05, "loss": 2.3602, "step": 4471 }, { "epoch": 0.45, "learning_rate": 1.2152381785041424e-05, "loss": 2.3459, "step": 4472 }, { "epoch": 0.45, "learning_rate": 1.2149212620328474e-05, "loss": 2.3381, "step": 4473 }, { "epoch": 0.45, "learning_rate": 1.214604322928732e-05, "loss": 2.3337, "step": 4474 }, { "epoch": 0.45, "learning_rate": 1.214287361225172e-05, "loss": 2.3243, "step": 4475 }, { "epoch": 0.45, "learning_rate": 1.2139703769555458e-05, "loss": 2.3051, "step": 4476 }, { "epoch": 0.45, "learning_rate": 1.2136533701532338e-05, "loss": 2.2809, "step": 4477 }, { "epoch": 0.45, "learning_rate": 1.21333634085162e-05, "loss": 2.325, "step": 4478 }, { "epoch": 0.45, "learning_rate": 1.2130192890840893e-05, "loss": 2.3567, "step": 4479 }, { "epoch": 0.45, "learning_rate": 1.21270221488403e-05, "loss": 2.2495, "step": 4480 }, { "epoch": 0.45, "learning_rate": 1.2123851182848323e-05, "loss": 2.4021, "step": 4481 }, { "epoch": 0.45, "learning_rate": 1.2120679993198889e-05, "loss": 2.422, "step": 4482 }, { "epoch": 0.45, "learning_rate": 1.2117508580225947e-05, "loss": 2.4851, "step": 4483 }, { "epoch": 0.45, "learning_rate": 1.211433694426347e-05, "loss": 2.2648, "step": 4484 }, { "epoch": 0.45, "learning_rate": 1.2111165085645456e-05, "loss": 2.3782, "step": 4485 }, { "epoch": 0.45, "learning_rate": 1.2107993004705924e-05, "loss": 2.3683, "step": 4486 }, { "epoch": 0.45, "learning_rate": 1.210482070177892e-05, "loss": 2.395, "step": 4487 }, { "epoch": 0.45, "learning_rate": 1.2101648177198512e-05, "loss": 2.3765, "step": 4488 }, { "epoch": 0.45, "learning_rate": 1.209847543129879e-05, "loss": 2.4168, "step": 4489 }, { "epoch": 0.45, "learning_rate": 1.2095302464413865e-05, "loss": 2.4046, "step": 4490 }, { "epoch": 0.45, "learning_rate": 1.2092129276877879e-05, "loss": 2.4834, "step": 4491 }, { "epoch": 0.45, "learning_rate": 1.2088955869024988e-05, "loss": 2.2874, "step": 4492 }, { "epoch": 0.45, "learning_rate": 1.208578224118938e-05, "loss": 2.4423, "step": 4493 }, { "epoch": 0.45, "learning_rate": 1.208260839370526e-05, "loss": 2.3718, "step": 4494 }, { "epoch": 0.45, "learning_rate": 1.2079434326906851e-05, "loss": 2.3607, "step": 4495 }, { "epoch": 0.45, "learning_rate": 1.2076260041128419e-05, "loss": 2.2544, "step": 4496 }, { "epoch": 0.45, "learning_rate": 1.207308553670423e-05, "loss": 2.3996, "step": 4497 }, { "epoch": 0.45, "learning_rate": 1.2069910813968586e-05, "loss": 2.3297, "step": 4498 }, { "epoch": 0.45, "learning_rate": 1.206673587325581e-05, "loss": 2.4372, "step": 4499 }, { "epoch": 0.45, "learning_rate": 1.2063560714900249e-05, "loss": 2.3816, "step": 4500 }, { "epoch": 0.45, "learning_rate": 1.2060385339236266e-05, "loss": 2.38, "step": 4501 }, { "epoch": 0.45, "learning_rate": 1.2057209746598257e-05, "loss": 2.375, "step": 4502 }, { "epoch": 0.45, "learning_rate": 1.2054033937320632e-05, "loss": 2.3874, "step": 4503 }, { "epoch": 0.45, "learning_rate": 1.205085791173783e-05, "loss": 2.268, "step": 4504 }, { "epoch": 0.45, "learning_rate": 1.2047681670184307e-05, "loss": 2.3433, "step": 4505 }, { "epoch": 0.45, "learning_rate": 1.204450521299455e-05, "loss": 2.3786, "step": 4506 }, { "epoch": 0.45, "learning_rate": 1.204132854050306e-05, "loss": 2.4117, "step": 4507 }, { "epoch": 0.45, "learning_rate": 1.2038151653044363e-05, "loss": 2.4156, "step": 4508 }, { "epoch": 0.45, "learning_rate": 1.2034974550953014e-05, "loss": 2.3334, "step": 4509 }, { "epoch": 0.45, "learning_rate": 1.2031797234563583e-05, "loss": 2.4544, "step": 4510 }, { "epoch": 0.45, "learning_rate": 1.2028619704210664e-05, "loss": 2.2311, "step": 4511 }, { "epoch": 0.45, "learning_rate": 1.2025441960228876e-05, "loss": 2.4347, "step": 4512 }, { "epoch": 0.45, "learning_rate": 1.2022264002952862e-05, "loss": 2.3763, "step": 4513 }, { "epoch": 0.45, "learning_rate": 1.2019085832717281e-05, "loss": 2.3827, "step": 4514 }, { "epoch": 0.45, "learning_rate": 1.201590744985682e-05, "loss": 2.4215, "step": 4515 }, { "epoch": 0.45, "learning_rate": 1.2012728854706186e-05, "loss": 2.3866, "step": 4516 }, { "epoch": 0.45, "learning_rate": 1.2009550047600105e-05, "loss": 2.4018, "step": 4517 }, { "epoch": 0.45, "learning_rate": 1.2006371028873335e-05, "loss": 2.358, "step": 4518 }, { "epoch": 0.45, "learning_rate": 1.2003191798860651e-05, "loss": 2.3794, "step": 4519 }, { "epoch": 0.45, "learning_rate": 1.2000012357896846e-05, "loss": 2.3845, "step": 4520 }, { "epoch": 0.45, "learning_rate": 1.1996832706316739e-05, "loss": 2.4183, "step": 4521 }, { "epoch": 0.45, "learning_rate": 1.1993652844455172e-05, "loss": 2.2917, "step": 4522 }, { "epoch": 0.45, "learning_rate": 1.1990472772647013e-05, "loss": 2.4357, "step": 4523 }, { "epoch": 0.45, "learning_rate": 1.1987292491227138e-05, "loss": 2.3275, "step": 4524 }, { "epoch": 0.45, "learning_rate": 1.1984112000530465e-05, "loss": 2.4233, "step": 4525 }, { "epoch": 0.45, "learning_rate": 1.1980931300891914e-05, "loss": 2.3014, "step": 4526 }, { "epoch": 0.45, "learning_rate": 1.1977750392646443e-05, "loss": 2.4342, "step": 4527 }, { "epoch": 0.45, "learning_rate": 1.1974569276129023e-05, "loss": 2.3225, "step": 4528 }, { "epoch": 0.45, "learning_rate": 1.1971387951674648e-05, "loss": 2.2571, "step": 4529 }, { "epoch": 0.45, "learning_rate": 1.1968206419618336e-05, "loss": 2.3491, "step": 4530 }, { "epoch": 0.45, "learning_rate": 1.196502468029513e-05, "loss": 2.3929, "step": 4531 }, { "epoch": 0.45, "learning_rate": 1.1961842734040088e-05, "loss": 2.2879, "step": 4532 }, { "epoch": 0.45, "learning_rate": 1.195866058118829e-05, "loss": 2.3356, "step": 4533 }, { "epoch": 0.45, "learning_rate": 1.1955478222074848e-05, "loss": 2.2262, "step": 4534 }, { "epoch": 0.45, "learning_rate": 1.195229565703488e-05, "loss": 2.3297, "step": 4535 }, { "epoch": 0.45, "learning_rate": 1.194911288640354e-05, "loss": 2.3619, "step": 4536 }, { "epoch": 0.45, "learning_rate": 1.1945929910515994e-05, "loss": 2.3751, "step": 4537 }, { "epoch": 0.45, "learning_rate": 1.1942746729707438e-05, "loss": 2.3519, "step": 4538 }, { "epoch": 0.45, "learning_rate": 1.1939563344313076e-05, "loss": 2.3502, "step": 4539 }, { "epoch": 0.45, "learning_rate": 1.193637975466815e-05, "loss": 2.3759, "step": 4540 }, { "epoch": 0.45, "learning_rate": 1.1933195961107915e-05, "loss": 2.3019, "step": 4541 }, { "epoch": 0.46, "learning_rate": 1.1930011963967644e-05, "loss": 2.4321, "step": 4542 }, { "epoch": 0.46, "learning_rate": 1.1926827763582643e-05, "loss": 2.2586, "step": 4543 }, { "epoch": 0.46, "learning_rate": 1.1923643360288227e-05, "loss": 2.4468, "step": 4544 }, { "epoch": 0.46, "learning_rate": 1.1920458754419734e-05, "loss": 2.4246, "step": 4545 }, { "epoch": 0.46, "learning_rate": 1.1917273946312537e-05, "loss": 2.3259, "step": 4546 }, { "epoch": 0.46, "learning_rate": 1.1914088936302013e-05, "loss": 2.4307, "step": 4547 }, { "epoch": 0.46, "learning_rate": 1.1910903724723566e-05, "loss": 2.3828, "step": 4548 }, { "epoch": 0.46, "learning_rate": 1.1907718311912628e-05, "loss": 2.3612, "step": 4549 }, { "epoch": 0.46, "learning_rate": 1.1904532698204646e-05, "loss": 2.3873, "step": 4550 }, { "epoch": 0.46, "learning_rate": 1.1901346883935086e-05, "loss": 2.3306, "step": 4551 }, { "epoch": 0.46, "learning_rate": 1.1898160869439437e-05, "loss": 2.417, "step": 4552 }, { "epoch": 0.46, "learning_rate": 1.1894974655053215e-05, "loss": 2.424, "step": 4553 }, { "epoch": 0.46, "learning_rate": 1.1891788241111951e-05, "loss": 2.5221, "step": 4554 }, { "epoch": 0.46, "learning_rate": 1.1888601627951197e-05, "loss": 2.3209, "step": 4555 }, { "epoch": 0.46, "learning_rate": 1.1885414815906531e-05, "loss": 2.4255, "step": 4556 }, { "epoch": 0.46, "learning_rate": 1.188222780531354e-05, "loss": 2.3105, "step": 4557 }, { "epoch": 0.46, "learning_rate": 1.1879040596507844e-05, "loss": 2.3679, "step": 4558 }, { "epoch": 0.46, "learning_rate": 1.1875853189825087e-05, "loss": 2.4411, "step": 4559 }, { "epoch": 0.46, "learning_rate": 1.1872665585600916e-05, "loss": 2.4367, "step": 4560 }, { "epoch": 0.46, "learning_rate": 1.1869477784171018e-05, "loss": 2.4234, "step": 4561 }, { "epoch": 0.46, "learning_rate": 1.1866289785871083e-05, "loss": 2.3963, "step": 4562 }, { "epoch": 0.46, "learning_rate": 1.1863101591036844e-05, "loss": 2.3367, "step": 4563 }, { "epoch": 0.46, "learning_rate": 1.185991320000403e-05, "loss": 2.3975, "step": 4564 }, { "epoch": 0.46, "learning_rate": 1.185672461310841e-05, "loss": 2.3699, "step": 4565 }, { "epoch": 0.46, "learning_rate": 1.1853535830685764e-05, "loss": 2.3245, "step": 4566 }, { "epoch": 0.46, "learning_rate": 1.185034685307189e-05, "loss": 2.3804, "step": 4567 }, { "epoch": 0.46, "learning_rate": 1.184715768060262e-05, "loss": 2.3209, "step": 4568 }, { "epoch": 0.46, "learning_rate": 1.1843968313613792e-05, "loss": 2.3636, "step": 4569 }, { "epoch": 0.46, "learning_rate": 1.1840778752441268e-05, "loss": 2.3649, "step": 4570 }, { "epoch": 0.46, "learning_rate": 1.1837588997420939e-05, "loss": 2.3657, "step": 4571 }, { "epoch": 0.46, "learning_rate": 1.1834399048888707e-05, "loss": 2.3854, "step": 4572 }, { "epoch": 0.46, "learning_rate": 1.1831208907180497e-05, "loss": 2.3698, "step": 4573 }, { "epoch": 0.46, "learning_rate": 1.1828018572632259e-05, "loss": 2.3328, "step": 4574 }, { "epoch": 0.46, "learning_rate": 1.182482804557995e-05, "loss": 2.3987, "step": 4575 }, { "epoch": 0.46, "learning_rate": 1.182163732635957e-05, "loss": 2.3745, "step": 4576 }, { "epoch": 0.46, "learning_rate": 1.1818446415307113e-05, "loss": 2.4005, "step": 4577 }, { "epoch": 0.46, "learning_rate": 1.1815255312758612e-05, "loss": 2.365, "step": 4578 }, { "epoch": 0.46, "learning_rate": 1.1812064019050111e-05, "loss": 2.2891, "step": 4579 }, { "epoch": 0.46, "learning_rate": 1.180887253451768e-05, "loss": 2.3333, "step": 4580 }, { "epoch": 0.46, "learning_rate": 1.1805680859497404e-05, "loss": 2.3067, "step": 4581 }, { "epoch": 0.46, "learning_rate": 1.1802488994325392e-05, "loss": 2.3811, "step": 4582 }, { "epoch": 0.46, "learning_rate": 1.1799296939337773e-05, "loss": 2.3102, "step": 4583 }, { "epoch": 0.46, "learning_rate": 1.1796104694870686e-05, "loss": 2.3907, "step": 4584 }, { "epoch": 0.46, "learning_rate": 1.1792912261260312e-05, "loss": 2.2887, "step": 4585 }, { "epoch": 0.46, "learning_rate": 1.1789719638842827e-05, "loss": 2.2801, "step": 4586 }, { "epoch": 0.46, "learning_rate": 1.1786526827954442e-05, "loss": 2.398, "step": 4587 }, { "epoch": 0.46, "learning_rate": 1.1783333828931387e-05, "loss": 2.2037, "step": 4588 }, { "epoch": 0.46, "learning_rate": 1.17801406421099e-05, "loss": 2.3641, "step": 4589 }, { "epoch": 0.46, "learning_rate": 1.1776947267826257e-05, "loss": 2.3701, "step": 4590 }, { "epoch": 0.46, "learning_rate": 1.1773753706416739e-05, "loss": 2.3126, "step": 4591 }, { "epoch": 0.46, "learning_rate": 1.1770559958217653e-05, "loss": 2.2773, "step": 4592 }, { "epoch": 0.46, "learning_rate": 1.1767366023565323e-05, "loss": 2.2996, "step": 4593 }, { "epoch": 0.46, "learning_rate": 1.1764171902796098e-05, "loss": 2.4207, "step": 4594 }, { "epoch": 0.46, "learning_rate": 1.1760977596246341e-05, "loss": 2.4314, "step": 4595 }, { "epoch": 0.46, "learning_rate": 1.1757783104252435e-05, "loss": 2.4355, "step": 4596 }, { "epoch": 0.46, "learning_rate": 1.1754588427150789e-05, "loss": 2.3343, "step": 4597 }, { "epoch": 0.46, "learning_rate": 1.175139356527782e-05, "loss": 2.2763, "step": 4598 }, { "epoch": 0.46, "learning_rate": 1.1748198518969973e-05, "loss": 2.3324, "step": 4599 }, { "epoch": 0.46, "learning_rate": 1.1745003288563712e-05, "loss": 2.4315, "step": 4600 }, { "epoch": 0.46, "learning_rate": 1.1741807874395519e-05, "loss": 2.3091, "step": 4601 }, { "epoch": 0.46, "learning_rate": 1.1738612276801891e-05, "loss": 2.4343, "step": 4602 }, { "epoch": 0.46, "learning_rate": 1.1735416496119354e-05, "loss": 2.3851, "step": 4603 }, { "epoch": 0.46, "learning_rate": 1.1732220532684444e-05, "loss": 2.3604, "step": 4604 }, { "epoch": 0.46, "learning_rate": 1.1729024386833721e-05, "loss": 2.3717, "step": 4605 }, { "epoch": 0.46, "learning_rate": 1.172582805890376e-05, "loss": 2.336, "step": 4606 }, { "epoch": 0.46, "learning_rate": 1.1722631549231166e-05, "loss": 2.3683, "step": 4607 }, { "epoch": 0.46, "learning_rate": 1.171943485815255e-05, "loss": 2.4119, "step": 4608 }, { "epoch": 0.46, "learning_rate": 1.1716237986004546e-05, "loss": 2.3809, "step": 4609 }, { "epoch": 0.46, "learning_rate": 1.1713040933123811e-05, "loss": 2.3727, "step": 4610 }, { "epoch": 0.46, "learning_rate": 1.1709843699847019e-05, "loss": 2.257, "step": 4611 }, { "epoch": 0.46, "learning_rate": 1.1706646286510863e-05, "loss": 2.3926, "step": 4612 }, { "epoch": 0.46, "learning_rate": 1.1703448693452054e-05, "loss": 2.3262, "step": 4613 }, { "epoch": 0.46, "learning_rate": 1.1700250921007322e-05, "loss": 2.3287, "step": 4614 }, { "epoch": 0.46, "learning_rate": 1.1697052969513414e-05, "loss": 2.273, "step": 4615 }, { "epoch": 0.46, "learning_rate": 1.1693854839307105e-05, "loss": 2.2734, "step": 4616 }, { "epoch": 0.46, "learning_rate": 1.1690656530725176e-05, "loss": 2.4071, "step": 4617 }, { "epoch": 0.46, "learning_rate": 1.1687458044104434e-05, "loss": 2.3452, "step": 4618 }, { "epoch": 0.46, "learning_rate": 1.1684259379781707e-05, "loss": 2.3736, "step": 4619 }, { "epoch": 0.46, "learning_rate": 1.1681060538093836e-05, "loss": 2.2458, "step": 4620 }, { "epoch": 0.46, "learning_rate": 1.167786151937768e-05, "loss": 2.3413, "step": 4621 }, { "epoch": 0.46, "learning_rate": 1.1674662323970125e-05, "loss": 2.3454, "step": 4622 }, { "epoch": 0.46, "learning_rate": 1.1671462952208069e-05, "loss": 2.3087, "step": 4623 }, { "epoch": 0.46, "learning_rate": 1.1668263404428424e-05, "loss": 2.2884, "step": 4624 }, { "epoch": 0.46, "learning_rate": 1.1665063680968133e-05, "loss": 2.3894, "step": 4625 }, { "epoch": 0.46, "learning_rate": 1.1661863782164154e-05, "loss": 2.4108, "step": 4626 }, { "epoch": 0.46, "learning_rate": 1.165866370835345e-05, "loss": 2.2834, "step": 4627 }, { "epoch": 0.46, "learning_rate": 1.165546345987302e-05, "loss": 2.4717, "step": 4628 }, { "epoch": 0.46, "learning_rate": 1.1652263037059872e-05, "loss": 2.3279, "step": 4629 }, { "epoch": 0.46, "learning_rate": 1.1649062440251035e-05, "loss": 2.2933, "step": 4630 }, { "epoch": 0.46, "learning_rate": 1.1645861669783556e-05, "loss": 2.4298, "step": 4631 }, { "epoch": 0.46, "learning_rate": 1.1642660725994499e-05, "loss": 2.4174, "step": 4632 }, { "epoch": 0.46, "learning_rate": 1.1639459609220946e-05, "loss": 2.2452, "step": 4633 }, { "epoch": 0.46, "learning_rate": 1.1636258319800002e-05, "loss": 2.353, "step": 4634 }, { "epoch": 0.46, "learning_rate": 1.1633056858068787e-05, "loss": 2.3481, "step": 4635 }, { "epoch": 0.46, "learning_rate": 1.1629855224364439e-05, "loss": 2.323, "step": 4636 }, { "epoch": 0.46, "learning_rate": 1.162665341902411e-05, "loss": 2.3189, "step": 4637 }, { "epoch": 0.46, "learning_rate": 1.1623451442384977e-05, "loss": 2.4099, "step": 4638 }, { "epoch": 0.46, "learning_rate": 1.1620249294784232e-05, "loss": 2.3413, "step": 4639 }, { "epoch": 0.46, "learning_rate": 1.1617046976559086e-05, "loss": 2.3985, "step": 4640 }, { "epoch": 0.46, "learning_rate": 1.1613844488046766e-05, "loss": 2.4017, "step": 4641 }, { "epoch": 0.47, "learning_rate": 1.1610641829584515e-05, "loss": 2.3178, "step": 4642 }, { "epoch": 0.47, "learning_rate": 1.1607439001509602e-05, "loss": 2.412, "step": 4643 }, { "epoch": 0.47, "learning_rate": 1.1604236004159306e-05, "loss": 2.3804, "step": 4644 }, { "epoch": 0.47, "learning_rate": 1.160103283787093e-05, "loss": 2.3455, "step": 4645 }, { "epoch": 0.47, "learning_rate": 1.1597829502981788e-05, "loss": 2.3932, "step": 4646 }, { "epoch": 0.47, "learning_rate": 1.1594625999829215e-05, "loss": 2.4433, "step": 4647 }, { "epoch": 0.47, "learning_rate": 1.1591422328750565e-05, "loss": 2.4462, "step": 4648 }, { "epoch": 0.47, "learning_rate": 1.158821849008321e-05, "loss": 2.4283, "step": 4649 }, { "epoch": 0.47, "learning_rate": 1.1585014484164536e-05, "loss": 2.3178, "step": 4650 }, { "epoch": 0.47, "learning_rate": 1.1581810311331951e-05, "loss": 2.357, "step": 4651 }, { "epoch": 0.47, "learning_rate": 1.1578605971922876e-05, "loss": 2.437, "step": 4652 }, { "epoch": 0.47, "learning_rate": 1.1575401466274753e-05, "loss": 2.2745, "step": 4653 }, { "epoch": 0.47, "learning_rate": 1.157219679472504e-05, "loss": 2.3385, "step": 4654 }, { "epoch": 0.47, "learning_rate": 1.1568991957611217e-05, "loss": 2.2905, "step": 4655 }, { "epoch": 0.47, "learning_rate": 1.156578695527077e-05, "loss": 2.4328, "step": 4656 }, { "epoch": 0.47, "learning_rate": 1.1562581788041215e-05, "loss": 2.373, "step": 4657 }, { "epoch": 0.47, "learning_rate": 1.1559376456260081e-05, "loss": 2.3924, "step": 4658 }, { "epoch": 0.47, "learning_rate": 1.1556170960264907e-05, "loss": 2.4527, "step": 4659 }, { "epoch": 0.47, "learning_rate": 1.1552965300393264e-05, "loss": 2.376, "step": 4660 }, { "epoch": 0.47, "learning_rate": 1.1549759476982727e-05, "loss": 2.2466, "step": 4661 }, { "epoch": 0.47, "learning_rate": 1.1546553490370896e-05, "loss": 2.3497, "step": 4662 }, { "epoch": 0.47, "learning_rate": 1.1543347340895381e-05, "loss": 2.3794, "step": 4663 }, { "epoch": 0.47, "learning_rate": 1.1540141028893819e-05, "loss": 2.4206, "step": 4664 }, { "epoch": 0.47, "learning_rate": 1.1536934554703852e-05, "loss": 2.2992, "step": 4665 }, { "epoch": 0.47, "learning_rate": 1.1533727918663154e-05, "loss": 2.3282, "step": 4666 }, { "epoch": 0.47, "learning_rate": 1.1530521121109401e-05, "loss": 2.4278, "step": 4667 }, { "epoch": 0.47, "learning_rate": 1.15273141623803e-05, "loss": 2.3146, "step": 4668 }, { "epoch": 0.47, "learning_rate": 1.1524107042813558e-05, "loss": 2.2798, "step": 4669 }, { "epoch": 0.47, "learning_rate": 1.1520899762746915e-05, "loss": 2.3527, "step": 4670 }, { "epoch": 0.47, "learning_rate": 1.1517692322518123e-05, "loss": 2.4001, "step": 4671 }, { "epoch": 0.47, "learning_rate": 1.1514484722464949e-05, "loss": 2.3666, "step": 4672 }, { "epoch": 0.47, "learning_rate": 1.1511276962925173e-05, "loss": 2.414, "step": 4673 }, { "epoch": 0.47, "learning_rate": 1.1508069044236597e-05, "loss": 2.3391, "step": 4674 }, { "epoch": 0.47, "learning_rate": 1.1504860966737042e-05, "loss": 2.3488, "step": 4675 }, { "epoch": 0.47, "learning_rate": 1.150165273076434e-05, "loss": 2.274, "step": 4676 }, { "epoch": 0.47, "learning_rate": 1.1498444336656347e-05, "loss": 2.417, "step": 4677 }, { "epoch": 0.47, "learning_rate": 1.1495235784750925e-05, "loss": 2.372, "step": 4678 }, { "epoch": 0.47, "learning_rate": 1.1492027075385961e-05, "loss": 2.3178, "step": 4679 }, { "epoch": 0.47, "learning_rate": 1.1488818208899357e-05, "loss": 2.3259, "step": 4680 }, { "epoch": 0.47, "learning_rate": 1.1485609185629032e-05, "loss": 2.3923, "step": 4681 }, { "epoch": 0.47, "learning_rate": 1.1482400005912915e-05, "loss": 2.3637, "step": 4682 }, { "epoch": 0.47, "learning_rate": 1.1479190670088962e-05, "loss": 2.3111, "step": 4683 }, { "epoch": 0.47, "learning_rate": 1.1475981178495137e-05, "loss": 2.3516, "step": 4684 }, { "epoch": 0.47, "learning_rate": 1.1472771531469427e-05, "loss": 2.4223, "step": 4685 }, { "epoch": 0.47, "learning_rate": 1.1469561729349824e-05, "loss": 2.3661, "step": 4686 }, { "epoch": 0.47, "learning_rate": 1.1466351772474353e-05, "loss": 2.3697, "step": 4687 }, { "epoch": 0.47, "learning_rate": 1.1463141661181043e-05, "loss": 2.4281, "step": 4688 }, { "epoch": 0.47, "learning_rate": 1.1459931395807944e-05, "loss": 2.2804, "step": 4689 }, { "epoch": 0.47, "learning_rate": 1.1456720976693118e-05, "loss": 2.3253, "step": 4690 }, { "epoch": 0.47, "learning_rate": 1.1453510404174648e-05, "loss": 2.2893, "step": 4691 }, { "epoch": 0.47, "learning_rate": 1.1450299678590637e-05, "loss": 2.431, "step": 4692 }, { "epoch": 0.47, "learning_rate": 1.144708880027919e-05, "loss": 2.3185, "step": 4693 }, { "epoch": 0.47, "learning_rate": 1.1443877769578438e-05, "loss": 2.3099, "step": 4694 }, { "epoch": 0.47, "learning_rate": 1.144066658682653e-05, "loss": 2.3557, "step": 4695 }, { "epoch": 0.47, "learning_rate": 1.1437455252361622e-05, "loss": 2.3445, "step": 4696 }, { "epoch": 0.47, "learning_rate": 1.1434243766521897e-05, "loss": 2.3241, "step": 4697 }, { "epoch": 0.47, "learning_rate": 1.143103212964555e-05, "loss": 2.4659, "step": 4698 }, { "epoch": 0.47, "learning_rate": 1.1427820342070785e-05, "loss": 2.4108, "step": 4699 }, { "epoch": 0.47, "learning_rate": 1.142460840413583e-05, "loss": 2.4297, "step": 4700 }, { "epoch": 0.47, "learning_rate": 1.1421396316178928e-05, "loss": 2.3386, "step": 4701 }, { "epoch": 0.47, "learning_rate": 1.1418184078538333e-05, "loss": 2.2967, "step": 4702 }, { "epoch": 0.47, "learning_rate": 1.1414971691552319e-05, "loss": 2.3764, "step": 4703 }, { "epoch": 0.47, "learning_rate": 1.1411759155559174e-05, "loss": 2.3667, "step": 4704 }, { "epoch": 0.47, "learning_rate": 1.1408546470897201e-05, "loss": 2.379, "step": 4705 }, { "epoch": 0.47, "learning_rate": 1.1405333637904722e-05, "loss": 2.3278, "step": 4706 }, { "epoch": 0.47, "learning_rate": 1.140212065692007e-05, "loss": 2.5003, "step": 4707 }, { "epoch": 0.47, "learning_rate": 1.1398907528281599e-05, "loss": 2.2573, "step": 4708 }, { "epoch": 0.47, "learning_rate": 1.1395694252327671e-05, "loss": 2.4297, "step": 4709 }, { "epoch": 0.47, "learning_rate": 1.1392480829396674e-05, "loss": 2.3745, "step": 4710 }, { "epoch": 0.47, "learning_rate": 1.1389267259827002e-05, "loss": 2.4818, "step": 4711 }, { "epoch": 0.47, "learning_rate": 1.138605354395707e-05, "loss": 2.3683, "step": 4712 }, { "epoch": 0.47, "learning_rate": 1.1382839682125301e-05, "loss": 2.3043, "step": 4713 }, { "epoch": 0.47, "learning_rate": 1.1379625674670147e-05, "loss": 2.3511, "step": 4714 }, { "epoch": 0.47, "learning_rate": 1.1376411521930059e-05, "loss": 2.3608, "step": 4715 }, { "epoch": 0.47, "learning_rate": 1.137319722424352e-05, "loss": 2.3954, "step": 4716 }, { "epoch": 0.47, "learning_rate": 1.1369982781949011e-05, "loss": 2.3429, "step": 4717 }, { "epoch": 0.47, "learning_rate": 1.1366768195385038e-05, "loss": 2.349, "step": 4718 }, { "epoch": 0.47, "learning_rate": 1.1363553464890127e-05, "loss": 2.314, "step": 4719 }, { "epoch": 0.47, "learning_rate": 1.136033859080281e-05, "loss": 2.2508, "step": 4720 }, { "epoch": 0.47, "learning_rate": 1.1357123573461639e-05, "loss": 2.3343, "step": 4721 }, { "epoch": 0.47, "learning_rate": 1.1353908413205177e-05, "loss": 2.3994, "step": 4722 }, { "epoch": 0.47, "learning_rate": 1.1350693110372002e-05, "loss": 2.3799, "step": 4723 }, { "epoch": 0.47, "learning_rate": 1.1347477665300717e-05, "loss": 2.4092, "step": 4724 }, { "epoch": 0.47, "learning_rate": 1.1344262078329926e-05, "loss": 2.3483, "step": 4725 }, { "epoch": 0.47, "learning_rate": 1.1341046349798257e-05, "loss": 2.3081, "step": 4726 }, { "epoch": 0.47, "learning_rate": 1.1337830480044348e-05, "loss": 2.2941, "step": 4727 }, { "epoch": 0.47, "learning_rate": 1.133461446940686e-05, "loss": 2.3536, "step": 4728 }, { "epoch": 0.47, "learning_rate": 1.1331398318224457e-05, "loss": 2.38, "step": 4729 }, { "epoch": 0.47, "learning_rate": 1.1328182026835825e-05, "loss": 2.4076, "step": 4730 }, { "epoch": 0.47, "learning_rate": 1.1324965595579667e-05, "loss": 2.3237, "step": 4731 }, { "epoch": 0.47, "learning_rate": 1.132174902479469e-05, "loss": 2.3605, "step": 4732 }, { "epoch": 0.47, "learning_rate": 1.1318532314819635e-05, "loss": 2.4473, "step": 4733 }, { "epoch": 0.47, "learning_rate": 1.1315315465993235e-05, "loss": 2.3985, "step": 4734 }, { "epoch": 0.47, "learning_rate": 1.1312098478654252e-05, "loss": 2.3403, "step": 4735 }, { "epoch": 0.47, "learning_rate": 1.130888135314146e-05, "loss": 2.3942, "step": 4736 }, { "epoch": 0.47, "learning_rate": 1.1305664089793647e-05, "loss": 2.539, "step": 4737 }, { "epoch": 0.47, "learning_rate": 1.130244668894961e-05, "loss": 2.333, "step": 4738 }, { "epoch": 0.47, "learning_rate": 1.129922915094817e-05, "loss": 2.2965, "step": 4739 }, { "epoch": 0.47, "learning_rate": 1.1296011476128157e-05, "loss": 2.3919, "step": 4740 }, { "epoch": 0.48, "learning_rate": 1.1292793664828414e-05, "loss": 2.3493, "step": 4741 }, { "epoch": 0.48, "learning_rate": 1.1289575717387803e-05, "loss": 2.4441, "step": 4742 }, { "epoch": 0.48, "learning_rate": 1.12863576341452e-05, "loss": 2.436, "step": 4743 }, { "epoch": 0.48, "learning_rate": 1.128313941543949e-05, "loss": 2.2806, "step": 4744 }, { "epoch": 0.48, "learning_rate": 1.1279921061609576e-05, "loss": 2.2848, "step": 4745 }, { "epoch": 0.48, "learning_rate": 1.1276702572994376e-05, "loss": 2.3583, "step": 4746 }, { "epoch": 0.48, "learning_rate": 1.127348394993282e-05, "loss": 2.3518, "step": 4747 }, { "epoch": 0.48, "learning_rate": 1.1270265192763854e-05, "loss": 2.2764, "step": 4748 }, { "epoch": 0.48, "learning_rate": 1.1267046301826435e-05, "loss": 2.3769, "step": 4749 }, { "epoch": 0.48, "learning_rate": 1.1263827277459536e-05, "loss": 2.3922, "step": 4750 }, { "epoch": 0.48, "learning_rate": 1.126060812000215e-05, "loss": 2.3116, "step": 4751 }, { "epoch": 0.48, "learning_rate": 1.1257388829793274e-05, "loss": 2.3079, "step": 4752 }, { "epoch": 0.48, "learning_rate": 1.1254169407171924e-05, "loss": 2.38, "step": 4753 }, { "epoch": 0.48, "learning_rate": 1.1250949852477126e-05, "loss": 2.3506, "step": 4754 }, { "epoch": 0.48, "learning_rate": 1.1247730166047932e-05, "loss": 2.3921, "step": 4755 }, { "epoch": 0.48, "learning_rate": 1.1244510348223394e-05, "loss": 2.4139, "step": 4756 }, { "epoch": 0.48, "learning_rate": 1.1241290399342583e-05, "loss": 2.225, "step": 4757 }, { "epoch": 0.48, "learning_rate": 1.1238070319744583e-05, "loss": 2.3096, "step": 4758 }, { "epoch": 0.48, "learning_rate": 1.1234850109768488e-05, "loss": 2.3593, "step": 4759 }, { "epoch": 0.48, "learning_rate": 1.123162976975342e-05, "loss": 2.426, "step": 4760 }, { "epoch": 0.48, "learning_rate": 1.1228409300038501e-05, "loss": 2.3492, "step": 4761 }, { "epoch": 0.48, "learning_rate": 1.122518870096287e-05, "loss": 2.4197, "step": 4762 }, { "epoch": 0.48, "learning_rate": 1.1221967972865677e-05, "loss": 2.3254, "step": 4763 }, { "epoch": 0.48, "learning_rate": 1.1218747116086094e-05, "loss": 2.4203, "step": 4764 }, { "epoch": 0.48, "learning_rate": 1.1215526130963302e-05, "loss": 2.3663, "step": 4765 }, { "epoch": 0.48, "learning_rate": 1.1212305017836491e-05, "loss": 2.3997, "step": 4766 }, { "epoch": 0.48, "learning_rate": 1.1209083777044869e-05, "loss": 2.2639, "step": 4767 }, { "epoch": 0.48, "learning_rate": 1.120586240892766e-05, "loss": 2.3929, "step": 4768 }, { "epoch": 0.48, "learning_rate": 1.1202640913824092e-05, "loss": 2.3603, "step": 4769 }, { "epoch": 0.48, "learning_rate": 1.1199419292073418e-05, "loss": 2.4079, "step": 4770 }, { "epoch": 0.48, "learning_rate": 1.1196197544014898e-05, "loss": 2.3018, "step": 4771 }, { "epoch": 0.48, "learning_rate": 1.1192975669987802e-05, "loss": 2.3589, "step": 4772 }, { "epoch": 0.48, "learning_rate": 1.1189753670331424e-05, "loss": 2.3964, "step": 4773 }, { "epoch": 0.48, "learning_rate": 1.1186531545385064e-05, "loss": 2.3903, "step": 4774 }, { "epoch": 0.48, "learning_rate": 1.1183309295488031e-05, "loss": 2.3839, "step": 4775 }, { "epoch": 0.48, "learning_rate": 1.1180086920979655e-05, "loss": 2.3817, "step": 4776 }, { "epoch": 0.48, "learning_rate": 1.1176864422199276e-05, "loss": 2.3927, "step": 4777 }, { "epoch": 0.48, "learning_rate": 1.1173641799486248e-05, "loss": 2.3938, "step": 4778 }, { "epoch": 0.48, "learning_rate": 1.1170419053179938e-05, "loss": 2.3686, "step": 4779 }, { "epoch": 0.48, "learning_rate": 1.1167196183619719e-05, "loss": 2.3759, "step": 4780 }, { "epoch": 0.48, "learning_rate": 1.116397319114499e-05, "loss": 2.359, "step": 4781 }, { "epoch": 0.48, "learning_rate": 1.1160750076095156e-05, "loss": 2.4431, "step": 4782 }, { "epoch": 0.48, "learning_rate": 1.1157526838809635e-05, "loss": 2.4265, "step": 4783 }, { "epoch": 0.48, "learning_rate": 1.1154303479627855e-05, "loss": 2.3613, "step": 4784 }, { "epoch": 0.48, "learning_rate": 1.115107999888926e-05, "loss": 2.2981, "step": 4785 }, { "epoch": 0.48, "learning_rate": 1.1147856396933312e-05, "loss": 2.444, "step": 4786 }, { "epoch": 0.48, "learning_rate": 1.1144632674099474e-05, "loss": 2.3859, "step": 4787 }, { "epoch": 0.48, "learning_rate": 1.1141408830727236e-05, "loss": 2.2179, "step": 4788 }, { "epoch": 0.48, "learning_rate": 1.1138184867156083e-05, "loss": 2.3681, "step": 4789 }, { "epoch": 0.48, "learning_rate": 1.1134960783725528e-05, "loss": 2.3583, "step": 4790 }, { "epoch": 0.48, "learning_rate": 1.1131736580775092e-05, "loss": 2.3306, "step": 4791 }, { "epoch": 0.48, "learning_rate": 1.1128512258644305e-05, "loss": 2.3796, "step": 4792 }, { "epoch": 0.48, "learning_rate": 1.1125287817672716e-05, "loss": 2.2631, "step": 4793 }, { "epoch": 0.48, "learning_rate": 1.1122063258199878e-05, "loss": 2.4202, "step": 4794 }, { "epoch": 0.48, "learning_rate": 1.1118838580565366e-05, "loss": 2.344, "step": 4795 }, { "epoch": 0.48, "learning_rate": 1.1115613785108758e-05, "loss": 2.3799, "step": 4796 }, { "epoch": 0.48, "learning_rate": 1.1112388872169652e-05, "loss": 2.3199, "step": 4797 }, { "epoch": 0.48, "learning_rate": 1.1109163842087658e-05, "loss": 2.3854, "step": 4798 }, { "epoch": 0.48, "learning_rate": 1.1105938695202392e-05, "loss": 2.3643, "step": 4799 }, { "epoch": 0.48, "learning_rate": 1.1102713431853487e-05, "loss": 2.3911, "step": 4800 }, { "epoch": 0.48, "learning_rate": 1.1099488052380587e-05, "loss": 2.4337, "step": 4801 }, { "epoch": 0.48, "learning_rate": 1.1096262557123351e-05, "loss": 2.3639, "step": 4802 }, { "epoch": 0.48, "learning_rate": 1.1093036946421442e-05, "loss": 2.4476, "step": 4803 }, { "epoch": 0.48, "learning_rate": 1.1089811220614548e-05, "loss": 2.3826, "step": 4804 }, { "epoch": 0.48, "learning_rate": 1.108658538004236e-05, "loss": 2.2756, "step": 4805 }, { "epoch": 0.48, "learning_rate": 1.1083359425044581e-05, "loss": 2.3844, "step": 4806 }, { "epoch": 0.48, "learning_rate": 1.1080133355960932e-05, "loss": 2.3587, "step": 4807 }, { "epoch": 0.48, "learning_rate": 1.1076907173131139e-05, "loss": 2.3807, "step": 4808 }, { "epoch": 0.48, "learning_rate": 1.1073680876894944e-05, "loss": 2.3602, "step": 4809 }, { "epoch": 0.48, "learning_rate": 1.10704544675921e-05, "loss": 2.3442, "step": 4810 }, { "epoch": 0.48, "learning_rate": 1.1067227945562373e-05, "loss": 2.4259, "step": 4811 }, { "epoch": 0.48, "learning_rate": 1.1064001311145538e-05, "loss": 2.3827, "step": 4812 }, { "epoch": 0.48, "learning_rate": 1.1060774564681385e-05, "loss": 2.2333, "step": 4813 }, { "epoch": 0.48, "learning_rate": 1.1057547706509718e-05, "loss": 2.3613, "step": 4814 }, { "epoch": 0.48, "learning_rate": 1.1054320736970343e-05, "loss": 2.315, "step": 4815 }, { "epoch": 0.48, "learning_rate": 1.105109365640309e-05, "loss": 2.4596, "step": 4816 }, { "epoch": 0.48, "learning_rate": 1.1047866465147789e-05, "loss": 2.4259, "step": 4817 }, { "epoch": 0.48, "learning_rate": 1.1044639163544292e-05, "loss": 2.2971, "step": 4818 }, { "epoch": 0.48, "learning_rate": 1.1041411751932458e-05, "loss": 2.3083, "step": 4819 }, { "epoch": 0.48, "learning_rate": 1.1038184230652159e-05, "loss": 2.3293, "step": 4820 }, { "epoch": 0.48, "learning_rate": 1.103495660004327e-05, "loss": 2.3417, "step": 4821 }, { "epoch": 0.48, "learning_rate": 1.103172886044569e-05, "loss": 2.3459, "step": 4822 }, { "epoch": 0.48, "learning_rate": 1.1028501012199321e-05, "loss": 2.3118, "step": 4823 }, { "epoch": 0.48, "learning_rate": 1.1025273055644088e-05, "loss": 2.3316, "step": 4824 }, { "epoch": 0.48, "learning_rate": 1.1022044991119908e-05, "loss": 2.291, "step": 4825 }, { "epoch": 0.48, "learning_rate": 1.1018816818966726e-05, "loss": 2.2792, "step": 4826 }, { "epoch": 0.48, "learning_rate": 1.1015588539524494e-05, "loss": 2.3385, "step": 4827 }, { "epoch": 0.48, "learning_rate": 1.1012360153133171e-05, "loss": 2.326, "step": 4828 }, { "epoch": 0.48, "learning_rate": 1.1009131660132733e-05, "loss": 2.3141, "step": 4829 }, { "epoch": 0.48, "learning_rate": 1.1005903060863162e-05, "loss": 2.2483, "step": 4830 }, { "epoch": 0.48, "learning_rate": 1.1002674355664455e-05, "loss": 2.4247, "step": 4831 }, { "epoch": 0.48, "learning_rate": 1.0999445544876618e-05, "loss": 2.3596, "step": 4832 }, { "epoch": 0.48, "learning_rate": 1.0996216628839671e-05, "loss": 2.363, "step": 4833 }, { "epoch": 0.48, "learning_rate": 1.0992987607893641e-05, "loss": 2.3541, "step": 4834 }, { "epoch": 0.48, "learning_rate": 1.0989758482378568e-05, "loss": 2.3702, "step": 4835 }, { "epoch": 0.48, "learning_rate": 1.0986529252634503e-05, "loss": 2.2968, "step": 4836 }, { "epoch": 0.48, "learning_rate": 1.0983299919001511e-05, "loss": 2.3086, "step": 4837 }, { "epoch": 0.48, "learning_rate": 1.0980070481819662e-05, "loss": 2.3132, "step": 4838 }, { "epoch": 0.48, "learning_rate": 1.097684094142904e-05, "loss": 2.3109, "step": 4839 }, { "epoch": 0.48, "learning_rate": 1.0973611298169746e-05, "loss": 2.4166, "step": 4840 }, { "epoch": 0.49, "learning_rate": 1.0970381552381876e-05, "loss": 2.3434, "step": 4841 }, { "epoch": 0.49, "learning_rate": 1.0967151704405553e-05, "loss": 2.4078, "step": 4842 }, { "epoch": 0.49, "learning_rate": 1.0963921754580901e-05, "loss": 2.3282, "step": 4843 }, { "epoch": 0.49, "learning_rate": 1.0960691703248058e-05, "loss": 2.3645, "step": 4844 }, { "epoch": 0.49, "learning_rate": 1.0957461550747176e-05, "loss": 2.3357, "step": 4845 }, { "epoch": 0.49, "learning_rate": 1.0954231297418414e-05, "loss": 2.3464, "step": 4846 }, { "epoch": 0.49, "learning_rate": 1.0951000943601938e-05, "loss": 2.3491, "step": 4847 }, { "epoch": 0.49, "learning_rate": 1.0947770489637927e-05, "loss": 2.3413, "step": 4848 }, { "epoch": 0.49, "learning_rate": 1.0944539935866578e-05, "loss": 2.3166, "step": 4849 }, { "epoch": 0.49, "learning_rate": 1.0941309282628092e-05, "loss": 2.3516, "step": 4850 }, { "epoch": 0.49, "learning_rate": 1.0938078530262677e-05, "loss": 2.3887, "step": 4851 }, { "epoch": 0.49, "learning_rate": 1.0934847679110559e-05, "loss": 2.3854, "step": 4852 }, { "epoch": 0.49, "learning_rate": 1.0931616729511967e-05, "loss": 2.3679, "step": 4853 }, { "epoch": 0.49, "learning_rate": 1.092838568180715e-05, "loss": 2.418, "step": 4854 }, { "epoch": 0.49, "learning_rate": 1.0925154536336355e-05, "loss": 2.3758, "step": 4855 }, { "epoch": 0.49, "learning_rate": 1.092192329343985e-05, "loss": 2.4458, "step": 4856 }, { "epoch": 0.49, "learning_rate": 1.0918691953457907e-05, "loss": 2.4191, "step": 4857 }, { "epoch": 0.49, "learning_rate": 1.0915460516730811e-05, "loss": 2.3737, "step": 4858 }, { "epoch": 0.49, "learning_rate": 1.091222898359886e-05, "loss": 2.242, "step": 4859 }, { "epoch": 0.49, "learning_rate": 1.0908997354402355e-05, "loss": 2.3816, "step": 4860 }, { "epoch": 0.49, "learning_rate": 1.090576562948161e-05, "loss": 2.3493, "step": 4861 }, { "epoch": 0.49, "learning_rate": 1.0902533809176952e-05, "loss": 2.3635, "step": 4862 }, { "epoch": 0.49, "learning_rate": 1.0899301893828716e-05, "loss": 2.3827, "step": 4863 }, { "epoch": 0.49, "learning_rate": 1.0896069883777246e-05, "loss": 2.3521, "step": 4864 }, { "epoch": 0.49, "learning_rate": 1.0892837779362895e-05, "loss": 2.4095, "step": 4865 }, { "epoch": 0.49, "learning_rate": 1.0889605580926031e-05, "loss": 2.3729, "step": 4866 }, { "epoch": 0.49, "learning_rate": 1.0886373288807026e-05, "loss": 2.3434, "step": 4867 }, { "epoch": 0.49, "learning_rate": 1.0883140903346268e-05, "loss": 2.4456, "step": 4868 }, { "epoch": 0.49, "learning_rate": 1.087990842488415e-05, "loss": 2.3449, "step": 4869 }, { "epoch": 0.49, "learning_rate": 1.0876675853761074e-05, "loss": 2.4055, "step": 4870 }, { "epoch": 0.49, "learning_rate": 1.0873443190317457e-05, "loss": 2.3364, "step": 4871 }, { "epoch": 0.49, "learning_rate": 1.0870210434893724e-05, "loss": 2.4436, "step": 4872 }, { "epoch": 0.49, "learning_rate": 1.0866977587830303e-05, "loss": 2.4221, "step": 4873 }, { "epoch": 0.49, "learning_rate": 1.086374464946764e-05, "loss": 2.3745, "step": 4874 }, { "epoch": 0.49, "learning_rate": 1.0860511620146188e-05, "loss": 2.3529, "step": 4875 }, { "epoch": 0.49, "learning_rate": 1.0857278500206408e-05, "loss": 2.3841, "step": 4876 }, { "epoch": 0.49, "learning_rate": 1.0854045289988775e-05, "loss": 2.4032, "step": 4877 }, { "epoch": 0.49, "learning_rate": 1.0850811989833767e-05, "loss": 2.3583, "step": 4878 }, { "epoch": 0.49, "learning_rate": 1.0847578600081871e-05, "loss": 2.4265, "step": 4879 }, { "epoch": 0.49, "learning_rate": 1.0844345121073599e-05, "loss": 2.3806, "step": 4880 }, { "epoch": 0.49, "learning_rate": 1.084111155314945e-05, "loss": 2.276, "step": 4881 }, { "epoch": 0.49, "learning_rate": 1.0837877896649947e-05, "loss": 2.4153, "step": 4882 }, { "epoch": 0.49, "learning_rate": 1.0834644151915617e-05, "loss": 2.3822, "step": 4883 }, { "epoch": 0.49, "learning_rate": 1.0831410319287e-05, "loss": 2.344, "step": 4884 }, { "epoch": 0.49, "learning_rate": 1.082817639910464e-05, "loss": 2.2987, "step": 4885 }, { "epoch": 0.49, "learning_rate": 1.0824942391709094e-05, "loss": 2.3836, "step": 4886 }, { "epoch": 0.49, "learning_rate": 1.0821708297440927e-05, "loss": 2.2782, "step": 4887 }, { "epoch": 0.49, "learning_rate": 1.0818474116640713e-05, "loss": 2.3029, "step": 4888 }, { "epoch": 0.49, "learning_rate": 1.0815239849649037e-05, "loss": 2.3178, "step": 4889 }, { "epoch": 0.49, "learning_rate": 1.0812005496806492e-05, "loss": 2.3392, "step": 4890 }, { "epoch": 0.49, "learning_rate": 1.0808771058453677e-05, "loss": 2.3944, "step": 4891 }, { "epoch": 0.49, "learning_rate": 1.0805536534931207e-05, "loss": 2.4164, "step": 4892 }, { "epoch": 0.49, "learning_rate": 1.0802301926579694e-05, "loss": 2.4037, "step": 4893 }, { "epoch": 0.49, "learning_rate": 1.0799067233739775e-05, "loss": 2.2892, "step": 4894 }, { "epoch": 0.49, "learning_rate": 1.0795832456752081e-05, "loss": 2.4262, "step": 4895 }, { "epoch": 0.49, "learning_rate": 1.0792597595957263e-05, "loss": 2.3747, "step": 4896 }, { "epoch": 0.49, "learning_rate": 1.0789362651695972e-05, "loss": 2.3015, "step": 4897 }, { "epoch": 0.49, "learning_rate": 1.0786127624308875e-05, "loss": 2.3353, "step": 4898 }, { "epoch": 0.49, "learning_rate": 1.0782892514136642e-05, "loss": 2.3526, "step": 4899 }, { "epoch": 0.49, "learning_rate": 1.0779657321519958e-05, "loss": 2.3767, "step": 4900 }, { "epoch": 0.49, "learning_rate": 1.0776422046799511e-05, "loss": 2.3192, "step": 4901 }, { "epoch": 0.49, "learning_rate": 1.0773186690315996e-05, "loss": 2.3205, "step": 4902 }, { "epoch": 0.49, "learning_rate": 1.0769951252410127e-05, "loss": 2.3293, "step": 4903 }, { "epoch": 0.49, "learning_rate": 1.0766715733422616e-05, "loss": 2.3255, "step": 4904 }, { "epoch": 0.49, "learning_rate": 1.0763480133694188e-05, "loss": 2.3862, "step": 4905 }, { "epoch": 0.49, "learning_rate": 1.0760244453565577e-05, "loss": 2.4087, "step": 4906 }, { "epoch": 0.49, "learning_rate": 1.0757008693377522e-05, "loss": 2.4224, "step": 4907 }, { "epoch": 0.49, "learning_rate": 1.0753772853470776e-05, "loss": 2.4163, "step": 4908 }, { "epoch": 0.49, "learning_rate": 1.0750536934186093e-05, "loss": 2.2886, "step": 4909 }, { "epoch": 0.49, "learning_rate": 1.0747300935864245e-05, "loss": 2.3407, "step": 4910 }, { "epoch": 0.49, "learning_rate": 1.0744064858846e-05, "loss": 2.4034, "step": 4911 }, { "epoch": 0.49, "learning_rate": 1.0740828703472147e-05, "loss": 2.3279, "step": 4912 }, { "epoch": 0.49, "learning_rate": 1.0737592470083477e-05, "loss": 2.2918, "step": 4913 }, { "epoch": 0.49, "learning_rate": 1.073435615902079e-05, "loss": 2.3274, "step": 4914 }, { "epoch": 0.49, "learning_rate": 1.0731119770624887e-05, "loss": 2.378, "step": 4915 }, { "epoch": 0.49, "learning_rate": 1.0727883305236593e-05, "loss": 2.3019, "step": 4916 }, { "epoch": 0.49, "learning_rate": 1.0724646763196726e-05, "loss": 2.2954, "step": 4917 }, { "epoch": 0.49, "learning_rate": 1.072141014484612e-05, "loss": 2.4473, "step": 4918 }, { "epoch": 0.49, "learning_rate": 1.0718173450525618e-05, "loss": 2.3738, "step": 4919 }, { "epoch": 0.49, "learning_rate": 1.0714936680576062e-05, "loss": 2.3989, "step": 4920 }, { "epoch": 0.49, "learning_rate": 1.0711699835338314e-05, "loss": 2.323, "step": 4921 }, { "epoch": 0.49, "learning_rate": 1.0708462915153234e-05, "loss": 2.4458, "step": 4922 }, { "epoch": 0.49, "learning_rate": 1.07052259203617e-05, "loss": 2.1803, "step": 4923 }, { "epoch": 0.49, "learning_rate": 1.0701988851304583e-05, "loss": 2.394, "step": 4924 }, { "epoch": 0.49, "learning_rate": 1.0698751708322779e-05, "loss": 2.3201, "step": 4925 }, { "epoch": 0.49, "learning_rate": 1.0695514491757178e-05, "loss": 2.3766, "step": 4926 }, { "epoch": 0.49, "learning_rate": 1.0692277201948684e-05, "loss": 2.3075, "step": 4927 }, { "epoch": 0.49, "learning_rate": 1.0689039839238208e-05, "loss": 2.263, "step": 4928 }, { "epoch": 0.49, "learning_rate": 1.068580240396667e-05, "loss": 2.399, "step": 4929 }, { "epoch": 0.49, "learning_rate": 1.0682564896474995e-05, "loss": 2.345, "step": 4930 }, { "epoch": 0.49, "learning_rate": 1.0679327317104123e-05, "loss": 2.3604, "step": 4931 }, { "epoch": 0.49, "learning_rate": 1.0676089666194985e-05, "loss": 2.3133, "step": 4932 }, { "epoch": 0.49, "learning_rate": 1.0672851944088532e-05, "loss": 2.2862, "step": 4933 }, { "epoch": 0.49, "learning_rate": 1.0669614151125726e-05, "loss": 2.3593, "step": 4934 }, { "epoch": 0.49, "learning_rate": 1.0666376287647531e-05, "loss": 2.2658, "step": 4935 }, { "epoch": 0.49, "learning_rate": 1.0663138353994915e-05, "loss": 2.3875, "step": 4936 }, { "epoch": 0.49, "learning_rate": 1.0659900350508852e-05, "loss": 2.3941, "step": 4937 }, { "epoch": 0.49, "learning_rate": 1.0656662277530337e-05, "loss": 2.346, "step": 4938 }, { "epoch": 0.49, "learning_rate": 1.0653424135400359e-05, "loss": 2.3651, "step": 4939 }, { "epoch": 0.49, "learning_rate": 1.0650185924459916e-05, "loss": 2.2708, "step": 4940 }, { "epoch": 0.5, "learning_rate": 1.0646947645050023e-05, "loss": 2.3127, "step": 4941 }, { "epoch": 0.5, "learning_rate": 1.0643709297511689e-05, "loss": 2.3235, "step": 4942 }, { "epoch": 0.5, "learning_rate": 1.0640470882185938e-05, "loss": 2.3819, "step": 4943 }, { "epoch": 0.5, "learning_rate": 1.06372323994138e-05, "loss": 2.3821, "step": 4944 }, { "epoch": 0.5, "learning_rate": 1.0633993849536312e-05, "loss": 2.4776, "step": 4945 }, { "epoch": 0.5, "learning_rate": 1.0630755232894518e-05, "loss": 2.4286, "step": 4946 }, { "epoch": 0.5, "learning_rate": 1.0627516549829466e-05, "loss": 2.3639, "step": 4947 }, { "epoch": 0.5, "learning_rate": 1.0624277800682216e-05, "loss": 2.311, "step": 4948 }, { "epoch": 0.5, "learning_rate": 1.0621038985793832e-05, "loss": 2.3017, "step": 4949 }, { "epoch": 0.5, "learning_rate": 1.0617800105505384e-05, "loss": 2.3968, "step": 4950 }, { "epoch": 0.5, "learning_rate": 1.061456116015795e-05, "loss": 2.3576, "step": 4951 }, { "epoch": 0.5, "learning_rate": 1.061132215009262e-05, "loss": 2.3468, "step": 4952 }, { "epoch": 0.5, "learning_rate": 1.0608083075650482e-05, "loss": 2.3724, "step": 4953 }, { "epoch": 0.5, "learning_rate": 1.0604843937172635e-05, "loss": 2.2632, "step": 4954 }, { "epoch": 0.5, "learning_rate": 1.0601604735000187e-05, "loss": 2.3923, "step": 4955 }, { "epoch": 0.5, "learning_rate": 1.0598365469474246e-05, "loss": 2.3076, "step": 4956 }, { "epoch": 0.5, "learning_rate": 1.0595126140935936e-05, "loss": 2.3085, "step": 4957 }, { "epoch": 0.5, "learning_rate": 1.059188674972638e-05, "loss": 2.3385, "step": 4958 }, { "epoch": 0.5, "learning_rate": 1.0588647296186709e-05, "loss": 2.3416, "step": 4959 }, { "epoch": 0.5, "learning_rate": 1.0585407780658061e-05, "loss": 2.2537, "step": 4960 }, { "epoch": 0.5, "learning_rate": 1.0582168203481586e-05, "loss": 2.3612, "step": 4961 }, { "epoch": 0.5, "learning_rate": 1.0578928564998431e-05, "loss": 2.2711, "step": 4962 }, { "epoch": 0.5, "learning_rate": 1.057568886554976e-05, "loss": 2.3211, "step": 4963 }, { "epoch": 0.5, "learning_rate": 1.057244910547673e-05, "loss": 2.3478, "step": 4964 }, { "epoch": 0.5, "learning_rate": 1.056920928512052e-05, "loss": 2.3997, "step": 4965 }, { "epoch": 0.5, "learning_rate": 1.0565969404822301e-05, "loss": 2.2611, "step": 4966 }, { "epoch": 0.5, "learning_rate": 1.0562729464923263e-05, "loss": 2.3436, "step": 4967 }, { "epoch": 0.5, "learning_rate": 1.0559489465764588e-05, "loss": 2.3164, "step": 4968 }, { "epoch": 0.5, "learning_rate": 1.0556249407687476e-05, "loss": 2.3778, "step": 4969 }, { "epoch": 0.5, "learning_rate": 1.055300929103313e-05, "loss": 2.325, "step": 4970 }, { "epoch": 0.5, "learning_rate": 1.0549769116142758e-05, "loss": 2.39, "step": 4971 }, { "epoch": 0.5, "learning_rate": 1.0546528883357577e-05, "loss": 2.4028, "step": 4972 }, { "epoch": 0.5, "learning_rate": 1.0543288593018803e-05, "loss": 2.4407, "step": 4973 }, { "epoch": 0.5, "learning_rate": 1.0540048245467667e-05, "loss": 2.3301, "step": 4974 }, { "epoch": 0.5, "learning_rate": 1.0536807841045401e-05, "loss": 2.3321, "step": 4975 }, { "epoch": 0.5, "learning_rate": 1.0533567380093243e-05, "loss": 2.3889, "step": 4976 }, { "epoch": 0.5, "learning_rate": 1.053032686295244e-05, "loss": 2.4163, "step": 4977 }, { "epoch": 0.5, "learning_rate": 1.0527086289964241e-05, "loss": 2.346, "step": 4978 }, { "epoch": 0.5, "learning_rate": 1.0523845661469903e-05, "loss": 2.2526, "step": 4979 }, { "epoch": 0.5, "learning_rate": 1.0520604977810684e-05, "loss": 2.3458, "step": 4980 }, { "epoch": 0.5, "learning_rate": 1.051736423932786e-05, "loss": 2.3155, "step": 4981 }, { "epoch": 0.5, "learning_rate": 1.05141234463627e-05, "loss": 2.3624, "step": 4982 }, { "epoch": 0.5, "learning_rate": 1.0510882599256486e-05, "loss": 2.4032, "step": 4983 }, { "epoch": 0.5, "learning_rate": 1.0507641698350504e-05, "loss": 2.3224, "step": 4984 }, { "epoch": 0.5, "learning_rate": 1.0504400743986043e-05, "loss": 2.3305, "step": 4985 }, { "epoch": 0.5, "learning_rate": 1.05011597365044e-05, "loss": 2.4179, "step": 4986 }, { "epoch": 0.5, "learning_rate": 1.0497918676246879e-05, "loss": 2.4158, "step": 4987 }, { "epoch": 0.5, "learning_rate": 1.0494677563554788e-05, "loss": 2.3946, "step": 4988 }, { "epoch": 0.5, "learning_rate": 1.049143639876944e-05, "loss": 2.3399, "step": 4989 }, { "epoch": 0.5, "learning_rate": 1.0488195182232153e-05, "loss": 2.4429, "step": 4990 }, { "epoch": 0.5, "learning_rate": 1.0484953914284248e-05, "loss": 2.2946, "step": 4991 }, { "epoch": 0.5, "learning_rate": 1.0481712595267062e-05, "loss": 2.4308, "step": 4992 }, { "epoch": 0.5, "learning_rate": 1.047847122552193e-05, "loss": 2.4052, "step": 4993 }, { "epoch": 0.5, "learning_rate": 1.0475229805390185e-05, "loss": 2.4818, "step": 4994 }, { "epoch": 0.5, "learning_rate": 1.0471988335213178e-05, "loss": 2.1939, "step": 4995 }, { "epoch": 0.5, "learning_rate": 1.0468746815332261e-05, "loss": 2.2969, "step": 4996 }, { "epoch": 0.5, "learning_rate": 1.0465505246088789e-05, "loss": 2.4513, "step": 4997 }, { "epoch": 0.5, "learning_rate": 1.0462263627824122e-05, "loss": 2.3596, "step": 4998 }, { "epoch": 0.5, "learning_rate": 1.0459021960879634e-05, "loss": 2.4065, "step": 4999 }, { "epoch": 0.5, "learning_rate": 1.0455780245596682e-05, "loss": 2.317, "step": 5000 }, { "epoch": 0.5, "learning_rate": 1.0452538482316658e-05, "loss": 2.425, "step": 5001 }, { "epoch": 0.5, "learning_rate": 1.0449296671380937e-05, "loss": 2.4238, "step": 5002 }, { "epoch": 0.5, "learning_rate": 1.0446054813130907e-05, "loss": 2.3616, "step": 5003 }, { "epoch": 0.5, "learning_rate": 1.044281290790796e-05, "loss": 2.2788, "step": 5004 }, { "epoch": 0.5, "learning_rate": 1.043957095605349e-05, "loss": 2.4282, "step": 5005 }, { "epoch": 0.5, "learning_rate": 1.0436328957908903e-05, "loss": 2.3305, "step": 5006 }, { "epoch": 0.5, "learning_rate": 1.0433086913815605e-05, "loss": 2.3955, "step": 5007 }, { "epoch": 0.5, "learning_rate": 1.0429844824115007e-05, "loss": 2.3555, "step": 5008 }, { "epoch": 0.5, "learning_rate": 1.0426602689148527e-05, "loss": 2.2693, "step": 5009 }, { "epoch": 0.5, "learning_rate": 1.0423360509257583e-05, "loss": 2.3744, "step": 5010 }, { "epoch": 0.5, "learning_rate": 1.0420118284783603e-05, "loss": 2.3458, "step": 5011 }, { "epoch": 0.5, "learning_rate": 1.0416876016068016e-05, "loss": 2.296, "step": 5012 }, { "epoch": 0.5, "learning_rate": 1.0413633703452257e-05, "loss": 2.3531, "step": 5013 }, { "epoch": 0.5, "learning_rate": 1.0410391347277767e-05, "loss": 2.3811, "step": 5014 }, { "epoch": 0.5, "learning_rate": 1.0407148947885993e-05, "loss": 2.3224, "step": 5015 }, { "epoch": 0.5, "learning_rate": 1.0403906505618378e-05, "loss": 2.3121, "step": 5016 }, { "epoch": 0.5, "learning_rate": 1.040066402081638e-05, "loss": 2.4869, "step": 5017 }, { "epoch": 0.5, "learning_rate": 1.0397421493821456e-05, "loss": 2.4012, "step": 5018 }, { "epoch": 0.5, "learning_rate": 1.0394178924975068e-05, "loss": 2.2948, "step": 5019 }, { "epoch": 0.5, "learning_rate": 1.0390936314618685e-05, "loss": 2.3637, "step": 5020 }, { "epoch": 0.5, "learning_rate": 1.0387693663093776e-05, "loss": 2.4356, "step": 5021 }, { "epoch": 0.5, "learning_rate": 1.0384450970741813e-05, "loss": 2.3111, "step": 5022 }, { "epoch": 0.5, "learning_rate": 1.038120823790428e-05, "loss": 2.3735, "step": 5023 }, { "epoch": 0.5, "learning_rate": 1.0377965464922663e-05, "loss": 2.2934, "step": 5024 }, { "epoch": 0.5, "learning_rate": 1.037472265213845e-05, "loss": 2.4055, "step": 5025 }, { "epoch": 0.5, "learning_rate": 1.0371479799893129e-05, "loss": 2.2709, "step": 5026 }, { "epoch": 0.5, "learning_rate": 1.0368236908528195e-05, "loss": 2.4056, "step": 5027 }, { "epoch": 0.5, "learning_rate": 1.0364993978385158e-05, "loss": 2.326, "step": 5028 }, { "epoch": 0.5, "learning_rate": 1.0361751009805517e-05, "loss": 2.3696, "step": 5029 }, { "epoch": 0.5, "learning_rate": 1.035850800313078e-05, "loss": 2.273, "step": 5030 }, { "epoch": 0.5, "learning_rate": 1.0355264958702465e-05, "loss": 2.3107, "step": 5031 }, { "epoch": 0.5, "learning_rate": 1.0352021876862084e-05, "loss": 2.3843, "step": 5032 }, { "epoch": 0.5, "learning_rate": 1.034877875795116e-05, "loss": 2.389, "step": 5033 }, { "epoch": 0.5, "learning_rate": 1.0345535602311214e-05, "loss": 2.3343, "step": 5034 }, { "epoch": 0.5, "learning_rate": 1.0342292410283778e-05, "loss": 2.3386, "step": 5035 }, { "epoch": 0.5, "learning_rate": 1.0339049182210386e-05, "loss": 2.3586, "step": 5036 }, { "epoch": 0.5, "learning_rate": 1.033580591843257e-05, "loss": 2.3058, "step": 5037 }, { "epoch": 0.5, "learning_rate": 1.0332562619291876e-05, "loss": 2.3992, "step": 5038 }, { "epoch": 0.5, "learning_rate": 1.0329319285129842e-05, "loss": 2.3691, "step": 5039 }, { "epoch": 0.5, "learning_rate": 1.0326075916288019e-05, "loss": 2.3386, "step": 5040 }, { "epoch": 0.51, "learning_rate": 1.0322832513107955e-05, "loss": 2.3453, "step": 5041 }, { "epoch": 0.51, "learning_rate": 1.0319589075931207e-05, "loss": 2.3227, "step": 5042 }, { "epoch": 0.51, "learning_rate": 1.0316345605099332e-05, "loss": 2.303, "step": 5043 }, { "epoch": 0.51, "learning_rate": 1.0313102100953893e-05, "loss": 2.3371, "step": 5044 }, { "epoch": 0.51, "learning_rate": 1.0309858563836453e-05, "loss": 2.3308, "step": 5045 }, { "epoch": 0.51, "learning_rate": 1.0306614994088582e-05, "loss": 2.3704, "step": 5046 }, { "epoch": 0.51, "learning_rate": 1.0303371392051855e-05, "loss": 2.3707, "step": 5047 }, { "epoch": 0.51, "learning_rate": 1.0300127758067844e-05, "loss": 2.3316, "step": 5048 }, { "epoch": 0.51, "learning_rate": 1.0296884092478128e-05, "loss": 2.4368, "step": 5049 }, { "epoch": 0.51, "learning_rate": 1.0293640395624292e-05, "loss": 2.334, "step": 5050 }, { "epoch": 0.51, "learning_rate": 1.0290396667847921e-05, "loss": 2.3828, "step": 5051 }, { "epoch": 0.51, "learning_rate": 1.0287152909490603e-05, "loss": 2.3454, "step": 5052 }, { "epoch": 0.51, "learning_rate": 1.0283909120893929e-05, "loss": 2.3193, "step": 5053 }, { "epoch": 0.51, "learning_rate": 1.0280665302399496e-05, "loss": 2.3579, "step": 5054 }, { "epoch": 0.51, "learning_rate": 1.02774214543489e-05, "loss": 2.3609, "step": 5055 }, { "epoch": 0.51, "learning_rate": 1.0274177577083746e-05, "loss": 2.3785, "step": 5056 }, { "epoch": 0.51, "learning_rate": 1.0270933670945635e-05, "loss": 2.3426, "step": 5057 }, { "epoch": 0.51, "learning_rate": 1.0267689736276176e-05, "loss": 2.3828, "step": 5058 }, { "epoch": 0.51, "learning_rate": 1.0264445773416984e-05, "loss": 2.3419, "step": 5059 }, { "epoch": 0.51, "learning_rate": 1.0261201782709667e-05, "loss": 2.2617, "step": 5060 }, { "epoch": 0.51, "learning_rate": 1.0257957764495842e-05, "loss": 2.3199, "step": 5061 }, { "epoch": 0.51, "learning_rate": 1.0254713719117133e-05, "loss": 2.2457, "step": 5062 }, { "epoch": 0.51, "learning_rate": 1.0251469646915158e-05, "loss": 2.3471, "step": 5063 }, { "epoch": 0.51, "learning_rate": 1.0248225548231543e-05, "loss": 2.3398, "step": 5064 }, { "epoch": 0.51, "learning_rate": 1.0244981423407915e-05, "loss": 2.329, "step": 5065 }, { "epoch": 0.51, "learning_rate": 1.0241737272785907e-05, "loss": 2.3384, "step": 5066 }, { "epoch": 0.51, "learning_rate": 1.0238493096707149e-05, "loss": 2.3454, "step": 5067 }, { "epoch": 0.51, "learning_rate": 1.023524889551328e-05, "loss": 2.3958, "step": 5068 }, { "epoch": 0.51, "learning_rate": 1.023200466954594e-05, "loss": 2.2763, "step": 5069 }, { "epoch": 0.51, "learning_rate": 1.0228760419146768e-05, "loss": 2.4299, "step": 5070 }, { "epoch": 0.51, "learning_rate": 1.0225516144657408e-05, "loss": 2.3574, "step": 5071 }, { "epoch": 0.51, "learning_rate": 1.0222271846419507e-05, "loss": 2.3885, "step": 5072 }, { "epoch": 0.51, "learning_rate": 1.0219027524774714e-05, "loss": 2.3127, "step": 5073 }, { "epoch": 0.51, "learning_rate": 1.0215783180064678e-05, "loss": 2.3615, "step": 5074 }, { "epoch": 0.51, "learning_rate": 1.0212538812631056e-05, "loss": 2.2832, "step": 5075 }, { "epoch": 0.51, "learning_rate": 1.02092944228155e-05, "loss": 2.3512, "step": 5076 }, { "epoch": 0.51, "learning_rate": 1.0206050010959677e-05, "loss": 2.427, "step": 5077 }, { "epoch": 0.51, "learning_rate": 1.0202805577405239e-05, "loss": 2.3634, "step": 5078 }, { "epoch": 0.51, "learning_rate": 1.0199561122493852e-05, "loss": 2.317, "step": 5079 }, { "epoch": 0.51, "learning_rate": 1.0196316646567186e-05, "loss": 2.3123, "step": 5080 }, { "epoch": 0.51, "learning_rate": 1.0193072149966901e-05, "loss": 2.4483, "step": 5081 }, { "epoch": 0.51, "learning_rate": 1.0189827633034672e-05, "loss": 2.3799, "step": 5082 }, { "epoch": 0.51, "learning_rate": 1.0186583096112173e-05, "loss": 2.3192, "step": 5083 }, { "epoch": 0.51, "learning_rate": 1.0183338539541072e-05, "loss": 2.3579, "step": 5084 }, { "epoch": 0.51, "learning_rate": 1.0180093963663045e-05, "loss": 2.3152, "step": 5085 }, { "epoch": 0.51, "learning_rate": 1.0176849368819776e-05, "loss": 2.3681, "step": 5086 }, { "epoch": 0.51, "learning_rate": 1.0173604755352942e-05, "loss": 2.353, "step": 5087 }, { "epoch": 0.51, "learning_rate": 1.0170360123604224e-05, "loss": 2.4513, "step": 5088 }, { "epoch": 0.51, "learning_rate": 1.016711547391531e-05, "loss": 2.3338, "step": 5089 }, { "epoch": 0.51, "learning_rate": 1.0163870806627877e-05, "loss": 2.44, "step": 5090 }, { "epoch": 0.51, "learning_rate": 1.0160626122083626e-05, "loss": 2.3353, "step": 5091 }, { "epoch": 0.51, "learning_rate": 1.0157381420624237e-05, "loss": 2.2287, "step": 5092 }, { "epoch": 0.51, "learning_rate": 1.0154136702591404e-05, "loss": 2.4681, "step": 5093 }, { "epoch": 0.51, "learning_rate": 1.0150891968326822e-05, "loss": 2.3087, "step": 5094 }, { "epoch": 0.51, "learning_rate": 1.0147647218172183e-05, "loss": 2.4264, "step": 5095 }, { "epoch": 0.51, "learning_rate": 1.0144402452469184e-05, "loss": 2.3537, "step": 5096 }, { "epoch": 0.51, "learning_rate": 1.0141157671559524e-05, "loss": 2.4202, "step": 5097 }, { "epoch": 0.51, "learning_rate": 1.0137912875784902e-05, "loss": 2.4228, "step": 5098 }, { "epoch": 0.51, "learning_rate": 1.0134668065487021e-05, "loss": 2.3095, "step": 5099 }, { "epoch": 0.51, "learning_rate": 1.0131423241007581e-05, "loss": 2.3498, "step": 5100 }, { "epoch": 0.51, "learning_rate": 1.0128178402688291e-05, "loss": 2.3256, "step": 5101 }, { "epoch": 0.51, "learning_rate": 1.0124933550870853e-05, "loss": 2.3967, "step": 5102 }, { "epoch": 0.51, "learning_rate": 1.0121688685896973e-05, "loss": 2.3638, "step": 5103 }, { "epoch": 0.51, "learning_rate": 1.0118443808108365e-05, "loss": 2.5224, "step": 5104 }, { "epoch": 0.51, "learning_rate": 1.0115198917846733e-05, "loss": 2.3564, "step": 5105 }, { "epoch": 0.51, "learning_rate": 1.0111954015453792e-05, "loss": 2.3849, "step": 5106 }, { "epoch": 0.51, "learning_rate": 1.0108709101271252e-05, "loss": 2.3696, "step": 5107 }, { "epoch": 0.51, "learning_rate": 1.0105464175640828e-05, "loss": 2.3352, "step": 5108 }, { "epoch": 0.51, "learning_rate": 1.0102219238904238e-05, "loss": 2.3765, "step": 5109 }, { "epoch": 0.51, "learning_rate": 1.0098974291403196e-05, "loss": 2.3146, "step": 5110 }, { "epoch": 0.51, "learning_rate": 1.0095729333479417e-05, "loss": 2.2825, "step": 5111 }, { "epoch": 0.51, "learning_rate": 1.0092484365474622e-05, "loss": 2.4185, "step": 5112 }, { "epoch": 0.51, "learning_rate": 1.008923938773053e-05, "loss": 2.4045, "step": 5113 }, { "epoch": 0.51, "learning_rate": 1.0085994400588859e-05, "loss": 2.4236, "step": 5114 }, { "epoch": 0.51, "learning_rate": 1.0082749404391337e-05, "loss": 2.3902, "step": 5115 }, { "epoch": 0.51, "learning_rate": 1.0079504399479677e-05, "loss": 2.2986, "step": 5116 }, { "epoch": 0.51, "learning_rate": 1.007625938619561e-05, "loss": 2.3479, "step": 5117 }, { "epoch": 0.51, "learning_rate": 1.007301436488086e-05, "loss": 2.388, "step": 5118 }, { "epoch": 0.51, "learning_rate": 1.0069769335877146e-05, "loss": 2.3723, "step": 5119 }, { "epoch": 0.51, "learning_rate": 1.0066524299526202e-05, "loss": 2.4473, "step": 5120 }, { "epoch": 0.51, "learning_rate": 1.0063279256169745e-05, "loss": 2.3548, "step": 5121 }, { "epoch": 0.51, "learning_rate": 1.006003420614951e-05, "loss": 2.4165, "step": 5122 }, { "epoch": 0.51, "learning_rate": 1.0056789149807223e-05, "loss": 2.3379, "step": 5123 }, { "epoch": 0.51, "learning_rate": 1.0053544087484612e-05, "loss": 2.4244, "step": 5124 }, { "epoch": 0.51, "learning_rate": 1.0050299019523408e-05, "loss": 2.3682, "step": 5125 }, { "epoch": 0.51, "learning_rate": 1.0047053946265341e-05, "loss": 2.3588, "step": 5126 }, { "epoch": 0.51, "learning_rate": 1.004380886805214e-05, "loss": 2.3971, "step": 5127 }, { "epoch": 0.51, "learning_rate": 1.0040563785225536e-05, "loss": 2.401, "step": 5128 }, { "epoch": 0.51, "learning_rate": 1.0037318698127261e-05, "loss": 2.2707, "step": 5129 }, { "epoch": 0.51, "learning_rate": 1.0034073607099046e-05, "loss": 2.4564, "step": 5130 }, { "epoch": 0.51, "learning_rate": 1.0030828512482627e-05, "loss": 2.3312, "step": 5131 }, { "epoch": 0.51, "learning_rate": 1.0027583414619733e-05, "loss": 2.4137, "step": 5132 }, { "epoch": 0.51, "learning_rate": 1.00243383138521e-05, "loss": 2.295, "step": 5133 }, { "epoch": 0.51, "learning_rate": 1.0021093210521457e-05, "loss": 2.4138, "step": 5134 }, { "epoch": 0.51, "learning_rate": 1.0017848104969544e-05, "loss": 2.1811, "step": 5135 }, { "epoch": 0.51, "learning_rate": 1.0014602997538092e-05, "loss": 2.4042, "step": 5136 }, { "epoch": 0.51, "learning_rate": 1.0011357888568834e-05, "loss": 2.3065, "step": 5137 }, { "epoch": 0.51, "learning_rate": 1.0008112778403505e-05, "loss": 2.3968, "step": 5138 }, { "epoch": 0.51, "learning_rate": 1.0004867667383837e-05, "loss": 2.2978, "step": 5139 }, { "epoch": 0.51, "learning_rate": 1.000162255585157e-05, "loss": 2.4038, "step": 5140 }, { "epoch": 0.52, "learning_rate": 9.998377444148434e-06, "loss": 2.3014, "step": 5141 }, { "epoch": 0.52, "learning_rate": 9.995132332616167e-06, "loss": 2.4049, "step": 5142 }, { "epoch": 0.52, "learning_rate": 9.991887221596502e-06, "loss": 2.3604, "step": 5143 }, { "epoch": 0.52, "learning_rate": 9.988642111431171e-06, "loss": 2.4503, "step": 5144 }, { "epoch": 0.52, "learning_rate": 9.985397002461911e-06, "loss": 2.3726, "step": 5145 }, { "epoch": 0.52, "learning_rate": 9.982151895030457e-06, "loss": 2.3708, "step": 5146 }, { "epoch": 0.52, "learning_rate": 9.978906789478544e-06, "loss": 2.3414, "step": 5147 }, { "epoch": 0.52, "learning_rate": 9.975661686147904e-06, "loss": 2.431, "step": 5148 }, { "epoch": 0.52, "learning_rate": 9.97241658538027e-06, "loss": 2.3789, "step": 5149 }, { "epoch": 0.52, "learning_rate": 9.969171487517377e-06, "loss": 2.36, "step": 5150 }, { "epoch": 0.52, "learning_rate": 9.965926392900956e-06, "loss": 2.3461, "step": 5151 }, { "epoch": 0.52, "learning_rate": 9.962681301872742e-06, "loss": 2.3598, "step": 5152 }, { "epoch": 0.52, "learning_rate": 9.959436214774469e-06, "loss": 2.3872, "step": 5153 }, { "epoch": 0.52, "learning_rate": 9.956191131947862e-06, "loss": 2.2613, "step": 5154 }, { "epoch": 0.52, "learning_rate": 9.952946053734662e-06, "loss": 2.3782, "step": 5155 }, { "epoch": 0.52, "learning_rate": 9.949700980476594e-06, "loss": 2.3506, "step": 5156 }, { "epoch": 0.52, "learning_rate": 9.94645591251539e-06, "loss": 2.2531, "step": 5157 }, { "epoch": 0.52, "learning_rate": 9.94321085019278e-06, "loss": 2.3647, "step": 5158 }, { "epoch": 0.52, "learning_rate": 9.939965793850494e-06, "loss": 2.3983, "step": 5159 }, { "epoch": 0.52, "learning_rate": 9.936720743830259e-06, "loss": 2.3429, "step": 5160 }, { "epoch": 0.52, "learning_rate": 9.933475700473805e-06, "loss": 2.3819, "step": 5161 }, { "epoch": 0.52, "learning_rate": 9.93023066412286e-06, "loss": 2.319, "step": 5162 }, { "epoch": 0.52, "learning_rate": 9.926985635119142e-06, "loss": 2.4325, "step": 5163 }, { "epoch": 0.52, "learning_rate": 9.92374061380439e-06, "loss": 2.3874, "step": 5164 }, { "epoch": 0.52, "learning_rate": 9.920495600520322e-06, "loss": 2.2819, "step": 5165 }, { "epoch": 0.52, "learning_rate": 9.917250595608665e-06, "loss": 2.4761, "step": 5166 }, { "epoch": 0.52, "learning_rate": 9.914005599411143e-06, "loss": 2.3206, "step": 5167 }, { "epoch": 0.52, "learning_rate": 9.910760612269474e-06, "loss": 2.443, "step": 5168 }, { "epoch": 0.52, "learning_rate": 9.907515634525382e-06, "loss": 2.3339, "step": 5169 }, { "epoch": 0.52, "learning_rate": 9.904270666520588e-06, "loss": 2.2793, "step": 5170 }, { "epoch": 0.52, "learning_rate": 9.901025708596809e-06, "loss": 2.3032, "step": 5171 }, { "epoch": 0.52, "learning_rate": 9.897780761095762e-06, "loss": 2.3821, "step": 5172 }, { "epoch": 0.52, "learning_rate": 9.89453582435917e-06, "loss": 2.2725, "step": 5173 }, { "epoch": 0.52, "learning_rate": 9.89129089872875e-06, "loss": 2.3037, "step": 5174 }, { "epoch": 0.52, "learning_rate": 9.888045984546211e-06, "loss": 2.342, "step": 5175 }, { "epoch": 0.52, "learning_rate": 9.88480108215327e-06, "loss": 2.191, "step": 5176 }, { "epoch": 0.52, "learning_rate": 9.88155619189164e-06, "loss": 2.3823, "step": 5177 }, { "epoch": 0.52, "learning_rate": 9.878311314103029e-06, "loss": 2.3353, "step": 5178 }, { "epoch": 0.52, "learning_rate": 9.875066449129154e-06, "loss": 2.3515, "step": 5179 }, { "epoch": 0.52, "learning_rate": 9.871821597311715e-06, "loss": 2.3659, "step": 5180 }, { "epoch": 0.52, "learning_rate": 9.868576758992419e-06, "loss": 2.2073, "step": 5181 }, { "epoch": 0.52, "learning_rate": 9.86533193451298e-06, "loss": 2.3564, "step": 5182 }, { "epoch": 0.52, "learning_rate": 9.8620871242151e-06, "loss": 2.3553, "step": 5183 }, { "epoch": 0.52, "learning_rate": 9.858842328440479e-06, "loss": 2.2757, "step": 5184 }, { "epoch": 0.52, "learning_rate": 9.85559754753082e-06, "loss": 2.3758, "step": 5185 }, { "epoch": 0.52, "learning_rate": 9.85235278182782e-06, "loss": 2.2308, "step": 5186 }, { "epoch": 0.52, "learning_rate": 9.849108031673181e-06, "loss": 2.3302, "step": 5187 }, { "epoch": 0.52, "learning_rate": 9.845863297408598e-06, "loss": 2.3335, "step": 5188 }, { "epoch": 0.52, "learning_rate": 9.842618579375766e-06, "loss": 2.3023, "step": 5189 }, { "epoch": 0.52, "learning_rate": 9.839373877916375e-06, "loss": 2.3821, "step": 5190 }, { "epoch": 0.52, "learning_rate": 9.836129193372121e-06, "loss": 2.3219, "step": 5191 }, { "epoch": 0.52, "learning_rate": 9.832884526084694e-06, "loss": 2.44, "step": 5192 }, { "epoch": 0.52, "learning_rate": 9.829639876395778e-06, "loss": 2.382, "step": 5193 }, { "epoch": 0.52, "learning_rate": 9.826395244647062e-06, "loss": 2.3392, "step": 5194 }, { "epoch": 0.52, "learning_rate": 9.823150631180227e-06, "loss": 2.3046, "step": 5195 }, { "epoch": 0.52, "learning_rate": 9.819906036336958e-06, "loss": 2.3444, "step": 5196 }, { "epoch": 0.52, "learning_rate": 9.816661460458933e-06, "loss": 2.4006, "step": 5197 }, { "epoch": 0.52, "learning_rate": 9.813416903887832e-06, "loss": 2.4444, "step": 5198 }, { "epoch": 0.52, "learning_rate": 9.810172366965328e-06, "loss": 2.352, "step": 5199 }, { "epoch": 0.52, "learning_rate": 9.8069278500331e-06, "loss": 2.3824, "step": 5200 }, { "epoch": 0.52, "learning_rate": 9.803683353432818e-06, "loss": 2.3599, "step": 5201 }, { "epoch": 0.52, "learning_rate": 9.80043887750615e-06, "loss": 2.3823, "step": 5202 }, { "epoch": 0.52, "learning_rate": 9.797194422594763e-06, "loss": 2.3681, "step": 5203 }, { "epoch": 0.52, "learning_rate": 9.793949989040327e-06, "loss": 2.3759, "step": 5204 }, { "epoch": 0.52, "learning_rate": 9.790705577184501e-06, "loss": 2.2373, "step": 5205 }, { "epoch": 0.52, "learning_rate": 9.787461187368949e-06, "loss": 2.373, "step": 5206 }, { "epoch": 0.52, "learning_rate": 9.784216819935327e-06, "loss": 2.3785, "step": 5207 }, { "epoch": 0.52, "learning_rate": 9.78097247522529e-06, "loss": 2.3528, "step": 5208 }, { "epoch": 0.52, "learning_rate": 9.777728153580495e-06, "loss": 2.2583, "step": 5209 }, { "epoch": 0.52, "learning_rate": 9.774483855342594e-06, "loss": 2.3945, "step": 5210 }, { "epoch": 0.52, "learning_rate": 9.771239580853234e-06, "loss": 2.2992, "step": 5211 }, { "epoch": 0.52, "learning_rate": 9.767995330454061e-06, "loss": 2.3878, "step": 5212 }, { "epoch": 0.52, "learning_rate": 9.764751104486721e-06, "loss": 2.3697, "step": 5213 }, { "epoch": 0.52, "learning_rate": 9.761506903292855e-06, "loss": 2.3611, "step": 5214 }, { "epoch": 0.52, "learning_rate": 9.758262727214098e-06, "loss": 2.424, "step": 5215 }, { "epoch": 0.52, "learning_rate": 9.75501857659209e-06, "loss": 2.3505, "step": 5216 }, { "epoch": 0.52, "learning_rate": 9.751774451768459e-06, "loss": 2.3091, "step": 5217 }, { "epoch": 0.52, "learning_rate": 9.748530353084842e-06, "loss": 2.4178, "step": 5218 }, { "epoch": 0.52, "learning_rate": 9.745286280882869e-06, "loss": 2.2967, "step": 5219 }, { "epoch": 0.52, "learning_rate": 9.74204223550416e-06, "loss": 2.3499, "step": 5220 }, { "epoch": 0.52, "learning_rate": 9.738798217290336e-06, "loss": 2.3125, "step": 5221 }, { "epoch": 0.52, "learning_rate": 9.735554226583019e-06, "loss": 2.346, "step": 5222 }, { "epoch": 0.52, "learning_rate": 9.732310263723826e-06, "loss": 2.4187, "step": 5223 }, { "epoch": 0.52, "learning_rate": 9.729066329054368e-06, "loss": 2.4065, "step": 5224 }, { "epoch": 0.52, "learning_rate": 9.725822422916259e-06, "loss": 2.3154, "step": 5225 }, { "epoch": 0.52, "learning_rate": 9.722578545651102e-06, "loss": 2.3267, "step": 5226 }, { "epoch": 0.52, "learning_rate": 9.719334697600506e-06, "loss": 2.3395, "step": 5227 }, { "epoch": 0.52, "learning_rate": 9.716090879106074e-06, "loss": 2.3493, "step": 5228 }, { "epoch": 0.52, "learning_rate": 9.7128470905094e-06, "loss": 2.3502, "step": 5229 }, { "epoch": 0.52, "learning_rate": 9.70960333215208e-06, "loss": 2.3644, "step": 5230 }, { "epoch": 0.52, "learning_rate": 9.706359604375711e-06, "loss": 2.3583, "step": 5231 }, { "epoch": 0.52, "learning_rate": 9.703115907521875e-06, "loss": 2.3931, "step": 5232 }, { "epoch": 0.52, "learning_rate": 9.699872241932161e-06, "loss": 2.2302, "step": 5233 }, { "epoch": 0.52, "learning_rate": 9.696628607948151e-06, "loss": 2.2573, "step": 5234 }, { "epoch": 0.52, "learning_rate": 9.69338500591142e-06, "loss": 2.4452, "step": 5235 }, { "epoch": 0.52, "learning_rate": 9.690141436163549e-06, "loss": 2.5118, "step": 5236 }, { "epoch": 0.52, "learning_rate": 9.68689789904611e-06, "loss": 2.4046, "step": 5237 }, { "epoch": 0.52, "learning_rate": 9.683654394900671e-06, "loss": 2.3208, "step": 5238 }, { "epoch": 0.52, "learning_rate": 9.680410924068797e-06, "loss": 2.383, "step": 5239 }, { "epoch": 0.52, "learning_rate": 9.677167486892049e-06, "loss": 2.402, "step": 5240 }, { "epoch": 0.53, "learning_rate": 9.673924083711985e-06, "loss": 2.4113, "step": 5241 }, { "epoch": 0.53, "learning_rate": 9.670680714870162e-06, "loss": 2.3266, "step": 5242 }, { "epoch": 0.53, "learning_rate": 9.66743738070813e-06, "loss": 2.3886, "step": 5243 }, { "epoch": 0.53, "learning_rate": 9.66419408156743e-06, "loss": 2.3376, "step": 5244 }, { "epoch": 0.53, "learning_rate": 9.660950817789615e-06, "loss": 2.2642, "step": 5245 }, { "epoch": 0.53, "learning_rate": 9.657707589716223e-06, "loss": 2.3898, "step": 5246 }, { "epoch": 0.53, "learning_rate": 9.65446439768879e-06, "loss": 2.2311, "step": 5247 }, { "epoch": 0.53, "learning_rate": 9.651221242048846e-06, "loss": 2.3655, "step": 5248 }, { "epoch": 0.53, "learning_rate": 9.647978123137919e-06, "loss": 2.2896, "step": 5249 }, { "epoch": 0.53, "learning_rate": 9.644735041297539e-06, "loss": 2.2225, "step": 5250 }, { "epoch": 0.53, "learning_rate": 9.641491996869221e-06, "loss": 2.3391, "step": 5251 }, { "epoch": 0.53, "learning_rate": 9.638248990194485e-06, "loss": 2.386, "step": 5252 }, { "epoch": 0.53, "learning_rate": 9.635006021614842e-06, "loss": 2.3447, "step": 5253 }, { "epoch": 0.53, "learning_rate": 9.631763091471805e-06, "loss": 2.4713, "step": 5254 }, { "epoch": 0.53, "learning_rate": 9.628520200106874e-06, "loss": 2.3496, "step": 5255 }, { "epoch": 0.53, "learning_rate": 9.625277347861554e-06, "loss": 2.2037, "step": 5256 }, { "epoch": 0.53, "learning_rate": 9.622034535077338e-06, "loss": 2.3185, "step": 5257 }, { "epoch": 0.53, "learning_rate": 9.618791762095721e-06, "loss": 2.3765, "step": 5258 }, { "epoch": 0.53, "learning_rate": 9.61554902925819e-06, "loss": 2.3269, "step": 5259 }, { "epoch": 0.53, "learning_rate": 9.612306336906229e-06, "loss": 2.3874, "step": 5260 }, { "epoch": 0.53, "learning_rate": 9.609063685381318e-06, "loss": 2.2995, "step": 5261 }, { "epoch": 0.53, "learning_rate": 9.605821075024933e-06, "loss": 2.3121, "step": 5262 }, { "epoch": 0.53, "learning_rate": 9.602578506178546e-06, "loss": 2.1811, "step": 5263 }, { "epoch": 0.53, "learning_rate": 9.599335979183621e-06, "loss": 2.2833, "step": 5264 }, { "epoch": 0.53, "learning_rate": 9.596093494381625e-06, "loss": 2.3451, "step": 5265 }, { "epoch": 0.53, "learning_rate": 9.592851052114012e-06, "loss": 2.2022, "step": 5266 }, { "epoch": 0.53, "learning_rate": 9.589608652722236e-06, "loss": 2.3525, "step": 5267 }, { "epoch": 0.53, "learning_rate": 9.586366296547748e-06, "loss": 2.261, "step": 5268 }, { "epoch": 0.53, "learning_rate": 9.58312398393199e-06, "loss": 2.2575, "step": 5269 }, { "epoch": 0.53, "learning_rate": 9.579881715216404e-06, "loss": 2.2782, "step": 5270 }, { "epoch": 0.53, "learning_rate": 9.576639490742422e-06, "loss": 2.4191, "step": 5271 }, { "epoch": 0.53, "learning_rate": 9.573397310851477e-06, "loss": 2.2589, "step": 5272 }, { "epoch": 0.53, "learning_rate": 9.570155175884996e-06, "loss": 2.3555, "step": 5273 }, { "epoch": 0.53, "learning_rate": 9.566913086184397e-06, "loss": 2.2565, "step": 5274 }, { "epoch": 0.53, "learning_rate": 9.5636710420911e-06, "loss": 2.283, "step": 5275 }, { "epoch": 0.53, "learning_rate": 9.560429043946514e-06, "loss": 2.3865, "step": 5276 }, { "epoch": 0.53, "learning_rate": 9.557187092092046e-06, "loss": 2.2819, "step": 5277 }, { "epoch": 0.53, "learning_rate": 9.553945186869099e-06, "loss": 2.315, "step": 5278 }, { "epoch": 0.53, "learning_rate": 9.550703328619068e-06, "loss": 2.2551, "step": 5279 }, { "epoch": 0.53, "learning_rate": 9.547461517683342e-06, "loss": 2.4178, "step": 5280 }, { "epoch": 0.53, "learning_rate": 9.544219754403316e-06, "loss": 2.3074, "step": 5281 }, { "epoch": 0.53, "learning_rate": 9.54097803912037e-06, "loss": 2.301, "step": 5282 }, { "epoch": 0.53, "learning_rate": 9.53773637217588e-06, "loss": 2.2615, "step": 5283 }, { "epoch": 0.53, "learning_rate": 9.534494753911214e-06, "loss": 2.5064, "step": 5284 }, { "epoch": 0.53, "learning_rate": 9.53125318466774e-06, "loss": 2.3224, "step": 5285 }, { "epoch": 0.53, "learning_rate": 9.528011664786825e-06, "loss": 2.3615, "step": 5286 }, { "epoch": 0.53, "learning_rate": 9.52477019460982e-06, "loss": 2.2855, "step": 5287 }, { "epoch": 0.53, "learning_rate": 9.521528774478077e-06, "loss": 2.3695, "step": 5288 }, { "epoch": 0.53, "learning_rate": 9.518287404732938e-06, "loss": 2.3703, "step": 5289 }, { "epoch": 0.53, "learning_rate": 9.515046085715752e-06, "loss": 2.3415, "step": 5290 }, { "epoch": 0.53, "learning_rate": 9.51180481776785e-06, "loss": 2.4311, "step": 5291 }, { "epoch": 0.53, "learning_rate": 9.508563601230564e-06, "loss": 2.3508, "step": 5292 }, { "epoch": 0.53, "learning_rate": 9.505322436445214e-06, "loss": 2.401, "step": 5293 }, { "epoch": 0.53, "learning_rate": 9.502081323753123e-06, "loss": 2.349, "step": 5294 }, { "epoch": 0.53, "learning_rate": 9.498840263495605e-06, "loss": 2.3908, "step": 5295 }, { "epoch": 0.53, "learning_rate": 9.495599256013963e-06, "loss": 2.304, "step": 5296 }, { "epoch": 0.53, "learning_rate": 9.492358301649503e-06, "loss": 2.3995, "step": 5297 }, { "epoch": 0.53, "learning_rate": 9.489117400743515e-06, "loss": 2.2358, "step": 5298 }, { "epoch": 0.53, "learning_rate": 9.485876553637302e-06, "loss": 2.3309, "step": 5299 }, { "epoch": 0.53, "learning_rate": 9.482635760672142e-06, "loss": 2.4405, "step": 5300 }, { "epoch": 0.53, "learning_rate": 9.479395022189318e-06, "loss": 2.4312, "step": 5301 }, { "epoch": 0.53, "learning_rate": 9.476154338530102e-06, "loss": 2.4281, "step": 5302 }, { "epoch": 0.53, "learning_rate": 9.472913710035762e-06, "loss": 2.3838, "step": 5303 }, { "epoch": 0.53, "learning_rate": 9.469673137047562e-06, "loss": 2.3397, "step": 5304 }, { "epoch": 0.53, "learning_rate": 9.466432619906758e-06, "loss": 2.235, "step": 5305 }, { "epoch": 0.53, "learning_rate": 9.4631921589546e-06, "loss": 2.3482, "step": 5306 }, { "epoch": 0.53, "learning_rate": 9.459951754532333e-06, "loss": 2.2566, "step": 5307 }, { "epoch": 0.53, "learning_rate": 9.456711406981197e-06, "loss": 2.432, "step": 5308 }, { "epoch": 0.53, "learning_rate": 9.453471116642425e-06, "loss": 2.4246, "step": 5309 }, { "epoch": 0.53, "learning_rate": 9.450230883857244e-06, "loss": 2.3527, "step": 5310 }, { "epoch": 0.53, "learning_rate": 9.446990708966874e-06, "loss": 2.3888, "step": 5311 }, { "epoch": 0.53, "learning_rate": 9.443750592312528e-06, "loss": 2.3844, "step": 5312 }, { "epoch": 0.53, "learning_rate": 9.440510534235418e-06, "loss": 2.2453, "step": 5313 }, { "epoch": 0.53, "learning_rate": 9.437270535076744e-06, "loss": 2.4021, "step": 5314 }, { "epoch": 0.53, "learning_rate": 9.4340305951777e-06, "loss": 2.3062, "step": 5315 }, { "epoch": 0.53, "learning_rate": 9.430790714879482e-06, "loss": 2.3388, "step": 5316 }, { "epoch": 0.53, "learning_rate": 9.42755089452327e-06, "loss": 2.3688, "step": 5317 }, { "epoch": 0.53, "learning_rate": 9.424311134450242e-06, "loss": 2.4227, "step": 5318 }, { "epoch": 0.53, "learning_rate": 9.42107143500157e-06, "loss": 2.3293, "step": 5319 }, { "epoch": 0.53, "learning_rate": 9.417831796518418e-06, "loss": 2.3574, "step": 5320 }, { "epoch": 0.53, "learning_rate": 9.41459221934194e-06, "loss": 2.4163, "step": 5321 }, { "epoch": 0.53, "learning_rate": 9.411352703813298e-06, "loss": 2.2837, "step": 5322 }, { "epoch": 0.53, "learning_rate": 9.408113250273626e-06, "loss": 2.3683, "step": 5323 }, { "epoch": 0.53, "learning_rate": 9.404873859064068e-06, "loss": 2.2805, "step": 5324 }, { "epoch": 0.53, "learning_rate": 9.401634530525755e-06, "loss": 2.3406, "step": 5325 }, { "epoch": 0.53, "learning_rate": 9.398395264999817e-06, "loss": 2.3078, "step": 5326 }, { "epoch": 0.53, "learning_rate": 9.395156062827367e-06, "loss": 2.4837, "step": 5327 }, { "epoch": 0.53, "learning_rate": 9.391916924349521e-06, "loss": 2.3182, "step": 5328 }, { "epoch": 0.53, "learning_rate": 9.388677849907383e-06, "loss": 2.2649, "step": 5329 }, { "epoch": 0.53, "learning_rate": 9.385438839842053e-06, "loss": 2.3356, "step": 5330 }, { "epoch": 0.53, "learning_rate": 9.382199894494621e-06, "loss": 2.3004, "step": 5331 }, { "epoch": 0.53, "learning_rate": 9.378961014206173e-06, "loss": 2.3703, "step": 5332 }, { "epoch": 0.53, "learning_rate": 9.375722199317785e-06, "loss": 2.278, "step": 5333 }, { "epoch": 0.53, "learning_rate": 9.372483450170536e-06, "loss": 2.2778, "step": 5334 }, { "epoch": 0.53, "learning_rate": 9.369244767105486e-06, "loss": 2.272, "step": 5335 }, { "epoch": 0.53, "learning_rate": 9.36600615046369e-06, "loss": 2.3877, "step": 5336 }, { "epoch": 0.53, "learning_rate": 9.362767600586202e-06, "loss": 2.2707, "step": 5337 }, { "epoch": 0.53, "learning_rate": 9.359529117814065e-06, "loss": 2.4044, "step": 5338 }, { "epoch": 0.53, "learning_rate": 9.356290702488316e-06, "loss": 2.3952, "step": 5339 }, { "epoch": 0.54, "learning_rate": 9.353052354949982e-06, "loss": 2.4362, "step": 5340 }, { "epoch": 0.54, "learning_rate": 9.349814075540089e-06, "loss": 2.3373, "step": 5341 }, { "epoch": 0.54, "learning_rate": 9.346575864599643e-06, "loss": 2.3361, "step": 5342 }, { "epoch": 0.54, "learning_rate": 9.343337722469665e-06, "loss": 2.3775, "step": 5343 }, { "epoch": 0.54, "learning_rate": 9.340099649491148e-06, "loss": 2.2882, "step": 5344 }, { "epoch": 0.54, "learning_rate": 9.336861646005088e-06, "loss": 2.319, "step": 5345 }, { "epoch": 0.54, "learning_rate": 9.333623712352474e-06, "loss": 2.3432, "step": 5346 }, { "epoch": 0.54, "learning_rate": 9.330385848874275e-06, "loss": 2.273, "step": 5347 }, { "epoch": 0.54, "learning_rate": 9.32714805591147e-06, "loss": 2.2988, "step": 5348 }, { "epoch": 0.54, "learning_rate": 9.32391033380502e-06, "loss": 2.3094, "step": 5349 }, { "epoch": 0.54, "learning_rate": 9.320672682895884e-06, "loss": 2.3463, "step": 5350 }, { "epoch": 0.54, "learning_rate": 9.317435103525003e-06, "loss": 2.3754, "step": 5351 }, { "epoch": 0.54, "learning_rate": 9.314197596033329e-06, "loss": 2.3563, "step": 5352 }, { "epoch": 0.54, "learning_rate": 9.310960160761793e-06, "loss": 2.4122, "step": 5353 }, { "epoch": 0.54, "learning_rate": 9.307722798051318e-06, "loss": 2.3323, "step": 5354 }, { "epoch": 0.54, "learning_rate": 9.304485508242826e-06, "loss": 2.3972, "step": 5355 }, { "epoch": 0.54, "learning_rate": 9.301248291677225e-06, "loss": 2.3222, "step": 5356 }, { "epoch": 0.54, "learning_rate": 9.298011148695419e-06, "loss": 2.3988, "step": 5357 }, { "epoch": 0.54, "learning_rate": 9.294774079638305e-06, "loss": 2.479, "step": 5358 }, { "epoch": 0.54, "learning_rate": 9.29153708484677e-06, "loss": 2.3158, "step": 5359 }, { "epoch": 0.54, "learning_rate": 9.288300164661688e-06, "loss": 2.2624, "step": 5360 }, { "epoch": 0.54, "learning_rate": 9.28506331942394e-06, "loss": 2.3, "step": 5361 }, { "epoch": 0.54, "learning_rate": 9.281826549474385e-06, "loss": 2.369, "step": 5362 }, { "epoch": 0.54, "learning_rate": 9.278589855153882e-06, "loss": 2.3224, "step": 5363 }, { "epoch": 0.54, "learning_rate": 9.275353236803276e-06, "loss": 2.272, "step": 5364 }, { "epoch": 0.54, "learning_rate": 9.27211669476341e-06, "loss": 2.3995, "step": 5365 }, { "epoch": 0.54, "learning_rate": 9.268880229375115e-06, "loss": 2.3322, "step": 5366 }, { "epoch": 0.54, "learning_rate": 9.265643840979215e-06, "loss": 2.3413, "step": 5367 }, { "epoch": 0.54, "learning_rate": 9.262407529916525e-06, "loss": 2.2776, "step": 5368 }, { "epoch": 0.54, "learning_rate": 9.259171296527853e-06, "loss": 2.2581, "step": 5369 }, { "epoch": 0.54, "learning_rate": 9.255935141154e-06, "loss": 2.2259, "step": 5370 }, { "epoch": 0.54, "learning_rate": 9.252699064135759e-06, "loss": 2.3192, "step": 5371 }, { "epoch": 0.54, "learning_rate": 9.249463065813908e-06, "loss": 2.3593, "step": 5372 }, { "epoch": 0.54, "learning_rate": 9.246227146529228e-06, "loss": 2.345, "step": 5373 }, { "epoch": 0.54, "learning_rate": 9.242991306622481e-06, "loss": 2.3203, "step": 5374 }, { "epoch": 0.54, "learning_rate": 9.239755546434427e-06, "loss": 2.3828, "step": 5375 }, { "epoch": 0.54, "learning_rate": 9.236519866305816e-06, "loss": 2.4288, "step": 5376 }, { "epoch": 0.54, "learning_rate": 9.233284266577387e-06, "loss": 2.4135, "step": 5377 }, { "epoch": 0.54, "learning_rate": 9.230048747589874e-06, "loss": 2.378, "step": 5378 }, { "epoch": 0.54, "learning_rate": 9.226813309684006e-06, "loss": 2.3788, "step": 5379 }, { "epoch": 0.54, "learning_rate": 9.223577953200494e-06, "loss": 2.3552, "step": 5380 }, { "epoch": 0.54, "learning_rate": 9.220342678480045e-06, "loss": 2.3205, "step": 5381 }, { "epoch": 0.54, "learning_rate": 9.21710748586336e-06, "loss": 2.4155, "step": 5382 }, { "epoch": 0.54, "learning_rate": 9.213872375691128e-06, "loss": 2.3828, "step": 5383 }, { "epoch": 0.54, "learning_rate": 9.210637348304031e-06, "loss": 2.37, "step": 5384 }, { "epoch": 0.54, "learning_rate": 9.20740240404274e-06, "loss": 2.3817, "step": 5385 }, { "epoch": 0.54, "learning_rate": 9.204167543247922e-06, "loss": 2.3729, "step": 5386 }, { "epoch": 0.54, "learning_rate": 9.200932766260227e-06, "loss": 2.3902, "step": 5387 }, { "epoch": 0.54, "learning_rate": 9.197698073420307e-06, "loss": 2.3988, "step": 5388 }, { "epoch": 0.54, "learning_rate": 9.194463465068797e-06, "loss": 2.4566, "step": 5389 }, { "epoch": 0.54, "learning_rate": 9.191228941546324e-06, "loss": 2.3584, "step": 5390 }, { "epoch": 0.54, "learning_rate": 9.187994503193511e-06, "loss": 2.3045, "step": 5391 }, { "epoch": 0.54, "learning_rate": 9.184760150350965e-06, "loss": 2.3423, "step": 5392 }, { "epoch": 0.54, "learning_rate": 9.18152588335929e-06, "loss": 2.3711, "step": 5393 }, { "epoch": 0.54, "learning_rate": 9.178291702559078e-06, "loss": 2.3608, "step": 5394 }, { "epoch": 0.54, "learning_rate": 9.175057608290911e-06, "loss": 2.3756, "step": 5395 }, { "epoch": 0.54, "learning_rate": 9.171823600895361e-06, "loss": 2.3677, "step": 5396 }, { "epoch": 0.54, "learning_rate": 9.168589680713002e-06, "loss": 2.2671, "step": 5397 }, { "epoch": 0.54, "learning_rate": 9.165355848084385e-06, "loss": 2.2714, "step": 5398 }, { "epoch": 0.54, "learning_rate": 9.162122103350056e-06, "loss": 2.278, "step": 5399 }, { "epoch": 0.54, "learning_rate": 9.158888446850553e-06, "loss": 2.3271, "step": 5400 }, { "epoch": 0.54, "learning_rate": 9.155654878926406e-06, "loss": 2.4018, "step": 5401 }, { "epoch": 0.54, "learning_rate": 9.15242139991813e-06, "loss": 2.3206, "step": 5402 }, { "epoch": 0.54, "learning_rate": 9.14918801016624e-06, "loss": 2.4051, "step": 5403 }, { "epoch": 0.54, "learning_rate": 9.14595471001123e-06, "loss": 2.3195, "step": 5404 }, { "epoch": 0.54, "learning_rate": 9.142721499793592e-06, "loss": 2.3832, "step": 5405 }, { "epoch": 0.54, "learning_rate": 9.139488379853814e-06, "loss": 2.3644, "step": 5406 }, { "epoch": 0.54, "learning_rate": 9.136255350532362e-06, "loss": 2.4166, "step": 5407 }, { "epoch": 0.54, "learning_rate": 9.1330224121697e-06, "loss": 2.2209, "step": 5408 }, { "epoch": 0.54, "learning_rate": 9.12978956510628e-06, "loss": 2.3001, "step": 5409 }, { "epoch": 0.54, "learning_rate": 9.126556809682546e-06, "loss": 2.2927, "step": 5410 }, { "epoch": 0.54, "learning_rate": 9.12332414623893e-06, "loss": 2.2937, "step": 5411 }, { "epoch": 0.54, "learning_rate": 9.120091575115855e-06, "loss": 2.229, "step": 5412 }, { "epoch": 0.54, "learning_rate": 9.116859096653737e-06, "loss": 2.3429, "step": 5413 }, { "epoch": 0.54, "learning_rate": 9.113626711192974e-06, "loss": 2.2962, "step": 5414 }, { "epoch": 0.54, "learning_rate": 9.11039441907397e-06, "loss": 2.3431, "step": 5415 }, { "epoch": 0.54, "learning_rate": 9.107162220637108e-06, "loss": 2.354, "step": 5416 }, { "epoch": 0.54, "learning_rate": 9.103930116222758e-06, "loss": 2.3681, "step": 5417 }, { "epoch": 0.54, "learning_rate": 9.100698106171288e-06, "loss": 2.3818, "step": 5418 }, { "epoch": 0.54, "learning_rate": 9.097466190823051e-06, "loss": 2.2893, "step": 5419 }, { "epoch": 0.54, "learning_rate": 9.094234370518393e-06, "loss": 2.3921, "step": 5420 }, { "epoch": 0.54, "learning_rate": 9.091002645597649e-06, "loss": 2.3592, "step": 5421 }, { "epoch": 0.54, "learning_rate": 9.087771016401143e-06, "loss": 2.3239, "step": 5422 }, { "epoch": 0.54, "learning_rate": 9.084539483269187e-06, "loss": 2.4295, "step": 5423 }, { "epoch": 0.54, "learning_rate": 9.081308046542095e-06, "loss": 2.2282, "step": 5424 }, { "epoch": 0.54, "learning_rate": 9.078076706560153e-06, "loss": 2.4079, "step": 5425 }, { "epoch": 0.54, "learning_rate": 9.074845463663648e-06, "loss": 2.2344, "step": 5426 }, { "epoch": 0.54, "learning_rate": 9.071614318192854e-06, "loss": 2.3745, "step": 5427 }, { "epoch": 0.54, "learning_rate": 9.068383270488035e-06, "loss": 2.4182, "step": 5428 }, { "epoch": 0.54, "learning_rate": 9.065152320889445e-06, "loss": 2.3286, "step": 5429 }, { "epoch": 0.54, "learning_rate": 9.061921469737326e-06, "loss": 2.3123, "step": 5430 }, { "epoch": 0.54, "learning_rate": 9.058690717371911e-06, "loss": 2.3085, "step": 5431 }, { "epoch": 0.54, "learning_rate": 9.055460064133422e-06, "loss": 2.2593, "step": 5432 }, { "epoch": 0.54, "learning_rate": 9.052229510362074e-06, "loss": 2.3953, "step": 5433 }, { "epoch": 0.54, "learning_rate": 9.048999056398066e-06, "loss": 2.374, "step": 5434 }, { "epoch": 0.54, "learning_rate": 9.04576870258159e-06, "loss": 2.2856, "step": 5435 }, { "epoch": 0.54, "learning_rate": 9.042538449252825e-06, "loss": 2.4228, "step": 5436 }, { "epoch": 0.54, "learning_rate": 9.039308296751944e-06, "loss": 2.3161, "step": 5437 }, { "epoch": 0.54, "learning_rate": 9.036078245419102e-06, "loss": 2.3392, "step": 5438 }, { "epoch": 0.54, "learning_rate": 9.03284829559445e-06, "loss": 2.3511, "step": 5439 }, { "epoch": 0.55, "learning_rate": 9.029618447618127e-06, "loss": 2.3211, "step": 5440 }, { "epoch": 0.55, "learning_rate": 9.026388701830256e-06, "loss": 2.4049, "step": 5441 }, { "epoch": 0.55, "learning_rate": 9.02315905857096e-06, "loss": 2.331, "step": 5442 }, { "epoch": 0.55, "learning_rate": 9.01992951818034e-06, "loss": 2.2131, "step": 5443 }, { "epoch": 0.55, "learning_rate": 9.016700080998492e-06, "loss": 2.3732, "step": 5444 }, { "epoch": 0.55, "learning_rate": 9.0134707473655e-06, "loss": 2.4287, "step": 5445 }, { "epoch": 0.55, "learning_rate": 9.010241517621437e-06, "loss": 2.2912, "step": 5446 }, { "epoch": 0.55, "learning_rate": 9.007012392106364e-06, "loss": 2.3383, "step": 5447 }, { "epoch": 0.55, "learning_rate": 9.003783371160334e-06, "loss": 2.3584, "step": 5448 }, { "epoch": 0.55, "learning_rate": 9.000554455123387e-06, "loss": 2.4061, "step": 5449 }, { "epoch": 0.55, "learning_rate": 8.997325644335548e-06, "loss": 2.3255, "step": 5450 }, { "epoch": 0.55, "learning_rate": 8.994096939136842e-06, "loss": 2.3599, "step": 5451 }, { "epoch": 0.55, "learning_rate": 8.99086833986727e-06, "loss": 2.4253, "step": 5452 }, { "epoch": 0.55, "learning_rate": 8.98763984686683e-06, "loss": 2.2854, "step": 5453 }, { "epoch": 0.55, "learning_rate": 8.98441146047551e-06, "loss": 2.2253, "step": 5454 }, { "epoch": 0.55, "learning_rate": 8.981183181033277e-06, "loss": 2.3284, "step": 5455 }, { "epoch": 0.55, "learning_rate": 8.977955008880097e-06, "loss": 2.3523, "step": 5456 }, { "epoch": 0.55, "learning_rate": 8.974726944355918e-06, "loss": 2.3065, "step": 5457 }, { "epoch": 0.55, "learning_rate": 8.971498987800682e-06, "loss": 2.365, "step": 5458 }, { "epoch": 0.55, "learning_rate": 8.968271139554312e-06, "loss": 2.3795, "step": 5459 }, { "epoch": 0.55, "learning_rate": 8.965043399956732e-06, "loss": 2.3847, "step": 5460 }, { "epoch": 0.55, "learning_rate": 8.961815769347844e-06, "loss": 2.4155, "step": 5461 }, { "epoch": 0.55, "learning_rate": 8.958588248067544e-06, "loss": 2.3768, "step": 5462 }, { "epoch": 0.55, "learning_rate": 8.95536083645571e-06, "loss": 2.2898, "step": 5463 }, { "epoch": 0.55, "learning_rate": 8.952133534852214e-06, "loss": 2.3117, "step": 5464 }, { "epoch": 0.55, "learning_rate": 8.948906343596914e-06, "loss": 2.2328, "step": 5465 }, { "epoch": 0.55, "learning_rate": 8.94567926302966e-06, "loss": 2.3276, "step": 5466 }, { "epoch": 0.55, "learning_rate": 8.942452293490287e-06, "loss": 2.3113, "step": 5467 }, { "epoch": 0.55, "learning_rate": 8.939225435318615e-06, "loss": 2.2136, "step": 5468 }, { "epoch": 0.55, "learning_rate": 8.935998688854464e-06, "loss": 2.4235, "step": 5469 }, { "epoch": 0.55, "learning_rate": 8.932772054437629e-06, "loss": 2.2833, "step": 5470 }, { "epoch": 0.55, "learning_rate": 8.929545532407903e-06, "loss": 2.2707, "step": 5471 }, { "epoch": 0.55, "learning_rate": 8.92631912310506e-06, "loss": 2.3873, "step": 5472 }, { "epoch": 0.55, "learning_rate": 8.923092826868865e-06, "loss": 2.3918, "step": 5473 }, { "epoch": 0.55, "learning_rate": 8.919866644039073e-06, "loss": 2.2754, "step": 5474 }, { "epoch": 0.55, "learning_rate": 8.916640574955424e-06, "loss": 2.2078, "step": 5475 }, { "epoch": 0.55, "learning_rate": 8.913414619957644e-06, "loss": 2.3409, "step": 5476 }, { "epoch": 0.55, "learning_rate": 8.91018877938545e-06, "loss": 2.2529, "step": 5477 }, { "epoch": 0.55, "learning_rate": 8.906963053578558e-06, "loss": 2.3077, "step": 5478 }, { "epoch": 0.55, "learning_rate": 8.903737442876652e-06, "loss": 2.2985, "step": 5479 }, { "epoch": 0.55, "learning_rate": 8.900511947619415e-06, "loss": 2.3056, "step": 5480 }, { "epoch": 0.55, "learning_rate": 8.897286568146516e-06, "loss": 2.3632, "step": 5481 }, { "epoch": 0.55, "learning_rate": 8.894061304797611e-06, "loss": 2.3715, "step": 5482 }, { "epoch": 0.55, "learning_rate": 8.890836157912345e-06, "loss": 2.2516, "step": 5483 }, { "epoch": 0.55, "learning_rate": 8.88761112783035e-06, "loss": 2.378, "step": 5484 }, { "epoch": 0.55, "learning_rate": 8.884386214891243e-06, "loss": 2.43, "step": 5485 }, { "epoch": 0.55, "learning_rate": 8.881161419434636e-06, "loss": 2.4278, "step": 5486 }, { "epoch": 0.55, "learning_rate": 8.877936741800124e-06, "loss": 2.2336, "step": 5487 }, { "epoch": 0.55, "learning_rate": 8.874712182327287e-06, "loss": 2.3415, "step": 5488 }, { "epoch": 0.55, "learning_rate": 8.871487741355696e-06, "loss": 2.4086, "step": 5489 }, { "epoch": 0.55, "learning_rate": 8.86826341922491e-06, "loss": 2.4161, "step": 5490 }, { "epoch": 0.55, "learning_rate": 8.865039216274475e-06, "loss": 2.2732, "step": 5491 }, { "epoch": 0.55, "learning_rate": 8.86181513284392e-06, "loss": 2.2816, "step": 5492 }, { "epoch": 0.55, "learning_rate": 8.85859116927277e-06, "loss": 2.2118, "step": 5493 }, { "epoch": 0.55, "learning_rate": 8.855367325900526e-06, "loss": 2.3223, "step": 5494 }, { "epoch": 0.55, "learning_rate": 8.85214360306669e-06, "loss": 2.3446, "step": 5495 }, { "epoch": 0.55, "learning_rate": 8.84892000111074e-06, "loss": 2.3683, "step": 5496 }, { "epoch": 0.55, "learning_rate": 8.845696520372148e-06, "loss": 2.3544, "step": 5497 }, { "epoch": 0.55, "learning_rate": 8.842473161190368e-06, "loss": 2.2965, "step": 5498 }, { "epoch": 0.55, "learning_rate": 8.839249923904845e-06, "loss": 2.3639, "step": 5499 }, { "epoch": 0.55, "learning_rate": 8.836026808855012e-06, "loss": 2.3473, "step": 5500 }, { "epoch": 0.55, "learning_rate": 8.832803816380285e-06, "loss": 2.3758, "step": 5501 }, { "epoch": 0.55, "learning_rate": 8.829580946820069e-06, "loss": 2.3601, "step": 5502 }, { "epoch": 0.55, "learning_rate": 8.826358200513755e-06, "loss": 2.3527, "step": 5503 }, { "epoch": 0.55, "learning_rate": 8.823135577800727e-06, "loss": 2.3802, "step": 5504 }, { "epoch": 0.55, "learning_rate": 8.819913079020348e-06, "loss": 2.3192, "step": 5505 }, { "epoch": 0.55, "learning_rate": 8.816690704511972e-06, "loss": 2.3708, "step": 5506 }, { "epoch": 0.55, "learning_rate": 8.81346845461494e-06, "loss": 2.4177, "step": 5507 }, { "epoch": 0.55, "learning_rate": 8.810246329668577e-06, "loss": 2.4287, "step": 5508 }, { "epoch": 0.55, "learning_rate": 8.8070243300122e-06, "loss": 2.2814, "step": 5509 }, { "epoch": 0.55, "learning_rate": 8.803802455985106e-06, "loss": 2.3594, "step": 5510 }, { "epoch": 0.55, "learning_rate": 8.800580707926585e-06, "loss": 2.2221, "step": 5511 }, { "epoch": 0.55, "learning_rate": 8.797359086175908e-06, "loss": 2.2852, "step": 5512 }, { "epoch": 0.55, "learning_rate": 8.794137591072342e-06, "loss": 2.4496, "step": 5513 }, { "epoch": 0.55, "learning_rate": 8.790916222955134e-06, "loss": 2.396, "step": 5514 }, { "epoch": 0.55, "learning_rate": 8.78769498216351e-06, "loss": 2.3194, "step": 5515 }, { "epoch": 0.55, "learning_rate": 8.7844738690367e-06, "loss": 2.2308, "step": 5516 }, { "epoch": 0.55, "learning_rate": 8.781252883913907e-06, "loss": 2.3926, "step": 5517 }, { "epoch": 0.55, "learning_rate": 8.778032027134325e-06, "loss": 2.3778, "step": 5518 }, { "epoch": 0.55, "learning_rate": 8.774811299037135e-06, "loss": 2.4027, "step": 5519 }, { "epoch": 0.55, "learning_rate": 8.771590699961504e-06, "loss": 2.389, "step": 5520 }, { "epoch": 0.55, "learning_rate": 8.76837023024658e-06, "loss": 2.3089, "step": 5521 }, { "epoch": 0.55, "learning_rate": 8.765149890231512e-06, "loss": 2.3774, "step": 5522 }, { "epoch": 0.55, "learning_rate": 8.76192968025542e-06, "loss": 2.3136, "step": 5523 }, { "epoch": 0.55, "learning_rate": 8.75870960065742e-06, "loss": 2.3212, "step": 5524 }, { "epoch": 0.55, "learning_rate": 8.755489651776607e-06, "loss": 2.3506, "step": 5525 }, { "epoch": 0.55, "learning_rate": 8.752269833952071e-06, "loss": 2.2734, "step": 5526 }, { "epoch": 0.55, "learning_rate": 8.749050147522875e-06, "loss": 2.3857, "step": 5527 }, { "epoch": 0.55, "learning_rate": 8.745830592828082e-06, "loss": 2.3546, "step": 5528 }, { "epoch": 0.55, "learning_rate": 8.742611170206732e-06, "loss": 2.3199, "step": 5529 }, { "epoch": 0.55, "learning_rate": 8.739391879997852e-06, "loss": 2.2231, "step": 5530 }, { "epoch": 0.55, "learning_rate": 8.736172722540464e-06, "loss": 2.3464, "step": 5531 }, { "epoch": 0.55, "learning_rate": 8.732953698173569e-06, "loss": 2.3591, "step": 5532 }, { "epoch": 0.55, "learning_rate": 8.72973480723615e-06, "loss": 2.365, "step": 5533 }, { "epoch": 0.55, "learning_rate": 8.726516050067183e-06, "loss": 2.2191, "step": 5534 }, { "epoch": 0.55, "learning_rate": 8.723297427005628e-06, "loss": 2.2569, "step": 5535 }, { "epoch": 0.55, "learning_rate": 8.720078938390426e-06, "loss": 2.3116, "step": 5536 }, { "epoch": 0.55, "learning_rate": 8.716860584560512e-06, "loss": 2.3862, "step": 5537 }, { "epoch": 0.55, "learning_rate": 8.713642365854805e-06, "loss": 2.231, "step": 5538 }, { "epoch": 0.55, "learning_rate": 8.710424282612197e-06, "loss": 2.361, "step": 5539 }, { "epoch": 0.56, "learning_rate": 8.707206335171586e-06, "loss": 2.2546, "step": 5540 }, { "epoch": 0.56, "learning_rate": 8.703988523871845e-06, "loss": 2.3095, "step": 5541 }, { "epoch": 0.56, "learning_rate": 8.700770849051833e-06, "loss": 2.311, "step": 5542 }, { "epoch": 0.56, "learning_rate": 8.697553311050393e-06, "loss": 2.4037, "step": 5543 }, { "epoch": 0.56, "learning_rate": 8.694335910206357e-06, "loss": 2.4081, "step": 5544 }, { "epoch": 0.56, "learning_rate": 8.691118646858543e-06, "loss": 2.4031, "step": 5545 }, { "epoch": 0.56, "learning_rate": 8.68790152134575e-06, "loss": 2.3063, "step": 5546 }, { "epoch": 0.56, "learning_rate": 8.684684534006768e-06, "loss": 2.4415, "step": 5547 }, { "epoch": 0.56, "learning_rate": 8.681467685180367e-06, "loss": 2.3368, "step": 5548 }, { "epoch": 0.56, "learning_rate": 8.678250975205308e-06, "loss": 2.3643, "step": 5549 }, { "epoch": 0.56, "learning_rate": 8.675034404420337e-06, "loss": 2.4251, "step": 5550 }, { "epoch": 0.56, "learning_rate": 8.671817973164177e-06, "loss": 2.3506, "step": 5551 }, { "epoch": 0.56, "learning_rate": 8.668601681775547e-06, "loss": 2.4071, "step": 5552 }, { "epoch": 0.56, "learning_rate": 8.665385530593145e-06, "loss": 2.3452, "step": 5553 }, { "epoch": 0.56, "learning_rate": 8.662169519955654e-06, "loss": 2.2733, "step": 5554 }, { "epoch": 0.56, "learning_rate": 8.658953650201748e-06, "loss": 2.3447, "step": 5555 }, { "epoch": 0.56, "learning_rate": 8.655737921670079e-06, "loss": 2.3423, "step": 5556 }, { "epoch": 0.56, "learning_rate": 8.652522334699286e-06, "loss": 2.2662, "step": 5557 }, { "epoch": 0.56, "learning_rate": 8.649306889628e-06, "loss": 2.3099, "step": 5558 }, { "epoch": 0.56, "learning_rate": 8.646091586794828e-06, "loss": 2.3846, "step": 5559 }, { "epoch": 0.56, "learning_rate": 8.642876426538365e-06, "loss": 2.2167, "step": 5560 }, { "epoch": 0.56, "learning_rate": 8.639661409197192e-06, "loss": 2.2653, "step": 5561 }, { "epoch": 0.56, "learning_rate": 8.636446535109875e-06, "loss": 2.3661, "step": 5562 }, { "epoch": 0.56, "learning_rate": 8.633231804614964e-06, "loss": 2.3251, "step": 5563 }, { "epoch": 0.56, "learning_rate": 8.630017218050994e-06, "loss": 2.3325, "step": 5564 }, { "epoch": 0.56, "learning_rate": 8.626802775756486e-06, "loss": 2.2107, "step": 5565 }, { "epoch": 0.56, "learning_rate": 8.623588478069943e-06, "loss": 2.3733, "step": 5566 }, { "epoch": 0.56, "learning_rate": 8.620374325329856e-06, "loss": 2.3983, "step": 5567 }, { "epoch": 0.56, "learning_rate": 8.6171603178747e-06, "loss": 2.3372, "step": 5568 }, { "epoch": 0.56, "learning_rate": 8.613946456042935e-06, "loss": 2.4091, "step": 5569 }, { "epoch": 0.56, "learning_rate": 8.610732740173e-06, "loss": 2.3603, "step": 5570 }, { "epoch": 0.56, "learning_rate": 8.607519170603329e-06, "loss": 2.361, "step": 5571 }, { "epoch": 0.56, "learning_rate": 8.604305747672332e-06, "loss": 2.2872, "step": 5572 }, { "epoch": 0.56, "learning_rate": 8.601092471718406e-06, "loss": 2.4338, "step": 5573 }, { "epoch": 0.56, "learning_rate": 8.597879343079935e-06, "loss": 2.2868, "step": 5574 }, { "epoch": 0.56, "learning_rate": 8.59466636209528e-06, "loss": 2.268, "step": 5575 }, { "epoch": 0.56, "learning_rate": 8.5914535291028e-06, "loss": 2.2604, "step": 5576 }, { "epoch": 0.56, "learning_rate": 8.588240844440828e-06, "loss": 2.2826, "step": 5577 }, { "epoch": 0.56, "learning_rate": 8.585028308447685e-06, "loss": 2.3457, "step": 5578 }, { "epoch": 0.56, "learning_rate": 8.58181592146167e-06, "loss": 2.4057, "step": 5579 }, { "epoch": 0.56, "learning_rate": 8.578603683821077e-06, "loss": 2.359, "step": 5580 }, { "epoch": 0.56, "learning_rate": 8.575391595864173e-06, "loss": 2.382, "step": 5581 }, { "epoch": 0.56, "learning_rate": 8.572179657929218e-06, "loss": 2.293, "step": 5582 }, { "epoch": 0.56, "learning_rate": 8.568967870354455e-06, "loss": 2.1777, "step": 5583 }, { "epoch": 0.56, "learning_rate": 8.565756233478101e-06, "loss": 2.35, "step": 5584 }, { "epoch": 0.56, "learning_rate": 8.56254474763838e-06, "loss": 2.2959, "step": 5585 }, { "epoch": 0.56, "learning_rate": 8.559333413173474e-06, "loss": 2.2413, "step": 5586 }, { "epoch": 0.56, "learning_rate": 8.556122230421565e-06, "loss": 2.3352, "step": 5587 }, { "epoch": 0.56, "learning_rate": 8.552911199720815e-06, "loss": 2.4372, "step": 5588 }, { "epoch": 0.56, "learning_rate": 8.549700321409366e-06, "loss": 2.4015, "step": 5589 }, { "epoch": 0.56, "learning_rate": 8.546489595825354e-06, "loss": 2.3582, "step": 5590 }, { "epoch": 0.56, "learning_rate": 8.543279023306887e-06, "loss": 2.3463, "step": 5591 }, { "epoch": 0.56, "learning_rate": 8.540068604192061e-06, "loss": 2.3833, "step": 5592 }, { "epoch": 0.56, "learning_rate": 8.536858338818957e-06, "loss": 2.3384, "step": 5593 }, { "epoch": 0.56, "learning_rate": 8.533648227525649e-06, "loss": 2.3668, "step": 5594 }, { "epoch": 0.56, "learning_rate": 8.530438270650177e-06, "loss": 2.2811, "step": 5595 }, { "epoch": 0.56, "learning_rate": 8.527228468530578e-06, "loss": 2.3319, "step": 5596 }, { "epoch": 0.56, "learning_rate": 8.524018821504864e-06, "loss": 2.299, "step": 5597 }, { "epoch": 0.56, "learning_rate": 8.52080932991104e-06, "loss": 2.2938, "step": 5598 }, { "epoch": 0.56, "learning_rate": 8.517599994087086e-06, "loss": 2.3486, "step": 5599 }, { "epoch": 0.56, "learning_rate": 8.514390814370973e-06, "loss": 2.339, "step": 5600 }, { "epoch": 0.56, "learning_rate": 8.511181791100645e-06, "loss": 2.3284, "step": 5601 }, { "epoch": 0.56, "learning_rate": 8.507972924614039e-06, "loss": 2.3541, "step": 5602 }, { "epoch": 0.56, "learning_rate": 8.504764215249077e-06, "loss": 2.3524, "step": 5603 }, { "epoch": 0.56, "learning_rate": 8.501555663343655e-06, "loss": 2.3108, "step": 5604 }, { "epoch": 0.56, "learning_rate": 8.498347269235661e-06, "loss": 2.3298, "step": 5605 }, { "epoch": 0.56, "learning_rate": 8.49513903326296e-06, "loss": 2.2517, "step": 5606 }, { "epoch": 0.56, "learning_rate": 8.491930955763407e-06, "loss": 2.3486, "step": 5607 }, { "epoch": 0.56, "learning_rate": 8.488723037074834e-06, "loss": 2.2697, "step": 5608 }, { "epoch": 0.56, "learning_rate": 8.485515277535056e-06, "loss": 2.3137, "step": 5609 }, { "epoch": 0.56, "learning_rate": 8.48230767748188e-06, "loss": 2.3424, "step": 5610 }, { "epoch": 0.56, "learning_rate": 8.479100237253086e-06, "loss": 2.2528, "step": 5611 }, { "epoch": 0.56, "learning_rate": 8.475892957186444e-06, "loss": 2.3711, "step": 5612 }, { "epoch": 0.56, "learning_rate": 8.472685837619706e-06, "loss": 2.3128, "step": 5613 }, { "epoch": 0.56, "learning_rate": 8.4694788788906e-06, "loss": 2.4373, "step": 5614 }, { "epoch": 0.56, "learning_rate": 8.46627208133685e-06, "loss": 2.3751, "step": 5615 }, { "epoch": 0.56, "learning_rate": 8.46306544529615e-06, "loss": 2.3539, "step": 5616 }, { "epoch": 0.56, "learning_rate": 8.459858971106186e-06, "loss": 2.4233, "step": 5617 }, { "epoch": 0.56, "learning_rate": 8.456652659104622e-06, "loss": 2.4997, "step": 5618 }, { "epoch": 0.56, "learning_rate": 8.45344650962911e-06, "loss": 2.313, "step": 5619 }, { "epoch": 0.56, "learning_rate": 8.450240523017275e-06, "loss": 2.3457, "step": 5620 }, { "epoch": 0.56, "learning_rate": 8.447034699606738e-06, "loss": 2.352, "step": 5621 }, { "epoch": 0.56, "learning_rate": 8.443829039735095e-06, "loss": 2.3185, "step": 5622 }, { "epoch": 0.56, "learning_rate": 8.440623543739924e-06, "loss": 2.4093, "step": 5623 }, { "epoch": 0.56, "learning_rate": 8.437418211958788e-06, "loss": 2.2446, "step": 5624 }, { "epoch": 0.56, "learning_rate": 8.434213044729233e-06, "loss": 2.3786, "step": 5625 }, { "epoch": 0.56, "learning_rate": 8.43100804238879e-06, "loss": 2.365, "step": 5626 }, { "epoch": 0.56, "learning_rate": 8.427803205274963e-06, "loss": 2.4213, "step": 5627 }, { "epoch": 0.56, "learning_rate": 8.424598533725252e-06, "loss": 2.3899, "step": 5628 }, { "epoch": 0.56, "learning_rate": 8.421394028077125e-06, "loss": 2.3388, "step": 5629 }, { "epoch": 0.56, "learning_rate": 8.418189688668052e-06, "loss": 2.3977, "step": 5630 }, { "epoch": 0.56, "learning_rate": 8.414985515835466e-06, "loss": 2.2708, "step": 5631 }, { "epoch": 0.56, "learning_rate": 8.411781509916793e-06, "loss": 2.3581, "step": 5632 }, { "epoch": 0.56, "learning_rate": 8.408577671249438e-06, "loss": 2.3748, "step": 5633 }, { "epoch": 0.56, "learning_rate": 8.40537400017079e-06, "loss": 2.3071, "step": 5634 }, { "epoch": 0.56, "learning_rate": 8.402170497018217e-06, "loss": 2.2528, "step": 5635 }, { "epoch": 0.56, "learning_rate": 8.398967162129074e-06, "loss": 2.4382, "step": 5636 }, { "epoch": 0.56, "learning_rate": 8.395763995840697e-06, "loss": 2.3536, "step": 5637 }, { "epoch": 0.56, "learning_rate": 8.392560998490399e-06, "loss": 2.3714, "step": 5638 }, { "epoch": 0.56, "learning_rate": 8.389358170415485e-06, "loss": 2.3856, "step": 5639 }, { "epoch": 0.57, "learning_rate": 8.386155511953239e-06, "loss": 2.3278, "step": 5640 }, { "epoch": 0.57, "learning_rate": 8.382953023440916e-06, "loss": 2.3074, "step": 5641 }, { "epoch": 0.57, "learning_rate": 8.379750705215771e-06, "loss": 2.3783, "step": 5642 }, { "epoch": 0.57, "learning_rate": 8.376548557615028e-06, "loss": 2.3088, "step": 5643 }, { "epoch": 0.57, "learning_rate": 8.373346580975895e-06, "loss": 2.3586, "step": 5644 }, { "epoch": 0.57, "learning_rate": 8.370144775635566e-06, "loss": 2.3675, "step": 5645 }, { "epoch": 0.57, "learning_rate": 8.366943141931216e-06, "loss": 2.4181, "step": 5646 }, { "epoch": 0.57, "learning_rate": 8.363741680199998e-06, "loss": 2.3968, "step": 5647 }, { "epoch": 0.57, "learning_rate": 8.360540390779055e-06, "loss": 2.4552, "step": 5648 }, { "epoch": 0.57, "learning_rate": 8.357339274005504e-06, "loss": 2.3262, "step": 5649 }, { "epoch": 0.57, "learning_rate": 8.354138330216448e-06, "loss": 2.2526, "step": 5650 }, { "epoch": 0.57, "learning_rate": 8.350937559748968e-06, "loss": 2.2987, "step": 5651 }, { "epoch": 0.57, "learning_rate": 8.347736962940131e-06, "loss": 2.387, "step": 5652 }, { "epoch": 0.57, "learning_rate": 8.344536540126982e-06, "loss": 2.4274, "step": 5653 }, { "epoch": 0.57, "learning_rate": 8.341336291646555e-06, "loss": 2.2256, "step": 5654 }, { "epoch": 0.57, "learning_rate": 8.338136217835848e-06, "loss": 2.3501, "step": 5655 }, { "epoch": 0.57, "learning_rate": 8.334936319031865e-06, "loss": 2.3481, "step": 5656 }, { "epoch": 0.57, "learning_rate": 8.331736595571576e-06, "loss": 2.4265, "step": 5657 }, { "epoch": 0.57, "learning_rate": 8.328537047791935e-06, "loss": 2.3793, "step": 5658 }, { "epoch": 0.57, "learning_rate": 8.325337676029876e-06, "loss": 2.3016, "step": 5659 }, { "epoch": 0.57, "learning_rate": 8.322138480622322e-06, "loss": 2.2959, "step": 5660 }, { "epoch": 0.57, "learning_rate": 8.318939461906168e-06, "loss": 2.1578, "step": 5661 }, { "epoch": 0.57, "learning_rate": 8.315740620218295e-06, "loss": 2.3216, "step": 5662 }, { "epoch": 0.57, "learning_rate": 8.312541955895567e-06, "loss": 2.405, "step": 5663 }, { "epoch": 0.57, "learning_rate": 8.309343469274826e-06, "loss": 2.4147, "step": 5664 }, { "epoch": 0.57, "learning_rate": 8.306145160692897e-06, "loss": 2.2143, "step": 5665 }, { "epoch": 0.57, "learning_rate": 8.302947030486586e-06, "loss": 2.2695, "step": 5666 }, { "epoch": 0.57, "learning_rate": 8.299749078992682e-06, "loss": 2.441, "step": 5667 }, { "epoch": 0.57, "learning_rate": 8.29655130654795e-06, "loss": 2.373, "step": 5668 }, { "epoch": 0.57, "learning_rate": 8.293353713489139e-06, "loss": 2.3446, "step": 5669 }, { "epoch": 0.57, "learning_rate": 8.290156300152984e-06, "loss": 2.1833, "step": 5670 }, { "epoch": 0.57, "learning_rate": 8.286959066876192e-06, "loss": 2.2912, "step": 5671 }, { "epoch": 0.57, "learning_rate": 8.283762013995457e-06, "loss": 2.3447, "step": 5672 }, { "epoch": 0.57, "learning_rate": 8.280565141847454e-06, "loss": 2.3704, "step": 5673 }, { "epoch": 0.57, "learning_rate": 8.277368450768836e-06, "loss": 2.3584, "step": 5674 }, { "epoch": 0.57, "learning_rate": 8.27417194109624e-06, "loss": 2.3573, "step": 5675 }, { "epoch": 0.57, "learning_rate": 8.270975613166282e-06, "loss": 2.2897, "step": 5676 }, { "epoch": 0.57, "learning_rate": 8.26777946731556e-06, "loss": 2.355, "step": 5677 }, { "epoch": 0.57, "learning_rate": 8.26458350388065e-06, "loss": 2.3782, "step": 5678 }, { "epoch": 0.57, "learning_rate": 8.261387723198112e-06, "loss": 2.3548, "step": 5679 }, { "epoch": 0.57, "learning_rate": 8.258192125604486e-06, "loss": 2.2489, "step": 5680 }, { "epoch": 0.57, "learning_rate": 8.254996711436292e-06, "loss": 2.3259, "step": 5681 }, { "epoch": 0.57, "learning_rate": 8.251801481030028e-06, "loss": 2.3324, "step": 5682 }, { "epoch": 0.57, "learning_rate": 8.248606434722183e-06, "loss": 2.2987, "step": 5683 }, { "epoch": 0.57, "learning_rate": 8.245411572849215e-06, "loss": 2.3614, "step": 5684 }, { "epoch": 0.57, "learning_rate": 8.242216895747566e-06, "loss": 2.2546, "step": 5685 }, { "epoch": 0.57, "learning_rate": 8.239022403753662e-06, "loss": 2.3508, "step": 5686 }, { "epoch": 0.57, "learning_rate": 8.235828097203905e-06, "loss": 2.4414, "step": 5687 }, { "epoch": 0.57, "learning_rate": 8.232633976434679e-06, "loss": 2.3085, "step": 5688 }, { "epoch": 0.57, "learning_rate": 8.229440041782352e-06, "loss": 2.4359, "step": 5689 }, { "epoch": 0.57, "learning_rate": 8.226246293583266e-06, "loss": 2.3075, "step": 5690 }, { "epoch": 0.57, "learning_rate": 8.223052732173744e-06, "loss": 2.3559, "step": 5691 }, { "epoch": 0.57, "learning_rate": 8.2198593578901e-06, "loss": 2.2367, "step": 5692 }, { "epoch": 0.57, "learning_rate": 8.216666171068615e-06, "loss": 2.2978, "step": 5693 }, { "epoch": 0.57, "learning_rate": 8.21347317204556e-06, "loss": 2.3353, "step": 5694 }, { "epoch": 0.57, "learning_rate": 8.210280361157176e-06, "loss": 2.2529, "step": 5695 }, { "epoch": 0.57, "learning_rate": 8.207087738739693e-06, "loss": 2.3063, "step": 5696 }, { "epoch": 0.57, "learning_rate": 8.203895305129315e-06, "loss": 2.338, "step": 5697 }, { "epoch": 0.57, "learning_rate": 8.200703060662232e-06, "loss": 2.3315, "step": 5698 }, { "epoch": 0.57, "learning_rate": 8.197511005674612e-06, "loss": 2.4676, "step": 5699 }, { "epoch": 0.57, "learning_rate": 8.194319140502597e-06, "loss": 2.39, "step": 5700 }, { "epoch": 0.57, "learning_rate": 8.191127465482322e-06, "loss": 2.398, "step": 5701 }, { "epoch": 0.57, "learning_rate": 8.187935980949892e-06, "loss": 2.3104, "step": 5702 }, { "epoch": 0.57, "learning_rate": 8.184744687241391e-06, "loss": 2.3455, "step": 5703 }, { "epoch": 0.57, "learning_rate": 8.18155358469289e-06, "loss": 2.3703, "step": 5704 }, { "epoch": 0.57, "learning_rate": 8.178362673640435e-06, "loss": 2.3164, "step": 5705 }, { "epoch": 0.57, "learning_rate": 8.175171954420052e-06, "loss": 2.2719, "step": 5706 }, { "epoch": 0.57, "learning_rate": 8.171981427367746e-06, "loss": 2.3291, "step": 5707 }, { "epoch": 0.57, "learning_rate": 8.168791092819508e-06, "loss": 2.3122, "step": 5708 }, { "epoch": 0.57, "learning_rate": 8.165600951111292e-06, "loss": 2.2902, "step": 5709 }, { "epoch": 0.57, "learning_rate": 8.162411002579061e-06, "loss": 2.4216, "step": 5710 }, { "epoch": 0.57, "learning_rate": 8.159221247558734e-06, "loss": 2.28, "step": 5711 }, { "epoch": 0.57, "learning_rate": 8.156031686386213e-06, "loss": 2.3135, "step": 5712 }, { "epoch": 0.57, "learning_rate": 8.152842319397384e-06, "loss": 2.3619, "step": 5713 }, { "epoch": 0.57, "learning_rate": 8.149653146928111e-06, "loss": 2.449, "step": 5714 }, { "epoch": 0.57, "learning_rate": 8.146464169314241e-06, "loss": 2.3032, "step": 5715 }, { "epoch": 0.57, "learning_rate": 8.143275386891594e-06, "loss": 2.3621, "step": 5716 }, { "epoch": 0.57, "learning_rate": 8.140086799995973e-06, "loss": 2.394, "step": 5717 }, { "epoch": 0.57, "learning_rate": 8.136898408963158e-06, "loss": 2.3861, "step": 5718 }, { "epoch": 0.57, "learning_rate": 8.133710214128916e-06, "loss": 2.3822, "step": 5719 }, { "epoch": 0.57, "learning_rate": 8.130522215828987e-06, "loss": 2.3063, "step": 5720 }, { "epoch": 0.57, "learning_rate": 8.127334414399086e-06, "loss": 2.3954, "step": 5721 }, { "epoch": 0.57, "learning_rate": 8.124146810174918e-06, "loss": 2.2498, "step": 5722 }, { "epoch": 0.57, "learning_rate": 8.120959403492158e-06, "loss": 2.3336, "step": 5723 }, { "epoch": 0.57, "learning_rate": 8.117772194686464e-06, "loss": 2.2428, "step": 5724 }, { "epoch": 0.57, "learning_rate": 8.114585184093476e-06, "loss": 2.2878, "step": 5725 }, { "epoch": 0.57, "learning_rate": 8.111398372048806e-06, "loss": 2.4032, "step": 5726 }, { "epoch": 0.57, "learning_rate": 8.10821175888805e-06, "loss": 2.3454, "step": 5727 }, { "epoch": 0.57, "learning_rate": 8.105025344946786e-06, "loss": 2.253, "step": 5728 }, { "epoch": 0.57, "learning_rate": 8.101839130560565e-06, "loss": 2.3556, "step": 5729 }, { "epoch": 0.57, "learning_rate": 8.098653116064919e-06, "loss": 2.3695, "step": 5730 }, { "epoch": 0.57, "learning_rate": 8.09546730179536e-06, "loss": 2.2594, "step": 5731 }, { "epoch": 0.57, "learning_rate": 8.092281688087376e-06, "loss": 2.3809, "step": 5732 }, { "epoch": 0.57, "learning_rate": 8.089096275276437e-06, "loss": 2.3038, "step": 5733 }, { "epoch": 0.57, "learning_rate": 8.085911063697992e-06, "loss": 2.3486, "step": 5734 }, { "epoch": 0.57, "learning_rate": 8.082726053687468e-06, "loss": 2.3895, "step": 5735 }, { "epoch": 0.57, "learning_rate": 8.079541245580267e-06, "loss": 2.239, "step": 5736 }, { "epoch": 0.57, "learning_rate": 8.076356639711778e-06, "loss": 2.2667, "step": 5737 }, { "epoch": 0.57, "learning_rate": 8.07317223641736e-06, "loss": 2.2842, "step": 5738 }, { "epoch": 0.57, "learning_rate": 8.069988036032358e-06, "loss": 2.3607, "step": 5739 }, { "epoch": 0.58, "learning_rate": 8.066804038892088e-06, "loss": 2.2927, "step": 5740 }, { "epoch": 0.58, "learning_rate": 8.063620245331853e-06, "loss": 2.2588, "step": 5741 }, { "epoch": 0.58, "learning_rate": 8.060436655686927e-06, "loss": 2.3627, "step": 5742 }, { "epoch": 0.58, "learning_rate": 8.057253270292569e-06, "loss": 2.4072, "step": 5743 }, { "epoch": 0.58, "learning_rate": 8.054070089484009e-06, "loss": 2.3315, "step": 5744 }, { "epoch": 0.58, "learning_rate": 8.050887113596463e-06, "loss": 2.3636, "step": 5745 }, { "epoch": 0.58, "learning_rate": 8.047704342965121e-06, "loss": 2.2352, "step": 5746 }, { "epoch": 0.58, "learning_rate": 8.044521777925157e-06, "loss": 2.2343, "step": 5747 }, { "epoch": 0.58, "learning_rate": 8.041339418811711e-06, "loss": 2.4127, "step": 5748 }, { "epoch": 0.58, "learning_rate": 8.038157265959917e-06, "loss": 2.3562, "step": 5749 }, { "epoch": 0.58, "learning_rate": 8.034975319704873e-06, "loss": 2.353, "step": 5750 }, { "epoch": 0.58, "learning_rate": 8.031793580381665e-06, "loss": 2.3011, "step": 5751 }, { "epoch": 0.58, "learning_rate": 8.028612048325357e-06, "loss": 2.3847, "step": 5752 }, { "epoch": 0.58, "learning_rate": 8.025430723870982e-06, "loss": 2.3576, "step": 5753 }, { "epoch": 0.58, "learning_rate": 8.022249607353558e-06, "loss": 2.3066, "step": 5754 }, { "epoch": 0.58, "learning_rate": 8.019068699108086e-06, "loss": 2.2865, "step": 5755 }, { "epoch": 0.58, "learning_rate": 8.015887999469537e-06, "loss": 2.3216, "step": 5756 }, { "epoch": 0.58, "learning_rate": 8.012707508772863e-06, "loss": 2.3144, "step": 5757 }, { "epoch": 0.58, "learning_rate": 8.009527227352992e-06, "loss": 2.2884, "step": 5758 }, { "epoch": 0.58, "learning_rate": 8.006347155544831e-06, "loss": 2.4024, "step": 5759 }, { "epoch": 0.58, "learning_rate": 8.003167293683265e-06, "loss": 2.2285, "step": 5760 }, { "epoch": 0.58, "learning_rate": 7.99998764210316e-06, "loss": 2.415, "step": 5761 }, { "epoch": 0.58, "learning_rate": 7.996808201139354e-06, "loss": 2.4191, "step": 5762 }, { "epoch": 0.58, "learning_rate": 7.993628971126665e-06, "loss": 2.3855, "step": 5763 }, { "epoch": 0.58, "learning_rate": 7.990449952399895e-06, "loss": 2.3391, "step": 5764 }, { "epoch": 0.58, "learning_rate": 7.987271145293818e-06, "loss": 2.3567, "step": 5765 }, { "epoch": 0.58, "learning_rate": 7.984092550143183e-06, "loss": 2.3761, "step": 5766 }, { "epoch": 0.58, "learning_rate": 7.980914167282722e-06, "loss": 2.3089, "step": 5767 }, { "epoch": 0.58, "learning_rate": 7.97773599704714e-06, "loss": 2.4028, "step": 5768 }, { "epoch": 0.58, "learning_rate": 7.974558039771126e-06, "loss": 2.4357, "step": 5769 }, { "epoch": 0.58, "learning_rate": 7.971380295789341e-06, "loss": 2.265, "step": 5770 }, { "epoch": 0.58, "learning_rate": 7.968202765436424e-06, "loss": 2.317, "step": 5771 }, { "epoch": 0.58, "learning_rate": 7.965025449046988e-06, "loss": 2.2668, "step": 5772 }, { "epoch": 0.58, "learning_rate": 7.961848346955639e-06, "loss": 2.3485, "step": 5773 }, { "epoch": 0.58, "learning_rate": 7.958671459496944e-06, "loss": 2.29, "step": 5774 }, { "epoch": 0.58, "learning_rate": 7.955494787005452e-06, "loss": 2.379, "step": 5775 }, { "epoch": 0.58, "learning_rate": 7.952318329815694e-06, "loss": 2.3104, "step": 5776 }, { "epoch": 0.58, "learning_rate": 7.949142088262175e-06, "loss": 2.3175, "step": 5777 }, { "epoch": 0.58, "learning_rate": 7.945966062679371e-06, "loss": 2.3149, "step": 5778 }, { "epoch": 0.58, "learning_rate": 7.942790253401747e-06, "loss": 2.3835, "step": 5779 }, { "epoch": 0.58, "learning_rate": 7.939614660763737e-06, "loss": 2.322, "step": 5780 }, { "epoch": 0.58, "learning_rate": 7.936439285099753e-06, "loss": 2.2325, "step": 5781 }, { "epoch": 0.58, "learning_rate": 7.933264126744192e-06, "loss": 2.2978, "step": 5782 }, { "epoch": 0.58, "learning_rate": 7.930089186031416e-06, "loss": 2.2504, "step": 5783 }, { "epoch": 0.58, "learning_rate": 7.926914463295774e-06, "loss": 2.3469, "step": 5784 }, { "epoch": 0.58, "learning_rate": 7.923739958871586e-06, "loss": 2.35, "step": 5785 }, { "epoch": 0.58, "learning_rate": 7.92056567309315e-06, "loss": 2.1568, "step": 5786 }, { "epoch": 0.58, "learning_rate": 7.917391606294745e-06, "loss": 2.3169, "step": 5787 }, { "epoch": 0.58, "learning_rate": 7.914217758810625e-06, "loss": 2.4111, "step": 5788 }, { "epoch": 0.58, "learning_rate": 7.911044130975014e-06, "loss": 2.3701, "step": 5789 }, { "epoch": 0.58, "learning_rate": 7.907870723122123e-06, "loss": 2.3436, "step": 5790 }, { "epoch": 0.58, "learning_rate": 7.904697535586135e-06, "loss": 2.2769, "step": 5791 }, { "epoch": 0.58, "learning_rate": 7.901524568701212e-06, "loss": 2.2714, "step": 5792 }, { "epoch": 0.58, "learning_rate": 7.89835182280149e-06, "loss": 2.3413, "step": 5793 }, { "epoch": 0.58, "learning_rate": 7.895179298221081e-06, "loss": 2.3719, "step": 5794 }, { "epoch": 0.58, "learning_rate": 7.892006995294079e-06, "loss": 2.2948, "step": 5795 }, { "epoch": 0.58, "learning_rate": 7.888834914354548e-06, "loss": 2.3054, "step": 5796 }, { "epoch": 0.58, "learning_rate": 7.885663055736535e-06, "loss": 2.4221, "step": 5797 }, { "epoch": 0.58, "learning_rate": 7.882491419774058e-06, "loss": 2.3071, "step": 5798 }, { "epoch": 0.58, "learning_rate": 7.879320006801114e-06, "loss": 2.3338, "step": 5799 }, { "epoch": 0.58, "learning_rate": 7.87614881715168e-06, "loss": 2.3664, "step": 5800 }, { "epoch": 0.58, "learning_rate": 7.872977851159703e-06, "loss": 2.249, "step": 5801 }, { "epoch": 0.58, "learning_rate": 7.86980710915911e-06, "loss": 2.3361, "step": 5802 }, { "epoch": 0.58, "learning_rate": 7.866636591483805e-06, "loss": 2.3662, "step": 5803 }, { "epoch": 0.58, "learning_rate": 7.863466298467665e-06, "loss": 2.395, "step": 5804 }, { "epoch": 0.58, "learning_rate": 7.860296230444548e-06, "loss": 2.3529, "step": 5805 }, { "epoch": 0.58, "learning_rate": 7.857126387748286e-06, "loss": 2.3324, "step": 5806 }, { "epoch": 0.58, "learning_rate": 7.853956770712684e-06, "loss": 2.3823, "step": 5807 }, { "epoch": 0.58, "learning_rate": 7.850787379671525e-06, "loss": 2.2855, "step": 5808 }, { "epoch": 0.58, "learning_rate": 7.847618214958582e-06, "loss": 2.3019, "step": 5809 }, { "epoch": 0.58, "learning_rate": 7.844449276907577e-06, "loss": 2.279, "step": 5810 }, { "epoch": 0.58, "learning_rate": 7.841280565852232e-06, "loss": 2.3874, "step": 5811 }, { "epoch": 0.58, "learning_rate": 7.838112082126232e-06, "loss": 2.1894, "step": 5812 }, { "epoch": 0.58, "learning_rate": 7.834943826063243e-06, "loss": 2.3807, "step": 5813 }, { "epoch": 0.58, "learning_rate": 7.831775797996907e-06, "loss": 2.2985, "step": 5814 }, { "epoch": 0.58, "learning_rate": 7.82860799826084e-06, "loss": 2.3286, "step": 5815 }, { "epoch": 0.58, "learning_rate": 7.825440427188635e-06, "loss": 2.264, "step": 5816 }, { "epoch": 0.58, "learning_rate": 7.82227308511386e-06, "loss": 2.3528, "step": 5817 }, { "epoch": 0.58, "learning_rate": 7.81910597237006e-06, "loss": 2.217, "step": 5818 }, { "epoch": 0.58, "learning_rate": 7.815939089290762e-06, "loss": 2.3089, "step": 5819 }, { "epoch": 0.58, "learning_rate": 7.812772436209456e-06, "loss": 2.2913, "step": 5820 }, { "epoch": 0.58, "learning_rate": 7.809606013459618e-06, "loss": 2.346, "step": 5821 }, { "epoch": 0.58, "learning_rate": 7.806439821374692e-06, "loss": 2.1921, "step": 5822 }, { "epoch": 0.58, "learning_rate": 7.803273860288105e-06, "loss": 2.3328, "step": 5823 }, { "epoch": 0.58, "learning_rate": 7.800108130533253e-06, "loss": 2.2856, "step": 5824 }, { "epoch": 0.58, "learning_rate": 7.79694263244351e-06, "loss": 2.3917, "step": 5825 }, { "epoch": 0.58, "learning_rate": 7.793777366352233e-06, "loss": 2.352, "step": 5826 }, { "epoch": 0.58, "learning_rate": 7.790612332592748e-06, "loss": 2.3467, "step": 5827 }, { "epoch": 0.58, "learning_rate": 7.787447531498351e-06, "loss": 2.3976, "step": 5828 }, { "epoch": 0.58, "learning_rate": 7.784282963402325e-06, "loss": 2.4973, "step": 5829 }, { "epoch": 0.58, "learning_rate": 7.781118628637918e-06, "loss": 2.2874, "step": 5830 }, { "epoch": 0.58, "learning_rate": 7.777954527538362e-06, "loss": 2.417, "step": 5831 }, { "epoch": 0.58, "learning_rate": 7.774790660436857e-06, "loss": 2.4205, "step": 5832 }, { "epoch": 0.58, "learning_rate": 7.771627027666585e-06, "loss": 2.3398, "step": 5833 }, { "epoch": 0.58, "learning_rate": 7.768463629560696e-06, "loss": 2.362, "step": 5834 }, { "epoch": 0.58, "learning_rate": 7.765300466452326e-06, "loss": 2.3918, "step": 5835 }, { "epoch": 0.58, "learning_rate": 7.762137538674576e-06, "loss": 2.4303, "step": 5836 }, { "epoch": 0.58, "learning_rate": 7.758974846560525e-06, "loss": 2.3433, "step": 5837 }, { "epoch": 0.58, "learning_rate": 7.755812390443231e-06, "loss": 2.2238, "step": 5838 }, { "epoch": 0.59, "learning_rate": 7.752650170655722e-06, "loss": 2.221, "step": 5839 }, { "epoch": 0.59, "learning_rate": 7.749488187531005e-06, "loss": 2.3015, "step": 5840 }, { "epoch": 0.59, "learning_rate": 7.74632644140206e-06, "loss": 2.2967, "step": 5841 }, { "epoch": 0.59, "learning_rate": 7.743164932601842e-06, "loss": 2.2545, "step": 5842 }, { "epoch": 0.59, "learning_rate": 7.74000366146328e-06, "loss": 2.3109, "step": 5843 }, { "epoch": 0.59, "learning_rate": 7.736842628319286e-06, "loss": 2.3235, "step": 5844 }, { "epoch": 0.59, "learning_rate": 7.733681833502732e-06, "loss": 2.3747, "step": 5845 }, { "epoch": 0.59, "learning_rate": 7.73052127734648e-06, "loss": 2.3787, "step": 5846 }, { "epoch": 0.59, "learning_rate": 7.72736096018336e-06, "loss": 2.366, "step": 5847 }, { "epoch": 0.59, "learning_rate": 7.72420088234617e-06, "loss": 2.4175, "step": 5848 }, { "epoch": 0.59, "learning_rate": 7.721041044167698e-06, "loss": 2.3466, "step": 5849 }, { "epoch": 0.59, "learning_rate": 7.717881445980695e-06, "loss": 2.3667, "step": 5850 }, { "epoch": 0.59, "learning_rate": 7.71472208811789e-06, "loss": 2.3647, "step": 5851 }, { "epoch": 0.59, "learning_rate": 7.711562970911987e-06, "loss": 2.2012, "step": 5852 }, { "epoch": 0.59, "learning_rate": 7.708404094695668e-06, "loss": 2.352, "step": 5853 }, { "epoch": 0.59, "learning_rate": 7.705245459801583e-06, "loss": 2.3, "step": 5854 }, { "epoch": 0.59, "learning_rate": 7.702087066562361e-06, "loss": 2.2924, "step": 5855 }, { "epoch": 0.59, "learning_rate": 7.698928915310605e-06, "loss": 2.358, "step": 5856 }, { "epoch": 0.59, "learning_rate": 7.69577100637889e-06, "loss": 2.3131, "step": 5857 }, { "epoch": 0.59, "learning_rate": 7.69261334009977e-06, "loss": 2.2166, "step": 5858 }, { "epoch": 0.59, "learning_rate": 7.68945591680577e-06, "loss": 2.3349, "step": 5859 }, { "epoch": 0.59, "learning_rate": 7.686298736829391e-06, "loss": 2.3384, "step": 5860 }, { "epoch": 0.59, "learning_rate": 7.683141800503103e-06, "loss": 2.2829, "step": 5861 }, { "epoch": 0.59, "learning_rate": 7.679985108159362e-06, "loss": 2.3146, "step": 5862 }, { "epoch": 0.59, "learning_rate": 7.67682866013059e-06, "loss": 2.2911, "step": 5863 }, { "epoch": 0.59, "learning_rate": 7.673672456749182e-06, "loss": 2.2611, "step": 5864 }, { "epoch": 0.59, "learning_rate": 7.67051649834751e-06, "loss": 2.3647, "step": 5865 }, { "epoch": 0.59, "learning_rate": 7.667360785257922e-06, "loss": 2.3567, "step": 5866 }, { "epoch": 0.59, "learning_rate": 7.664205317812736e-06, "loss": 2.2623, "step": 5867 }, { "epoch": 0.59, "learning_rate": 7.66105009634425e-06, "loss": 2.325, "step": 5868 }, { "epoch": 0.59, "learning_rate": 7.657895121184729e-06, "loss": 2.2996, "step": 5869 }, { "epoch": 0.59, "learning_rate": 7.654740392666411e-06, "loss": 2.3443, "step": 5870 }, { "epoch": 0.59, "learning_rate": 7.651585911121525e-06, "loss": 2.3439, "step": 5871 }, { "epoch": 0.59, "learning_rate": 7.648431676882254e-06, "loss": 2.3008, "step": 5872 }, { "epoch": 0.59, "learning_rate": 7.645277690280766e-06, "loss": 2.2625, "step": 5873 }, { "epoch": 0.59, "learning_rate": 7.642123951649193e-06, "loss": 2.1925, "step": 5874 }, { "epoch": 0.59, "learning_rate": 7.638970461319653e-06, "loss": 2.3018, "step": 5875 }, { "epoch": 0.59, "learning_rate": 7.635817219624229e-06, "loss": 2.3379, "step": 5876 }, { "epoch": 0.59, "learning_rate": 7.632664226894982e-06, "loss": 2.3232, "step": 5877 }, { "epoch": 0.59, "learning_rate": 7.629511483463947e-06, "loss": 2.2577, "step": 5878 }, { "epoch": 0.59, "learning_rate": 7.626358989663127e-06, "loss": 2.284, "step": 5879 }, { "epoch": 0.59, "learning_rate": 7.623206745824511e-06, "loss": 2.3464, "step": 5880 }, { "epoch": 0.59, "learning_rate": 7.620054752280048e-06, "loss": 2.2266, "step": 5881 }, { "epoch": 0.59, "learning_rate": 7.6169030093616705e-06, "loss": 2.3493, "step": 5882 }, { "epoch": 0.59, "learning_rate": 7.613751517401278e-06, "loss": 2.3234, "step": 5883 }, { "epoch": 0.59, "learning_rate": 7.6106002767307465e-06, "loss": 2.3905, "step": 5884 }, { "epoch": 0.59, "learning_rate": 7.6074492876819275e-06, "loss": 2.2597, "step": 5885 }, { "epoch": 0.59, "learning_rate": 7.604298550586639e-06, "loss": 2.3323, "step": 5886 }, { "epoch": 0.59, "learning_rate": 7.601148065776681e-06, "loss": 2.36, "step": 5887 }, { "epoch": 0.59, "learning_rate": 7.597997833583819e-06, "loss": 2.3543, "step": 5888 }, { "epoch": 0.59, "learning_rate": 7.5948478543398015e-06, "loss": 2.2945, "step": 5889 }, { "epoch": 0.59, "learning_rate": 7.591698128376343e-06, "loss": 2.321, "step": 5890 }, { "epoch": 0.59, "learning_rate": 7.588548656025135e-06, "loss": 2.281, "step": 5891 }, { "epoch": 0.59, "learning_rate": 7.5853994376178375e-06, "loss": 2.3032, "step": 5892 }, { "epoch": 0.59, "learning_rate": 7.582250473486087e-06, "loss": 2.2583, "step": 5893 }, { "epoch": 0.59, "learning_rate": 7.579101763961495e-06, "loss": 2.3702, "step": 5894 }, { "epoch": 0.59, "learning_rate": 7.575953309375643e-06, "loss": 2.3295, "step": 5895 }, { "epoch": 0.59, "learning_rate": 7.572805110060087e-06, "loss": 2.3082, "step": 5896 }, { "epoch": 0.59, "learning_rate": 7.569657166346354e-06, "loss": 2.3687, "step": 5897 }, { "epoch": 0.59, "learning_rate": 7.566509478565949e-06, "loss": 2.1893, "step": 5898 }, { "epoch": 0.59, "learning_rate": 7.563362047050348e-06, "loss": 2.3005, "step": 5899 }, { "epoch": 0.59, "learning_rate": 7.560214872130997e-06, "loss": 2.3185, "step": 5900 }, { "epoch": 0.59, "learning_rate": 7.557067954139316e-06, "loss": 2.3472, "step": 5901 }, { "epoch": 0.59, "learning_rate": 7.553921293406702e-06, "loss": 2.3283, "step": 5902 }, { "epoch": 0.59, "learning_rate": 7.550774890264521e-06, "loss": 2.3413, "step": 5903 }, { "epoch": 0.59, "learning_rate": 7.547628745044111e-06, "loss": 2.3065, "step": 5904 }, { "epoch": 0.59, "learning_rate": 7.544482858076787e-06, "loss": 2.412, "step": 5905 }, { "epoch": 0.59, "learning_rate": 7.541337229693831e-06, "loss": 2.3577, "step": 5906 }, { "epoch": 0.59, "learning_rate": 7.5381918602265066e-06, "loss": 2.254, "step": 5907 }, { "epoch": 0.59, "learning_rate": 7.535046750006042e-06, "loss": 2.3815, "step": 5908 }, { "epoch": 0.59, "learning_rate": 7.531901899363641e-06, "loss": 2.3994, "step": 5909 }, { "epoch": 0.59, "learning_rate": 7.528757308630479e-06, "loss": 2.2977, "step": 5910 }, { "epoch": 0.59, "learning_rate": 7.525612978137706e-06, "loss": 2.3176, "step": 5911 }, { "epoch": 0.59, "learning_rate": 7.522468908216445e-06, "loss": 2.2756, "step": 5912 }, { "epoch": 0.59, "learning_rate": 7.519325099197787e-06, "loss": 2.2953, "step": 5913 }, { "epoch": 0.59, "learning_rate": 7.5161815514128e-06, "loss": 2.3633, "step": 5914 }, { "epoch": 0.59, "learning_rate": 7.513038265192523e-06, "loss": 2.4469, "step": 5915 }, { "epoch": 0.59, "learning_rate": 7.509895240867968e-06, "loss": 2.3499, "step": 5916 }, { "epoch": 0.59, "learning_rate": 7.50675247877012e-06, "loss": 2.2937, "step": 5917 }, { "epoch": 0.59, "learning_rate": 7.503609979229936e-06, "loss": 2.3901, "step": 5918 }, { "epoch": 0.59, "learning_rate": 7.500467742578341e-06, "loss": 2.3376, "step": 5919 }, { "epoch": 0.59, "learning_rate": 7.497325769146239e-06, "loss": 2.4172, "step": 5920 }, { "epoch": 0.59, "learning_rate": 7.494184059264505e-06, "loss": 2.3962, "step": 5921 }, { "epoch": 0.59, "learning_rate": 7.491042613263979e-06, "loss": 2.3802, "step": 5922 }, { "epoch": 0.59, "learning_rate": 7.487901431475484e-06, "loss": 2.3607, "step": 5923 }, { "epoch": 0.59, "learning_rate": 7.484760514229803e-06, "loss": 2.303, "step": 5924 }, { "epoch": 0.59, "learning_rate": 7.481619861857711e-06, "loss": 2.2792, "step": 5925 }, { "epoch": 0.59, "learning_rate": 7.478479474689931e-06, "loss": 2.2087, "step": 5926 }, { "epoch": 0.59, "learning_rate": 7.475339353057174e-06, "loss": 2.3005, "step": 5927 }, { "epoch": 0.59, "learning_rate": 7.472199497290116e-06, "loss": 2.2718, "step": 5928 }, { "epoch": 0.59, "learning_rate": 7.469059907719409e-06, "loss": 2.1741, "step": 5929 }, { "epoch": 0.59, "learning_rate": 7.465920584675674e-06, "loss": 2.2935, "step": 5930 }, { "epoch": 0.59, "learning_rate": 7.462781528489509e-06, "loss": 2.3557, "step": 5931 }, { "epoch": 0.59, "learning_rate": 7.459642739491475e-06, "loss": 2.2323, "step": 5932 }, { "epoch": 0.59, "learning_rate": 7.456504218012109e-06, "loss": 2.2971, "step": 5933 }, { "epoch": 0.59, "learning_rate": 7.4533659643819274e-06, "loss": 2.1821, "step": 5934 }, { "epoch": 0.59, "learning_rate": 7.45022797893141e-06, "loss": 2.3276, "step": 5935 }, { "epoch": 0.59, "learning_rate": 7.447090261991008e-06, "loss": 2.3183, "step": 5936 }, { "epoch": 0.59, "learning_rate": 7.443952813891149e-06, "loss": 2.2394, "step": 5937 }, { "epoch": 0.59, "learning_rate": 7.440815634962227e-06, "loss": 2.2557, "step": 5938 }, { "epoch": 0.6, "learning_rate": 7.437678725534611e-06, "loss": 2.4213, "step": 5939 }, { "epoch": 0.6, "learning_rate": 7.434542085938643e-06, "loss": 2.3655, "step": 5940 }, { "epoch": 0.6, "learning_rate": 7.431405716504631e-06, "loss": 2.2941, "step": 5941 }, { "epoch": 0.6, "learning_rate": 7.428269617562859e-06, "loss": 2.3076, "step": 5942 }, { "epoch": 0.6, "learning_rate": 7.425133789443586e-06, "loss": 2.2859, "step": 5943 }, { "epoch": 0.6, "learning_rate": 7.421998232477037e-06, "loss": 2.175, "step": 5944 }, { "epoch": 0.6, "learning_rate": 7.418862946993406e-06, "loss": 2.3013, "step": 5945 }, { "epoch": 0.6, "learning_rate": 7.415727933322866e-06, "loss": 2.353, "step": 5946 }, { "epoch": 0.6, "learning_rate": 7.412593191795557e-06, "loss": 2.3321, "step": 5947 }, { "epoch": 0.6, "learning_rate": 7.4094587227415874e-06, "loss": 2.3205, "step": 5948 }, { "epoch": 0.6, "learning_rate": 7.4063245264910444e-06, "loss": 2.3284, "step": 5949 }, { "epoch": 0.6, "learning_rate": 7.40319060337398e-06, "loss": 2.3853, "step": 5950 }, { "epoch": 0.6, "learning_rate": 7.400056953720414e-06, "loss": 2.3377, "step": 5951 }, { "epoch": 0.6, "learning_rate": 7.396923577860356e-06, "loss": 2.4551, "step": 5952 }, { "epoch": 0.6, "learning_rate": 7.393790476123766e-06, "loss": 2.2577, "step": 5953 }, { "epoch": 0.6, "learning_rate": 7.390657648840584e-06, "loss": 2.4371, "step": 5954 }, { "epoch": 0.6, "learning_rate": 7.387525096340722e-06, "loss": 2.3219, "step": 5955 }, { "epoch": 0.6, "learning_rate": 7.384392818954059e-06, "loss": 2.3372, "step": 5956 }, { "epoch": 0.6, "learning_rate": 7.3812608170104494e-06, "loss": 2.3523, "step": 5957 }, { "epoch": 0.6, "learning_rate": 7.378129090839714e-06, "loss": 2.3439, "step": 5958 }, { "epoch": 0.6, "learning_rate": 7.374997640771651e-06, "loss": 2.2601, "step": 5959 }, { "epoch": 0.6, "learning_rate": 7.371866467136018e-06, "loss": 2.3998, "step": 5960 }, { "epoch": 0.6, "learning_rate": 7.368735570262559e-06, "loss": 2.1468, "step": 5961 }, { "epoch": 0.6, "learning_rate": 7.36560495048098e-06, "loss": 2.2075, "step": 5962 }, { "epoch": 0.6, "learning_rate": 7.362474608120955e-06, "loss": 2.3176, "step": 5963 }, { "epoch": 0.6, "learning_rate": 7.359344543512135e-06, "loss": 2.2543, "step": 5964 }, { "epoch": 0.6, "learning_rate": 7.356214756984138e-06, "loss": 2.349, "step": 5965 }, { "epoch": 0.6, "learning_rate": 7.3530852488665535e-06, "loss": 2.2233, "step": 5966 }, { "epoch": 0.6, "learning_rate": 7.349956019488946e-06, "loss": 2.4808, "step": 5967 }, { "epoch": 0.6, "learning_rate": 7.346827069180842e-06, "loss": 2.1832, "step": 5968 }, { "epoch": 0.6, "learning_rate": 7.343698398271743e-06, "loss": 2.3489, "step": 5969 }, { "epoch": 0.6, "learning_rate": 7.340570007091128e-06, "loss": 2.3797, "step": 5970 }, { "epoch": 0.6, "learning_rate": 7.337441895968436e-06, "loss": 2.403, "step": 5971 }, { "epoch": 0.6, "learning_rate": 7.334314065233079e-06, "loss": 2.2677, "step": 5972 }, { "epoch": 0.6, "learning_rate": 7.331186515214444e-06, "loss": 2.3457, "step": 5973 }, { "epoch": 0.6, "learning_rate": 7.328059246241883e-06, "loss": 2.265, "step": 5974 }, { "epoch": 0.6, "learning_rate": 7.324932258644723e-06, "loss": 2.3762, "step": 5975 }, { "epoch": 0.6, "learning_rate": 7.321805552752259e-06, "loss": 2.3477, "step": 5976 }, { "epoch": 0.6, "learning_rate": 7.318679128893754e-06, "loss": 2.3494, "step": 5977 }, { "epoch": 0.6, "learning_rate": 7.315552987398444e-06, "loss": 2.3169, "step": 5978 }, { "epoch": 0.6, "learning_rate": 7.31242712859554e-06, "loss": 2.3815, "step": 5979 }, { "epoch": 0.6, "learning_rate": 7.309301552814214e-06, "loss": 2.359, "step": 5980 }, { "epoch": 0.6, "learning_rate": 7.306176260383615e-06, "loss": 2.3628, "step": 5981 }, { "epoch": 0.6, "learning_rate": 7.303051251632858e-06, "loss": 2.3091, "step": 5982 }, { "epoch": 0.6, "learning_rate": 7.2999265268910304e-06, "loss": 2.294, "step": 5983 }, { "epoch": 0.6, "learning_rate": 7.296802086487189e-06, "loss": 2.4084, "step": 5984 }, { "epoch": 0.6, "learning_rate": 7.293677930750361e-06, "loss": 2.4273, "step": 5985 }, { "epoch": 0.6, "learning_rate": 7.290554060009543e-06, "loss": 2.2282, "step": 5986 }, { "epoch": 0.6, "learning_rate": 7.287430474593698e-06, "loss": 2.3598, "step": 5987 }, { "epoch": 0.6, "learning_rate": 7.284307174831773e-06, "loss": 2.3266, "step": 5988 }, { "epoch": 0.6, "learning_rate": 7.2811841610526705e-06, "loss": 2.329, "step": 5989 }, { "epoch": 0.6, "learning_rate": 7.278061433585264e-06, "loss": 2.2868, "step": 5990 }, { "epoch": 0.6, "learning_rate": 7.274938992758402e-06, "loss": 2.4192, "step": 5991 }, { "epoch": 0.6, "learning_rate": 7.2718168389009016e-06, "loss": 2.3372, "step": 5992 }, { "epoch": 0.6, "learning_rate": 7.268694972341548e-06, "loss": 2.3347, "step": 5993 }, { "epoch": 0.6, "learning_rate": 7.265573393409097e-06, "loss": 2.3459, "step": 5994 }, { "epoch": 0.6, "learning_rate": 7.262452102432271e-06, "loss": 2.3181, "step": 5995 }, { "epoch": 0.6, "learning_rate": 7.259331099739774e-06, "loss": 2.3422, "step": 5996 }, { "epoch": 0.6, "learning_rate": 7.256210385660267e-06, "loss": 2.222, "step": 5997 }, { "epoch": 0.6, "learning_rate": 7.253089960522384e-06, "loss": 2.35, "step": 5998 }, { "epoch": 0.6, "learning_rate": 7.2499698246547275e-06, "loss": 2.3291, "step": 5999 }, { "epoch": 0.6, "learning_rate": 7.246849978385874e-06, "loss": 2.2203, "step": 6000 }, { "epoch": 0.6, "learning_rate": 7.243730422044366e-06, "loss": 2.3751, "step": 6001 }, { "epoch": 0.6, "learning_rate": 7.240611155958716e-06, "loss": 2.3276, "step": 6002 }, { "epoch": 0.6, "learning_rate": 7.2374921804574035e-06, "loss": 2.2803, "step": 6003 }, { "epoch": 0.6, "learning_rate": 7.234373495868879e-06, "loss": 2.2441, "step": 6004 }, { "epoch": 0.6, "learning_rate": 7.23125510252157e-06, "loss": 2.2931, "step": 6005 }, { "epoch": 0.6, "learning_rate": 7.228137000743864e-06, "loss": 2.3389, "step": 6006 }, { "epoch": 0.6, "learning_rate": 7.22501919086412e-06, "loss": 2.3248, "step": 6007 }, { "epoch": 0.6, "learning_rate": 7.221901673210667e-06, "loss": 2.3127, "step": 6008 }, { "epoch": 0.6, "learning_rate": 7.218784448111802e-06, "loss": 2.2502, "step": 6009 }, { "epoch": 0.6, "learning_rate": 7.215667515895793e-06, "loss": 2.3129, "step": 6010 }, { "epoch": 0.6, "learning_rate": 7.212550876890876e-06, "loss": 2.354, "step": 6011 }, { "epoch": 0.6, "learning_rate": 7.209434531425257e-06, "loss": 2.31, "step": 6012 }, { "epoch": 0.6, "learning_rate": 7.206318479827108e-06, "loss": 2.312, "step": 6013 }, { "epoch": 0.6, "learning_rate": 7.203202722424576e-06, "loss": 2.3388, "step": 6014 }, { "epoch": 0.6, "learning_rate": 7.2000872595457725e-06, "loss": 2.2528, "step": 6015 }, { "epoch": 0.6, "learning_rate": 7.196972091518779e-06, "loss": 2.2393, "step": 6016 }, { "epoch": 0.6, "learning_rate": 7.1938572186716475e-06, "loss": 2.4042, "step": 6017 }, { "epoch": 0.6, "learning_rate": 7.190742641332393e-06, "loss": 2.247, "step": 6018 }, { "epoch": 0.6, "learning_rate": 7.187628359829009e-06, "loss": 2.2825, "step": 6019 }, { "epoch": 0.6, "learning_rate": 7.184514374489451e-06, "loss": 2.4558, "step": 6020 }, { "epoch": 0.6, "learning_rate": 7.181400685641643e-06, "loss": 2.3591, "step": 6021 }, { "epoch": 0.6, "learning_rate": 7.17828729361348e-06, "loss": 2.2616, "step": 6022 }, { "epoch": 0.6, "learning_rate": 7.1751741987328285e-06, "loss": 2.2796, "step": 6023 }, { "epoch": 0.6, "learning_rate": 7.172061401327519e-06, "loss": 2.2605, "step": 6024 }, { "epoch": 0.6, "learning_rate": 7.1689489017253545e-06, "loss": 2.3826, "step": 6025 }, { "epoch": 0.6, "learning_rate": 7.1658367002541e-06, "loss": 2.412, "step": 6026 }, { "epoch": 0.6, "learning_rate": 7.1627247972414985e-06, "loss": 2.3177, "step": 6027 }, { "epoch": 0.6, "learning_rate": 7.1596131930152524e-06, "loss": 2.3718, "step": 6028 }, { "epoch": 0.6, "learning_rate": 7.15650188790304e-06, "loss": 2.352, "step": 6029 }, { "epoch": 0.6, "learning_rate": 7.1533908822325035e-06, "loss": 2.2848, "step": 6030 }, { "epoch": 0.6, "learning_rate": 7.150280176331254e-06, "loss": 2.3127, "step": 6031 }, { "epoch": 0.6, "learning_rate": 7.147169770526876e-06, "loss": 2.2236, "step": 6032 }, { "epoch": 0.6, "learning_rate": 7.144059665146917e-06, "loss": 2.2834, "step": 6033 }, { "epoch": 0.6, "learning_rate": 7.140949860518893e-06, "loss": 2.3172, "step": 6034 }, { "epoch": 0.6, "learning_rate": 7.137840356970291e-06, "loss": 2.278, "step": 6035 }, { "epoch": 0.6, "learning_rate": 7.134731154828565e-06, "loss": 2.33, "step": 6036 }, { "epoch": 0.6, "learning_rate": 7.1316222544211356e-06, "loss": 2.2177, "step": 6037 }, { "epoch": 0.6, "learning_rate": 7.128513656075395e-06, "loss": 2.4288, "step": 6038 }, { "epoch": 0.61, "learning_rate": 7.125405360118703e-06, "loss": 2.3138, "step": 6039 }, { "epoch": 0.61, "learning_rate": 7.122297366878379e-06, "loss": 2.3603, "step": 6040 }, { "epoch": 0.61, "learning_rate": 7.11918967668173e-06, "loss": 2.406, "step": 6041 }, { "epoch": 0.61, "learning_rate": 7.116082289856013e-06, "loss": 2.4458, "step": 6042 }, { "epoch": 0.61, "learning_rate": 7.112975206728459e-06, "loss": 2.2864, "step": 6043 }, { "epoch": 0.61, "learning_rate": 7.109868427626268e-06, "loss": 2.423, "step": 6044 }, { "epoch": 0.61, "learning_rate": 7.106761952876604e-06, "loss": 2.3531, "step": 6045 }, { "epoch": 0.61, "learning_rate": 7.103655782806607e-06, "loss": 2.341, "step": 6046 }, { "epoch": 0.61, "learning_rate": 7.100549917743375e-06, "loss": 2.4693, "step": 6047 }, { "epoch": 0.61, "learning_rate": 7.097444358013985e-06, "loss": 2.277, "step": 6048 }, { "epoch": 0.61, "learning_rate": 7.094339103945467e-06, "loss": 2.3592, "step": 6049 }, { "epoch": 0.61, "learning_rate": 7.091234155864835e-06, "loss": 2.3301, "step": 6050 }, { "epoch": 0.61, "learning_rate": 7.088129514099062e-06, "loss": 2.2654, "step": 6051 }, { "epoch": 0.61, "learning_rate": 7.085025178975091e-06, "loss": 2.3294, "step": 6052 }, { "epoch": 0.61, "learning_rate": 7.08192115081983e-06, "loss": 2.2319, "step": 6053 }, { "epoch": 0.61, "learning_rate": 7.078817429960156e-06, "loss": 2.3746, "step": 6054 }, { "epoch": 0.61, "learning_rate": 7.0757140167229146e-06, "loss": 2.4385, "step": 6055 }, { "epoch": 0.61, "learning_rate": 7.072610911434916e-06, "loss": 2.3753, "step": 6056 }, { "epoch": 0.61, "learning_rate": 7.069508114422945e-06, "loss": 2.3898, "step": 6057 }, { "epoch": 0.61, "learning_rate": 7.066405626013743e-06, "loss": 2.3217, "step": 6058 }, { "epoch": 0.61, "learning_rate": 7.063303446534032e-06, "loss": 2.288, "step": 6059 }, { "epoch": 0.61, "learning_rate": 7.060201576310494e-06, "loss": 2.3748, "step": 6060 }, { "epoch": 0.61, "learning_rate": 7.057100015669776e-06, "loss": 2.3288, "step": 6061 }, { "epoch": 0.61, "learning_rate": 7.053998764938499e-06, "loss": 2.3844, "step": 6062 }, { "epoch": 0.61, "learning_rate": 7.050897824443245e-06, "loss": 2.275, "step": 6063 }, { "epoch": 0.61, "learning_rate": 7.047797194510567e-06, "loss": 2.3708, "step": 6064 }, { "epoch": 0.61, "learning_rate": 7.044696875466987e-06, "loss": 2.2677, "step": 6065 }, { "epoch": 0.61, "learning_rate": 7.041596867638989e-06, "loss": 2.1782, "step": 6066 }, { "epoch": 0.61, "learning_rate": 7.038497171353023e-06, "loss": 2.3208, "step": 6067 }, { "epoch": 0.61, "learning_rate": 7.035397786935518e-06, "loss": 2.2396, "step": 6068 }, { "epoch": 0.61, "learning_rate": 7.032298714712861e-06, "loss": 2.3161, "step": 6069 }, { "epoch": 0.61, "learning_rate": 7.029199955011406e-06, "loss": 2.243, "step": 6070 }, { "epoch": 0.61, "learning_rate": 7.026101508157475e-06, "loss": 2.3649, "step": 6071 }, { "epoch": 0.61, "learning_rate": 7.02300337447736e-06, "loss": 2.3967, "step": 6072 }, { "epoch": 0.61, "learning_rate": 7.019905554297314e-06, "loss": 2.2478, "step": 6073 }, { "epoch": 0.61, "learning_rate": 7.016808047943564e-06, "loss": 2.2709, "step": 6074 }, { "epoch": 0.61, "learning_rate": 7.013710855742299e-06, "loss": 2.3475, "step": 6075 }, { "epoch": 0.61, "learning_rate": 7.010613978019676e-06, "loss": 2.2358, "step": 6076 }, { "epoch": 0.61, "learning_rate": 7.007517415101821e-06, "loss": 2.3477, "step": 6077 }, { "epoch": 0.61, "learning_rate": 7.004421167314826e-06, "loss": 2.3673, "step": 6078 }, { "epoch": 0.61, "learning_rate": 7.001325234984746e-06, "loss": 2.347, "step": 6079 }, { "epoch": 0.61, "learning_rate": 6.99822961843761e-06, "loss": 2.3436, "step": 6080 }, { "epoch": 0.61, "learning_rate": 6.995134317999407e-06, "loss": 2.3878, "step": 6081 }, { "epoch": 0.61, "learning_rate": 6.992039333996094e-06, "loss": 2.2871, "step": 6082 }, { "epoch": 0.61, "learning_rate": 6.988944666753601e-06, "loss": 2.2584, "step": 6083 }, { "epoch": 0.61, "learning_rate": 6.985850316597814e-06, "loss": 2.2959, "step": 6084 }, { "epoch": 0.61, "learning_rate": 6.982756283854593e-06, "loss": 2.3774, "step": 6085 }, { "epoch": 0.61, "learning_rate": 6.979662568849765e-06, "loss": 2.2791, "step": 6086 }, { "epoch": 0.61, "learning_rate": 6.97656917190912e-06, "loss": 2.2411, "step": 6087 }, { "epoch": 0.61, "learning_rate": 6.973476093358416e-06, "loss": 2.2946, "step": 6088 }, { "epoch": 0.61, "learning_rate": 6.970383333523376e-06, "loss": 2.2699, "step": 6089 }, { "epoch": 0.61, "learning_rate": 6.967290892729694e-06, "loss": 2.351, "step": 6090 }, { "epoch": 0.61, "learning_rate": 6.964198771303024e-06, "loss": 2.3013, "step": 6091 }, { "epoch": 0.61, "learning_rate": 6.961106969568992e-06, "loss": 2.2489, "step": 6092 }, { "epoch": 0.61, "learning_rate": 6.958015487853187e-06, "loss": 2.151, "step": 6093 }, { "epoch": 0.61, "learning_rate": 6.954924326481162e-06, "loss": 2.2559, "step": 6094 }, { "epoch": 0.61, "learning_rate": 6.951833485778444e-06, "loss": 2.4043, "step": 6095 }, { "epoch": 0.61, "learning_rate": 6.948742966070521e-06, "loss": 2.3573, "step": 6096 }, { "epoch": 0.61, "learning_rate": 6.945652767682846e-06, "loss": 2.4227, "step": 6097 }, { "epoch": 0.61, "learning_rate": 6.942562890940843e-06, "loss": 2.3542, "step": 6098 }, { "epoch": 0.61, "learning_rate": 6.939473336169896e-06, "loss": 2.375, "step": 6099 }, { "epoch": 0.61, "learning_rate": 6.93638410369536e-06, "loss": 2.3333, "step": 6100 }, { "epoch": 0.61, "learning_rate": 6.933295193842554e-06, "loss": 2.3933, "step": 6101 }, { "epoch": 0.61, "learning_rate": 6.930206606936762e-06, "loss": 2.2942, "step": 6102 }, { "epoch": 0.61, "learning_rate": 6.927118343303234e-06, "loss": 2.3339, "step": 6103 }, { "epoch": 0.61, "learning_rate": 6.924030403267194e-06, "loss": 2.325, "step": 6104 }, { "epoch": 0.61, "learning_rate": 6.920942787153824e-06, "loss": 2.3788, "step": 6105 }, { "epoch": 0.61, "learning_rate": 6.9178554952882685e-06, "loss": 2.2689, "step": 6106 }, { "epoch": 0.61, "learning_rate": 6.9147685279956425e-06, "loss": 2.3572, "step": 6107 }, { "epoch": 0.61, "learning_rate": 6.91168188560103e-06, "loss": 2.3745, "step": 6108 }, { "epoch": 0.61, "learning_rate": 6.908595568429475e-06, "loss": 2.2403, "step": 6109 }, { "epoch": 0.61, "learning_rate": 6.905509576805992e-06, "loss": 2.3152, "step": 6110 }, { "epoch": 0.61, "learning_rate": 6.902423911055558e-06, "loss": 2.4502, "step": 6111 }, { "epoch": 0.61, "learning_rate": 6.8993385715031134e-06, "loss": 2.274, "step": 6112 }, { "epoch": 0.61, "learning_rate": 6.896253558473574e-06, "loss": 2.3305, "step": 6113 }, { "epoch": 0.61, "learning_rate": 6.893168872291813e-06, "loss": 2.2065, "step": 6114 }, { "epoch": 0.61, "learning_rate": 6.89008451328267e-06, "loss": 2.3351, "step": 6115 }, { "epoch": 0.61, "learning_rate": 6.887000481770951e-06, "loss": 2.2447, "step": 6116 }, { "epoch": 0.61, "learning_rate": 6.8839167780814295e-06, "loss": 2.3581, "step": 6117 }, { "epoch": 0.61, "learning_rate": 6.8808334025388376e-06, "loss": 2.2769, "step": 6118 }, { "epoch": 0.61, "learning_rate": 6.877750355467882e-06, "loss": 2.3154, "step": 6119 }, { "epoch": 0.61, "learning_rate": 6.874667637193231e-06, "loss": 2.2322, "step": 6120 }, { "epoch": 0.61, "learning_rate": 6.871585248039512e-06, "loss": 2.3512, "step": 6121 }, { "epoch": 0.61, "learning_rate": 6.868503188331333e-06, "loss": 2.2961, "step": 6122 }, { "epoch": 0.61, "learning_rate": 6.865421458393251e-06, "loss": 2.3409, "step": 6123 }, { "epoch": 0.61, "learning_rate": 6.8623400585498e-06, "loss": 2.3632, "step": 6124 }, { "epoch": 0.61, "learning_rate": 6.859258989125471e-06, "loss": 2.3447, "step": 6125 }, { "epoch": 0.61, "learning_rate": 6.856178250444726e-06, "loss": 2.2921, "step": 6126 }, { "epoch": 0.61, "learning_rate": 6.853097842831988e-06, "loss": 2.304, "step": 6127 }, { "epoch": 0.61, "learning_rate": 6.8500177666116475e-06, "loss": 2.271, "step": 6128 }, { "epoch": 0.61, "learning_rate": 6.8469380221080625e-06, "loss": 2.2998, "step": 6129 }, { "epoch": 0.61, "learning_rate": 6.843858609645546e-06, "loss": 2.4175, "step": 6130 }, { "epoch": 0.61, "learning_rate": 6.840779529548389e-06, "loss": 2.3688, "step": 6131 }, { "epoch": 0.61, "learning_rate": 6.837700782140844e-06, "loss": 2.3164, "step": 6132 }, { "epoch": 0.61, "learning_rate": 6.8346223677471204e-06, "loss": 2.3383, "step": 6133 }, { "epoch": 0.61, "learning_rate": 6.8315442866914005e-06, "loss": 2.3038, "step": 6134 }, { "epoch": 0.61, "learning_rate": 6.828466539297831e-06, "loss": 2.3986, "step": 6135 }, { "epoch": 0.61, "learning_rate": 6.825389125890521e-06, "loss": 2.1934, "step": 6136 }, { "epoch": 0.61, "learning_rate": 6.8223120467935426e-06, "loss": 2.3981, "step": 6137 }, { "epoch": 0.61, "learning_rate": 6.819235302330938e-06, "loss": 2.2802, "step": 6138 }, { "epoch": 0.62, "learning_rate": 6.816158892826707e-06, "loss": 2.3386, "step": 6139 }, { "epoch": 0.62, "learning_rate": 6.813082818604827e-06, "loss": 2.3007, "step": 6140 }, { "epoch": 0.62, "learning_rate": 6.810007079989226e-06, "loss": 2.3508, "step": 6141 }, { "epoch": 0.62, "learning_rate": 6.806931677303803e-06, "loss": 2.3419, "step": 6142 }, { "epoch": 0.62, "learning_rate": 6.803856610872421e-06, "loss": 2.3247, "step": 6143 }, { "epoch": 0.62, "learning_rate": 6.80078188101891e-06, "loss": 2.3516, "step": 6144 }, { "epoch": 0.62, "learning_rate": 6.797707488067058e-06, "loss": 2.2367, "step": 6145 }, { "epoch": 0.62, "learning_rate": 6.794633432340623e-06, "loss": 2.3419, "step": 6146 }, { "epoch": 0.62, "learning_rate": 6.791559714163328e-06, "loss": 2.3065, "step": 6147 }, { "epoch": 0.62, "learning_rate": 6.788486333858855e-06, "loss": 2.3821, "step": 6148 }, { "epoch": 0.62, "learning_rate": 6.785413291750858e-06, "loss": 2.3227, "step": 6149 }, { "epoch": 0.62, "learning_rate": 6.78234058816295e-06, "loss": 2.3333, "step": 6150 }, { "epoch": 0.62, "learning_rate": 6.779268223418709e-06, "loss": 2.3745, "step": 6151 }, { "epoch": 0.62, "learning_rate": 6.77619619784168e-06, "loss": 2.3315, "step": 6152 }, { "epoch": 0.62, "learning_rate": 6.773124511755367e-06, "loss": 2.3296, "step": 6153 }, { "epoch": 0.62, "learning_rate": 6.770053165483243e-06, "loss": 2.3501, "step": 6154 }, { "epoch": 0.62, "learning_rate": 6.766982159348747e-06, "loss": 2.3155, "step": 6155 }, { "epoch": 0.62, "learning_rate": 6.763911493675274e-06, "loss": 2.3582, "step": 6156 }, { "epoch": 0.62, "learning_rate": 6.760841168786189e-06, "loss": 2.3156, "step": 6157 }, { "epoch": 0.62, "learning_rate": 6.757771185004822e-06, "loss": 2.3952, "step": 6158 }, { "epoch": 0.62, "learning_rate": 6.754701542654467e-06, "loss": 2.3013, "step": 6159 }, { "epoch": 0.62, "learning_rate": 6.751632242058377e-06, "loss": 2.376, "step": 6160 }, { "epoch": 0.62, "learning_rate": 6.7485632835397726e-06, "loss": 2.3578, "step": 6161 }, { "epoch": 0.62, "learning_rate": 6.745494667421841e-06, "loss": 2.366, "step": 6162 }, { "epoch": 0.62, "learning_rate": 6.742426394027728e-06, "loss": 2.3442, "step": 6163 }, { "epoch": 0.62, "learning_rate": 6.739358463680545e-06, "loss": 2.3301, "step": 6164 }, { "epoch": 0.62, "learning_rate": 6.736290876703367e-06, "loss": 2.2944, "step": 6165 }, { "epoch": 0.62, "learning_rate": 6.733223633419241e-06, "loss": 2.2789, "step": 6166 }, { "epoch": 0.62, "learning_rate": 6.730156734151165e-06, "loss": 2.3527, "step": 6167 }, { "epoch": 0.62, "learning_rate": 6.72709017922211e-06, "loss": 2.3791, "step": 6168 }, { "epoch": 0.62, "learning_rate": 6.724023968955003e-06, "loss": 2.4227, "step": 6169 }, { "epoch": 0.62, "learning_rate": 6.72095810367274e-06, "loss": 2.3586, "step": 6170 }, { "epoch": 0.62, "learning_rate": 6.71789258369818e-06, "loss": 2.2907, "step": 6171 }, { "epoch": 0.62, "learning_rate": 6.714827409354147e-06, "loss": 2.3585, "step": 6172 }, { "epoch": 0.62, "learning_rate": 6.7117625809634255e-06, "loss": 2.2563, "step": 6173 }, { "epoch": 0.62, "learning_rate": 6.7086980988487595e-06, "loss": 2.37, "step": 6174 }, { "epoch": 0.62, "learning_rate": 6.7056339633328715e-06, "loss": 2.2977, "step": 6175 }, { "epoch": 0.62, "learning_rate": 6.7025701747384344e-06, "loss": 2.3751, "step": 6176 }, { "epoch": 0.62, "learning_rate": 6.699506733388088e-06, "loss": 2.2749, "step": 6177 }, { "epoch": 0.62, "learning_rate": 6.6964436396044355e-06, "loss": 2.3414, "step": 6178 }, { "epoch": 0.62, "learning_rate": 6.693380893710042e-06, "loss": 2.3586, "step": 6179 }, { "epoch": 0.62, "learning_rate": 6.690318496027439e-06, "loss": 2.2522, "step": 6180 }, { "epoch": 0.62, "learning_rate": 6.687256446879122e-06, "loss": 2.3744, "step": 6181 }, { "epoch": 0.62, "learning_rate": 6.684194746587545e-06, "loss": 2.307, "step": 6182 }, { "epoch": 0.62, "learning_rate": 6.6811333954751215e-06, "loss": 2.312, "step": 6183 }, { "epoch": 0.62, "learning_rate": 6.678072393864248e-06, "loss": 2.1801, "step": 6184 }, { "epoch": 0.62, "learning_rate": 6.675011742077264e-06, "loss": 2.2955, "step": 6185 }, { "epoch": 0.62, "learning_rate": 6.67195144043648e-06, "loss": 2.3487, "step": 6186 }, { "epoch": 0.62, "learning_rate": 6.668891489264169e-06, "loss": 2.415, "step": 6187 }, { "epoch": 0.62, "learning_rate": 6.665831888882565e-06, "loss": 2.3763, "step": 6188 }, { "epoch": 0.62, "learning_rate": 6.6627726396138705e-06, "loss": 2.4312, "step": 6189 }, { "epoch": 0.62, "learning_rate": 6.659713741780245e-06, "loss": 2.3907, "step": 6190 }, { "epoch": 0.62, "learning_rate": 6.656655195703812e-06, "loss": 2.3286, "step": 6191 }, { "epoch": 0.62, "learning_rate": 6.65359700170666e-06, "loss": 2.355, "step": 6192 }, { "epoch": 0.62, "learning_rate": 6.65053916011084e-06, "loss": 2.3449, "step": 6193 }, { "epoch": 0.62, "learning_rate": 6.647481671238369e-06, "loss": 2.3309, "step": 6194 }, { "epoch": 0.62, "learning_rate": 6.64442453541122e-06, "loss": 2.3099, "step": 6195 }, { "epoch": 0.62, "learning_rate": 6.641367752951334e-06, "loss": 2.2828, "step": 6196 }, { "epoch": 0.62, "learning_rate": 6.638311324180611e-06, "loss": 2.3411, "step": 6197 }, { "epoch": 0.62, "learning_rate": 6.6352552494209165e-06, "loss": 2.2981, "step": 6198 }, { "epoch": 0.62, "learning_rate": 6.6321995289940785e-06, "loss": 2.3534, "step": 6199 }, { "epoch": 0.62, "learning_rate": 6.6291441632218904e-06, "loss": 2.3003, "step": 6200 }, { "epoch": 0.62, "learning_rate": 6.626089152426097e-06, "loss": 2.3525, "step": 6201 }, { "epoch": 0.62, "learning_rate": 6.623034496928422e-06, "loss": 2.2114, "step": 6202 }, { "epoch": 0.62, "learning_rate": 6.619980197050542e-06, "loss": 2.3427, "step": 6203 }, { "epoch": 0.62, "learning_rate": 6.616926253114094e-06, "loss": 2.2873, "step": 6204 }, { "epoch": 0.62, "learning_rate": 6.613872665440684e-06, "loss": 2.3291, "step": 6205 }, { "epoch": 0.62, "learning_rate": 6.610819434351878e-06, "loss": 2.3259, "step": 6206 }, { "epoch": 0.62, "learning_rate": 6.607766560169203e-06, "loss": 2.3416, "step": 6207 }, { "epoch": 0.62, "learning_rate": 6.60471404321415e-06, "loss": 2.3, "step": 6208 }, { "epoch": 0.62, "learning_rate": 6.60166188380817e-06, "loss": 2.2741, "step": 6209 }, { "epoch": 0.62, "learning_rate": 6.598610082272681e-06, "loss": 2.3119, "step": 6210 }, { "epoch": 0.62, "learning_rate": 6.59555863892906e-06, "loss": 2.2951, "step": 6211 }, { "epoch": 0.62, "learning_rate": 6.592507554098646e-06, "loss": 2.2505, "step": 6212 }, { "epoch": 0.62, "learning_rate": 6.589456828102742e-06, "loss": 2.3179, "step": 6213 }, { "epoch": 0.62, "learning_rate": 6.586406461262611e-06, "loss": 2.3689, "step": 6214 }, { "epoch": 0.62, "learning_rate": 6.583356453899482e-06, "loss": 2.239, "step": 6215 }, { "epoch": 0.62, "learning_rate": 6.580306806334542e-06, "loss": 2.3275, "step": 6216 }, { "epoch": 0.62, "learning_rate": 6.577257518888941e-06, "loss": 2.229, "step": 6217 }, { "epoch": 0.62, "learning_rate": 6.5742085918837925e-06, "loss": 2.3167, "step": 6218 }, { "epoch": 0.62, "learning_rate": 6.571160025640169e-06, "loss": 2.3752, "step": 6219 }, { "epoch": 0.62, "learning_rate": 6.568111820479114e-06, "loss": 2.2665, "step": 6220 }, { "epoch": 0.62, "learning_rate": 6.565063976721622e-06, "loss": 2.3758, "step": 6221 }, { "epoch": 0.62, "learning_rate": 6.562016494688652e-06, "loss": 2.3435, "step": 6222 }, { "epoch": 0.62, "learning_rate": 6.558969374701131e-06, "loss": 2.3261, "step": 6223 }, { "epoch": 0.62, "learning_rate": 6.555922617079939e-06, "loss": 2.3066, "step": 6224 }, { "epoch": 0.62, "learning_rate": 6.552876222145928e-06, "loss": 2.4051, "step": 6225 }, { "epoch": 0.62, "learning_rate": 6.549830190219902e-06, "loss": 2.2506, "step": 6226 }, { "epoch": 0.62, "learning_rate": 6.54678452162263e-06, "loss": 2.1395, "step": 6227 }, { "epoch": 0.62, "learning_rate": 6.543739216674843e-06, "loss": 2.372, "step": 6228 }, { "epoch": 0.62, "learning_rate": 6.5406942756972415e-06, "loss": 2.3083, "step": 6229 }, { "epoch": 0.62, "learning_rate": 6.537649699010477e-06, "loss": 2.3917, "step": 6230 }, { "epoch": 0.62, "learning_rate": 6.534605486935164e-06, "loss": 2.3464, "step": 6231 }, { "epoch": 0.62, "learning_rate": 6.531561639791886e-06, "loss": 2.4736, "step": 6232 }, { "epoch": 0.62, "learning_rate": 6.528518157901177e-06, "loss": 2.1774, "step": 6233 }, { "epoch": 0.62, "learning_rate": 6.525475041583541e-06, "loss": 2.2628, "step": 6234 }, { "epoch": 0.62, "learning_rate": 6.52243229115944e-06, "loss": 2.2403, "step": 6235 }, { "epoch": 0.62, "learning_rate": 6.5193899069493005e-06, "loss": 2.371, "step": 6236 }, { "epoch": 0.62, "learning_rate": 6.516347889273502e-06, "loss": 2.305, "step": 6237 }, { "epoch": 0.62, "learning_rate": 6.513306238452403e-06, "loss": 2.3668, "step": 6238 }, { "epoch": 0.63, "learning_rate": 6.510264954806305e-06, "loss": 2.3637, "step": 6239 }, { "epoch": 0.63, "learning_rate": 6.507224038655478e-06, "loss": 2.2033, "step": 6240 }, { "epoch": 0.63, "learning_rate": 6.504183490320155e-06, "loss": 2.3508, "step": 6241 }, { "epoch": 0.63, "learning_rate": 6.501143310120528e-06, "loss": 2.3354, "step": 6242 }, { "epoch": 0.63, "learning_rate": 6.498103498376751e-06, "loss": 2.3433, "step": 6243 }, { "epoch": 0.63, "learning_rate": 6.4950640554089395e-06, "loss": 2.4154, "step": 6244 }, { "epoch": 0.63, "learning_rate": 6.4920249815371685e-06, "loss": 2.3679, "step": 6245 }, { "epoch": 0.63, "learning_rate": 6.48898627708147e-06, "loss": 2.2832, "step": 6246 }, { "epoch": 0.63, "learning_rate": 6.485947942361855e-06, "loss": 2.1825, "step": 6247 }, { "epoch": 0.63, "learning_rate": 6.482909977698273e-06, "loss": 2.3021, "step": 6248 }, { "epoch": 0.63, "learning_rate": 6.479872383410648e-06, "loss": 2.2507, "step": 6249 }, { "epoch": 0.63, "learning_rate": 6.4768351598188595e-06, "loss": 2.3101, "step": 6250 }, { "epoch": 0.63, "learning_rate": 6.473798307242753e-06, "loss": 2.329, "step": 6251 }, { "epoch": 0.63, "learning_rate": 6.47076182600213e-06, "loss": 2.3615, "step": 6252 }, { "epoch": 0.63, "learning_rate": 6.4677257164167525e-06, "loss": 2.261, "step": 6253 }, { "epoch": 0.63, "learning_rate": 6.464689978806351e-06, "loss": 2.3603, "step": 6254 }, { "epoch": 0.63, "learning_rate": 6.461654613490605e-06, "loss": 2.3982, "step": 6255 }, { "epoch": 0.63, "learning_rate": 6.458619620789166e-06, "loss": 2.3056, "step": 6256 }, { "epoch": 0.63, "learning_rate": 6.455585001021641e-06, "loss": 2.3573, "step": 6257 }, { "epoch": 0.63, "learning_rate": 6.452550754507596e-06, "loss": 2.2757, "step": 6258 }, { "epoch": 0.63, "learning_rate": 6.449516881566562e-06, "loss": 2.2841, "step": 6259 }, { "epoch": 0.63, "learning_rate": 6.4464833825180285e-06, "loss": 2.2809, "step": 6260 }, { "epoch": 0.63, "learning_rate": 6.443450257681445e-06, "loss": 2.2702, "step": 6261 }, { "epoch": 0.63, "learning_rate": 6.440417507376221e-06, "loss": 2.2804, "step": 6262 }, { "epoch": 0.63, "learning_rate": 6.437385131921729e-06, "loss": 2.2312, "step": 6263 }, { "epoch": 0.63, "learning_rate": 6.434353131637301e-06, "loss": 2.3551, "step": 6264 }, { "epoch": 0.63, "learning_rate": 6.43132150684223e-06, "loss": 2.3303, "step": 6265 }, { "epoch": 0.63, "learning_rate": 6.428290257855768e-06, "loss": 2.3719, "step": 6266 }, { "epoch": 0.63, "learning_rate": 6.425259384997129e-06, "loss": 2.3138, "step": 6267 }, { "epoch": 0.63, "learning_rate": 6.422228888585487e-06, "loss": 2.3508, "step": 6268 }, { "epoch": 0.63, "learning_rate": 6.419198768939974e-06, "loss": 2.3524, "step": 6269 }, { "epoch": 0.63, "learning_rate": 6.416169026379684e-06, "loss": 2.3953, "step": 6270 }, { "epoch": 0.63, "learning_rate": 6.413139661223675e-06, "loss": 2.3343, "step": 6271 }, { "epoch": 0.63, "learning_rate": 6.410110673790959e-06, "loss": 2.3864, "step": 6272 }, { "epoch": 0.63, "learning_rate": 6.40708206440051e-06, "loss": 2.2003, "step": 6273 }, { "epoch": 0.63, "learning_rate": 6.404053833371269e-06, "loss": 2.318, "step": 6274 }, { "epoch": 0.63, "learning_rate": 6.401025981022126e-06, "loss": 2.2377, "step": 6275 }, { "epoch": 0.63, "learning_rate": 6.397998507671939e-06, "loss": 2.3004, "step": 6276 }, { "epoch": 0.63, "learning_rate": 6.394971413639521e-06, "loss": 2.2958, "step": 6277 }, { "epoch": 0.63, "learning_rate": 6.391944699243652e-06, "loss": 2.3018, "step": 6278 }, { "epoch": 0.63, "learning_rate": 6.388918364803065e-06, "loss": 2.238, "step": 6279 }, { "epoch": 0.63, "learning_rate": 6.385892410636455e-06, "loss": 2.2103, "step": 6280 }, { "epoch": 0.63, "learning_rate": 6.382866837062479e-06, "loss": 2.352, "step": 6281 }, { "epoch": 0.63, "learning_rate": 6.379841644399749e-06, "loss": 2.3241, "step": 6282 }, { "epoch": 0.63, "learning_rate": 6.376816832966848e-06, "loss": 2.3815, "step": 6283 }, { "epoch": 0.63, "learning_rate": 6.373792403082308e-06, "loss": 2.3271, "step": 6284 }, { "epoch": 0.63, "learning_rate": 6.3707683550646216e-06, "loss": 2.2852, "step": 6285 }, { "epoch": 0.63, "learning_rate": 6.367744689232244e-06, "loss": 2.3728, "step": 6286 }, { "epoch": 0.63, "learning_rate": 6.364721405903594e-06, "loss": 2.3483, "step": 6287 }, { "epoch": 0.63, "learning_rate": 6.361698505397043e-06, "loss": 2.3822, "step": 6288 }, { "epoch": 0.63, "learning_rate": 6.358675988030925e-06, "loss": 2.4218, "step": 6289 }, { "epoch": 0.63, "learning_rate": 6.3556538541235335e-06, "loss": 2.3254, "step": 6290 }, { "epoch": 0.63, "learning_rate": 6.352632103993118e-06, "loss": 2.2971, "step": 6291 }, { "epoch": 0.63, "learning_rate": 6.349610737957901e-06, "loss": 2.2723, "step": 6292 }, { "epoch": 0.63, "learning_rate": 6.34658975633605e-06, "loss": 2.3318, "step": 6293 }, { "epoch": 0.63, "learning_rate": 6.343569159445697e-06, "loss": 2.3439, "step": 6294 }, { "epoch": 0.63, "learning_rate": 6.340548947604932e-06, "loss": 2.2903, "step": 6295 }, { "epoch": 0.63, "learning_rate": 6.337529121131811e-06, "loss": 2.2982, "step": 6296 }, { "epoch": 0.63, "learning_rate": 6.334509680344339e-06, "loss": 2.3112, "step": 6297 }, { "epoch": 0.63, "learning_rate": 6.331490625560487e-06, "loss": 2.3717, "step": 6298 }, { "epoch": 0.63, "learning_rate": 6.328471957098184e-06, "loss": 2.3561, "step": 6299 }, { "epoch": 0.63, "learning_rate": 6.325453675275317e-06, "loss": 2.3614, "step": 6300 }, { "epoch": 0.63, "learning_rate": 6.322435780409738e-06, "loss": 2.2556, "step": 6301 }, { "epoch": 0.63, "learning_rate": 6.319418272819253e-06, "loss": 2.2901, "step": 6302 }, { "epoch": 0.63, "learning_rate": 6.3164011528216255e-06, "loss": 2.2883, "step": 6303 }, { "epoch": 0.63, "learning_rate": 6.313384420734584e-06, "loss": 2.3301, "step": 6304 }, { "epoch": 0.63, "learning_rate": 6.3103680768758105e-06, "loss": 2.3558, "step": 6305 }, { "epoch": 0.63, "learning_rate": 6.307352121562949e-06, "loss": 2.3129, "step": 6306 }, { "epoch": 0.63, "learning_rate": 6.304336555113604e-06, "loss": 2.3838, "step": 6307 }, { "epoch": 0.63, "learning_rate": 6.3013213778453356e-06, "loss": 2.3316, "step": 6308 }, { "epoch": 0.63, "learning_rate": 6.298306590075662e-06, "loss": 2.4354, "step": 6309 }, { "epoch": 0.63, "learning_rate": 6.295292192122069e-06, "loss": 2.3334, "step": 6310 }, { "epoch": 0.63, "learning_rate": 6.292278184301992e-06, "loss": 2.3046, "step": 6311 }, { "epoch": 0.63, "learning_rate": 6.2892645669328286e-06, "loss": 2.3409, "step": 6312 }, { "epoch": 0.63, "learning_rate": 6.286251340331935e-06, "loss": 2.3808, "step": 6313 }, { "epoch": 0.63, "learning_rate": 6.283238504816628e-06, "loss": 2.4142, "step": 6314 }, { "epoch": 0.63, "learning_rate": 6.28022606070418e-06, "loss": 2.3839, "step": 6315 }, { "epoch": 0.63, "learning_rate": 6.277214008311825e-06, "loss": 2.2709, "step": 6316 }, { "epoch": 0.63, "learning_rate": 6.274202347956755e-06, "loss": 2.3753, "step": 6317 }, { "epoch": 0.63, "learning_rate": 6.271191079956118e-06, "loss": 2.3257, "step": 6318 }, { "epoch": 0.63, "learning_rate": 6.268180204627028e-06, "loss": 2.3257, "step": 6319 }, { "epoch": 0.63, "learning_rate": 6.2651697222865485e-06, "loss": 2.2843, "step": 6320 }, { "epoch": 0.63, "learning_rate": 6.262159633251707e-06, "loss": 2.3312, "step": 6321 }, { "epoch": 0.63, "learning_rate": 6.259149937839489e-06, "loss": 2.2893, "step": 6322 }, { "epoch": 0.63, "learning_rate": 6.256140636366839e-06, "loss": 2.3344, "step": 6323 }, { "epoch": 0.63, "learning_rate": 6.2531317291506555e-06, "loss": 2.3123, "step": 6324 }, { "epoch": 0.63, "learning_rate": 6.250123216507802e-06, "loss": 2.321, "step": 6325 }, { "epoch": 0.63, "learning_rate": 6.247115098755096e-06, "loss": 2.3195, "step": 6326 }, { "epoch": 0.63, "learning_rate": 6.244107376209315e-06, "loss": 2.2757, "step": 6327 }, { "epoch": 0.63, "learning_rate": 6.241100049187197e-06, "loss": 2.3371, "step": 6328 }, { "epoch": 0.63, "learning_rate": 6.238093118005432e-06, "loss": 2.3104, "step": 6329 }, { "epoch": 0.63, "learning_rate": 6.2350865829806774e-06, "loss": 2.3109, "step": 6330 }, { "epoch": 0.63, "learning_rate": 6.23208044442954e-06, "loss": 2.3729, "step": 6331 }, { "epoch": 0.63, "learning_rate": 6.2290747026685895e-06, "loss": 2.3589, "step": 6332 }, { "epoch": 0.63, "learning_rate": 6.226069358014355e-06, "loss": 2.3121, "step": 6333 }, { "epoch": 0.63, "learning_rate": 6.223064410783319e-06, "loss": 2.4, "step": 6334 }, { "epoch": 0.63, "learning_rate": 6.220059861291923e-06, "loss": 2.2731, "step": 6335 }, { "epoch": 0.63, "learning_rate": 6.217055709856577e-06, "loss": 2.2954, "step": 6336 }, { "epoch": 0.63, "learning_rate": 6.214051956793633e-06, "loss": 2.3623, "step": 6337 }, { "epoch": 0.64, "learning_rate": 6.211048602419413e-06, "loss": 2.3359, "step": 6338 }, { "epoch": 0.64, "learning_rate": 6.208045647050189e-06, "loss": 2.3589, "step": 6339 }, { "epoch": 0.64, "learning_rate": 6.2050430910021985e-06, "loss": 2.4049, "step": 6340 }, { "epoch": 0.64, "learning_rate": 6.202040934591631e-06, "loss": 2.2974, "step": 6341 }, { "epoch": 0.64, "learning_rate": 6.199039178134636e-06, "loss": 2.3786, "step": 6342 }, { "epoch": 0.64, "learning_rate": 6.196037821947323e-06, "loss": 2.3276, "step": 6343 }, { "epoch": 0.64, "learning_rate": 6.19303686634575e-06, "loss": 2.3588, "step": 6344 }, { "epoch": 0.64, "learning_rate": 6.190036311645951e-06, "loss": 2.3217, "step": 6345 }, { "epoch": 0.64, "learning_rate": 6.1870361581638995e-06, "loss": 2.2587, "step": 6346 }, { "epoch": 0.64, "learning_rate": 6.184036406215539e-06, "loss": 2.1924, "step": 6347 }, { "epoch": 0.64, "learning_rate": 6.181037056116765e-06, "loss": 2.3962, "step": 6348 }, { "epoch": 0.64, "learning_rate": 6.178038108183426e-06, "loss": 2.4096, "step": 6349 }, { "epoch": 0.64, "learning_rate": 6.17503956273134e-06, "loss": 2.2005, "step": 6350 }, { "epoch": 0.64, "learning_rate": 6.172041420076274e-06, "loss": 2.2403, "step": 6351 }, { "epoch": 0.64, "learning_rate": 6.169043680533952e-06, "loss": 2.2983, "step": 6352 }, { "epoch": 0.64, "learning_rate": 6.16604634442006e-06, "loss": 2.3535, "step": 6353 }, { "epoch": 0.64, "learning_rate": 6.163049412050244e-06, "loss": 2.2833, "step": 6354 }, { "epoch": 0.64, "learning_rate": 6.160052883740102e-06, "loss": 2.3629, "step": 6355 }, { "epoch": 0.64, "learning_rate": 6.157056759805189e-06, "loss": 2.3346, "step": 6356 }, { "epoch": 0.64, "learning_rate": 6.154061040561019e-06, "loss": 2.3944, "step": 6357 }, { "epoch": 0.64, "learning_rate": 6.151065726323066e-06, "loss": 2.3702, "step": 6358 }, { "epoch": 0.64, "learning_rate": 6.148070817406757e-06, "loss": 2.3214, "step": 6359 }, { "epoch": 0.64, "learning_rate": 6.14507631412748e-06, "loss": 2.3414, "step": 6360 }, { "epoch": 0.64, "learning_rate": 6.142082216800578e-06, "loss": 2.353, "step": 6361 }, { "epoch": 0.64, "learning_rate": 6.139088525741346e-06, "loss": 2.3217, "step": 6362 }, { "epoch": 0.64, "learning_rate": 6.136095241265052e-06, "loss": 2.3332, "step": 6363 }, { "epoch": 0.64, "learning_rate": 6.133102363686908e-06, "loss": 2.385, "step": 6364 }, { "epoch": 0.64, "learning_rate": 6.1301098933220845e-06, "loss": 2.3811, "step": 6365 }, { "epoch": 0.64, "learning_rate": 6.127117830485712e-06, "loss": 2.3293, "step": 6366 }, { "epoch": 0.64, "learning_rate": 6.1241261754928784e-06, "loss": 2.409, "step": 6367 }, { "epoch": 0.64, "learning_rate": 6.121134928658625e-06, "loss": 2.3742, "step": 6368 }, { "epoch": 0.64, "learning_rate": 6.118144090297955e-06, "loss": 2.352, "step": 6369 }, { "epoch": 0.64, "learning_rate": 6.115153660725823e-06, "loss": 2.3718, "step": 6370 }, { "epoch": 0.64, "learning_rate": 6.1121636402571464e-06, "loss": 2.3858, "step": 6371 }, { "epoch": 0.64, "learning_rate": 6.109174029206796e-06, "loss": 2.2645, "step": 6372 }, { "epoch": 0.64, "learning_rate": 6.106184827889601e-06, "loss": 2.2442, "step": 6373 }, { "epoch": 0.64, "learning_rate": 6.103196036620345e-06, "loss": 2.343, "step": 6374 }, { "epoch": 0.64, "learning_rate": 6.100207655713771e-06, "loss": 2.2335, "step": 6375 }, { "epoch": 0.64, "learning_rate": 6.097219685484579e-06, "loss": 2.3555, "step": 6376 }, { "epoch": 0.64, "learning_rate": 6.0942321262474224e-06, "loss": 2.2513, "step": 6377 }, { "epoch": 0.64, "learning_rate": 6.0912449783169145e-06, "loss": 2.2806, "step": 6378 }, { "epoch": 0.64, "learning_rate": 6.088258242007627e-06, "loss": 2.2689, "step": 6379 }, { "epoch": 0.64, "learning_rate": 6.085271917634079e-06, "loss": 2.3056, "step": 6380 }, { "epoch": 0.64, "learning_rate": 6.08228600551076e-06, "loss": 2.3785, "step": 6381 }, { "epoch": 0.64, "learning_rate": 6.079300505952107e-06, "loss": 2.3811, "step": 6382 }, { "epoch": 0.64, "learning_rate": 6.076315419272514e-06, "loss": 2.2946, "step": 6383 }, { "epoch": 0.64, "learning_rate": 6.0733307457863345e-06, "loss": 2.2534, "step": 6384 }, { "epoch": 0.64, "learning_rate": 6.070346485807874e-06, "loss": 2.4703, "step": 6385 }, { "epoch": 0.64, "learning_rate": 6.067362639651402e-06, "loss": 2.3147, "step": 6386 }, { "epoch": 0.64, "learning_rate": 6.064379207631136e-06, "loss": 2.3491, "step": 6387 }, { "epoch": 0.64, "learning_rate": 6.061396190061255e-06, "loss": 2.3674, "step": 6388 }, { "epoch": 0.64, "learning_rate": 6.058413587255893e-06, "loss": 2.3148, "step": 6389 }, { "epoch": 0.64, "learning_rate": 6.055431399529141e-06, "loss": 2.3933, "step": 6390 }, { "epoch": 0.64, "learning_rate": 6.0524496271950475e-06, "loss": 2.373, "step": 6391 }, { "epoch": 0.64, "learning_rate": 6.049468270567611e-06, "loss": 2.3317, "step": 6392 }, { "epoch": 0.64, "learning_rate": 6.046487329960795e-06, "loss": 2.3207, "step": 6393 }, { "epoch": 0.64, "learning_rate": 6.043506805688512e-06, "loss": 2.3271, "step": 6394 }, { "epoch": 0.64, "learning_rate": 6.040526698064636e-06, "loss": 2.3631, "step": 6395 }, { "epoch": 0.64, "learning_rate": 6.037547007402993e-06, "loss": 2.3505, "step": 6396 }, { "epoch": 0.64, "learning_rate": 6.0345677340173666e-06, "loss": 2.2861, "step": 6397 }, { "epoch": 0.64, "learning_rate": 6.0315888782214945e-06, "loss": 2.404, "step": 6398 }, { "epoch": 0.64, "learning_rate": 6.028610440329078e-06, "loss": 2.3375, "step": 6399 }, { "epoch": 0.64, "learning_rate": 6.025632420653769e-06, "loss": 2.3016, "step": 6400 }, { "epoch": 0.64, "learning_rate": 6.02265481950917e-06, "loss": 2.2932, "step": 6401 }, { "epoch": 0.64, "learning_rate": 6.019677637208847e-06, "loss": 2.2818, "step": 6402 }, { "epoch": 0.64, "learning_rate": 6.01670087406632e-06, "loss": 2.3957, "step": 6403 }, { "epoch": 0.64, "learning_rate": 6.013724530395064e-06, "loss": 2.2591, "step": 6404 }, { "epoch": 0.64, "learning_rate": 6.010748606508512e-06, "loss": 2.3238, "step": 6405 }, { "epoch": 0.64, "learning_rate": 6.0077731027200495e-06, "loss": 2.3148, "step": 6406 }, { "epoch": 0.64, "learning_rate": 6.004798019343015e-06, "loss": 2.2209, "step": 6407 }, { "epoch": 0.64, "learning_rate": 6.001823356690715e-06, "loss": 2.394, "step": 6408 }, { "epoch": 0.64, "learning_rate": 5.998849115076402e-06, "loss": 2.2867, "step": 6409 }, { "epoch": 0.64, "learning_rate": 5.995875294813283e-06, "loss": 2.3431, "step": 6410 }, { "epoch": 0.64, "learning_rate": 5.9929018962145254e-06, "loss": 2.3785, "step": 6411 }, { "epoch": 0.64, "learning_rate": 5.989928919593253e-06, "loss": 2.3689, "step": 6412 }, { "epoch": 0.64, "learning_rate": 5.986956365262537e-06, "loss": 2.33, "step": 6413 }, { "epoch": 0.64, "learning_rate": 5.983984233535412e-06, "loss": 2.2566, "step": 6414 }, { "epoch": 0.64, "learning_rate": 5.9810125247248655e-06, "loss": 2.1849, "step": 6415 }, { "epoch": 0.64, "learning_rate": 5.978041239143837e-06, "loss": 2.3233, "step": 6416 }, { "epoch": 0.64, "learning_rate": 5.975070377105234e-06, "loss": 2.2821, "step": 6417 }, { "epoch": 0.64, "learning_rate": 5.972099938921907e-06, "loss": 2.2695, "step": 6418 }, { "epoch": 0.64, "learning_rate": 5.969129924906662e-06, "loss": 2.3197, "step": 6419 }, { "epoch": 0.64, "learning_rate": 5.966160335372269e-06, "loss": 2.3174, "step": 6420 }, { "epoch": 0.64, "learning_rate": 5.963191170631442e-06, "loss": 2.3923, "step": 6421 }, { "epoch": 0.64, "learning_rate": 5.960222430996861e-06, "loss": 2.2745, "step": 6422 }, { "epoch": 0.64, "learning_rate": 5.957254116781155e-06, "loss": 2.2858, "step": 6423 }, { "epoch": 0.64, "learning_rate": 5.954286228296911e-06, "loss": 2.2864, "step": 6424 }, { "epoch": 0.64, "learning_rate": 5.951318765856664e-06, "loss": 2.3084, "step": 6425 }, { "epoch": 0.64, "learning_rate": 5.948351729772917e-06, "loss": 2.3719, "step": 6426 }, { "epoch": 0.64, "learning_rate": 5.9453851203581205e-06, "loss": 2.4995, "step": 6427 }, { "epoch": 0.64, "learning_rate": 5.942418937924677e-06, "loss": 2.3359, "step": 6428 }, { "epoch": 0.64, "learning_rate": 5.939453182784951e-06, "loss": 2.3179, "step": 6429 }, { "epoch": 0.64, "learning_rate": 5.936487855251258e-06, "loss": 2.2916, "step": 6430 }, { "epoch": 0.64, "learning_rate": 5.933522955635869e-06, "loss": 2.3149, "step": 6431 }, { "epoch": 0.64, "learning_rate": 5.930558484251007e-06, "loss": 2.2673, "step": 6432 }, { "epoch": 0.64, "learning_rate": 5.92759444140886e-06, "loss": 2.2604, "step": 6433 }, { "epoch": 0.64, "learning_rate": 5.924630827421556e-06, "loss": 2.4049, "step": 6434 }, { "epoch": 0.64, "learning_rate": 5.921667642601192e-06, "loss": 2.3167, "step": 6435 }, { "epoch": 0.64, "learning_rate": 5.9187048872598115e-06, "loss": 2.3346, "step": 6436 }, { "epoch": 0.64, "learning_rate": 5.915742561709414e-06, "loss": 2.2125, "step": 6437 }, { "epoch": 0.65, "learning_rate": 5.912780666261957e-06, "loss": 2.3899, "step": 6438 }, { "epoch": 0.65, "learning_rate": 5.909819201229346e-06, "loss": 2.3234, "step": 6439 }, { "epoch": 0.65, "learning_rate": 5.906858166923451e-06, "loss": 2.2799, "step": 6440 }, { "epoch": 0.65, "learning_rate": 5.9038975636560855e-06, "loss": 2.3835, "step": 6441 }, { "epoch": 0.65, "learning_rate": 5.900937391739028e-06, "loss": 2.2608, "step": 6442 }, { "epoch": 0.65, "learning_rate": 5.897977651484002e-06, "loss": 2.3882, "step": 6443 }, { "epoch": 0.65, "learning_rate": 5.895018343202694e-06, "loss": 2.3657, "step": 6444 }, { "epoch": 0.65, "learning_rate": 5.892059467206741e-06, "loss": 2.3514, "step": 6445 }, { "epoch": 0.65, "learning_rate": 5.889101023807735e-06, "loss": 2.341, "step": 6446 }, { "epoch": 0.65, "learning_rate": 5.88614301331722e-06, "loss": 2.3803, "step": 6447 }, { "epoch": 0.65, "learning_rate": 5.883185436046701e-06, "loss": 2.4242, "step": 6448 }, { "epoch": 0.65, "learning_rate": 5.880228292307628e-06, "loss": 2.3638, "step": 6449 }, { "epoch": 0.65, "learning_rate": 5.877271582411413e-06, "loss": 2.383, "step": 6450 }, { "epoch": 0.65, "learning_rate": 5.87431530666942e-06, "loss": 2.3007, "step": 6451 }, { "epoch": 0.65, "learning_rate": 5.871359465392964e-06, "loss": 2.2584, "step": 6452 }, { "epoch": 0.65, "learning_rate": 5.868404058893322e-06, "loss": 2.3099, "step": 6453 }, { "epoch": 0.65, "learning_rate": 5.865449087481718e-06, "loss": 2.2588, "step": 6454 }, { "epoch": 0.65, "learning_rate": 5.862494551469333e-06, "loss": 2.3854, "step": 6455 }, { "epoch": 0.65, "learning_rate": 5.859540451167301e-06, "loss": 2.3558, "step": 6456 }, { "epoch": 0.65, "learning_rate": 5.856586786886712e-06, "loss": 2.3379, "step": 6457 }, { "epoch": 0.65, "learning_rate": 5.853633558938608e-06, "loss": 2.4121, "step": 6458 }, { "epoch": 0.65, "learning_rate": 5.850680767633987e-06, "loss": 2.3039, "step": 6459 }, { "epoch": 0.65, "learning_rate": 5.8477284132838e-06, "loss": 2.3601, "step": 6460 }, { "epoch": 0.65, "learning_rate": 5.8447764961989475e-06, "loss": 2.2595, "step": 6461 }, { "epoch": 0.65, "learning_rate": 5.841825016690297e-06, "loss": 2.3292, "step": 6462 }, { "epoch": 0.65, "learning_rate": 5.8388739750686565e-06, "loss": 2.1404, "step": 6463 }, { "epoch": 0.65, "learning_rate": 5.835923371644794e-06, "loss": 2.2434, "step": 6464 }, { "epoch": 0.65, "learning_rate": 5.832973206729429e-06, "loss": 2.3519, "step": 6465 }, { "epoch": 0.65, "learning_rate": 5.8300234806332365e-06, "loss": 2.3736, "step": 6466 }, { "epoch": 0.65, "learning_rate": 5.8270741936668465e-06, "loss": 2.43, "step": 6467 }, { "epoch": 0.65, "learning_rate": 5.824125346140836e-06, "loss": 2.2731, "step": 6468 }, { "epoch": 0.65, "learning_rate": 5.8211769383657465e-06, "loss": 2.2638, "step": 6469 }, { "epoch": 0.65, "learning_rate": 5.818228970652067e-06, "loss": 2.2921, "step": 6470 }, { "epoch": 0.65, "learning_rate": 5.8152814433102366e-06, "loss": 2.3218, "step": 6471 }, { "epoch": 0.65, "learning_rate": 5.8123343566506525e-06, "loss": 2.3604, "step": 6472 }, { "epoch": 0.65, "learning_rate": 5.809387710983669e-06, "loss": 2.3151, "step": 6473 }, { "epoch": 0.65, "learning_rate": 5.806441506619588e-06, "loss": 2.4516, "step": 6474 }, { "epoch": 0.65, "learning_rate": 5.803495743868665e-06, "loss": 2.2164, "step": 6475 }, { "epoch": 0.65, "learning_rate": 5.8005504230411135e-06, "loss": 2.2202, "step": 6476 }, { "epoch": 0.65, "learning_rate": 5.797605544447098e-06, "loss": 2.3657, "step": 6477 }, { "epoch": 0.65, "learning_rate": 5.794661108396733e-06, "loss": 2.3462, "step": 6478 }, { "epoch": 0.65, "learning_rate": 5.791717115200088e-06, "loss": 2.309, "step": 6479 }, { "epoch": 0.65, "learning_rate": 5.788773565167198e-06, "loss": 2.3319, "step": 6480 }, { "epoch": 0.65, "learning_rate": 5.785830458608032e-06, "loss": 2.2611, "step": 6481 }, { "epoch": 0.65, "learning_rate": 5.782887795832523e-06, "loss": 2.4061, "step": 6482 }, { "epoch": 0.65, "learning_rate": 5.779945577150558e-06, "loss": 2.4424, "step": 6483 }, { "epoch": 0.65, "learning_rate": 5.777003802871972e-06, "loss": 2.3242, "step": 6484 }, { "epoch": 0.65, "learning_rate": 5.7740624733065565e-06, "loss": 2.2579, "step": 6485 }, { "epoch": 0.65, "learning_rate": 5.7711215887640555e-06, "loss": 2.3252, "step": 6486 }, { "epoch": 0.65, "learning_rate": 5.7681811495541664e-06, "loss": 2.315, "step": 6487 }, { "epoch": 0.65, "learning_rate": 5.7652411559865365e-06, "loss": 2.2258, "step": 6488 }, { "epoch": 0.65, "learning_rate": 5.762301608370775e-06, "loss": 2.2697, "step": 6489 }, { "epoch": 0.65, "learning_rate": 5.759362507016439e-06, "loss": 2.3493, "step": 6490 }, { "epoch": 0.65, "learning_rate": 5.756423852233031e-06, "loss": 2.3157, "step": 6491 }, { "epoch": 0.65, "learning_rate": 5.753485644330017e-06, "loss": 2.3493, "step": 6492 }, { "epoch": 0.65, "learning_rate": 5.750547883616811e-06, "loss": 2.355, "step": 6493 }, { "epoch": 0.65, "learning_rate": 5.747610570402784e-06, "loss": 2.325, "step": 6494 }, { "epoch": 0.65, "learning_rate": 5.744673704997253e-06, "loss": 2.2449, "step": 6495 }, { "epoch": 0.65, "learning_rate": 5.741737287709497e-06, "loss": 2.3284, "step": 6496 }, { "epoch": 0.65, "learning_rate": 5.7388013188487346e-06, "loss": 2.3316, "step": 6497 }, { "epoch": 0.65, "learning_rate": 5.735865798724154e-06, "loss": 2.3363, "step": 6498 }, { "epoch": 0.65, "learning_rate": 5.732930727644887e-06, "loss": 2.1615, "step": 6499 }, { "epoch": 0.65, "learning_rate": 5.729996105920014e-06, "loss": 2.3285, "step": 6500 }, { "epoch": 0.65, "learning_rate": 5.727061933858575e-06, "loss": 2.2576, "step": 6501 }, { "epoch": 0.65, "learning_rate": 5.72412821176956e-06, "loss": 2.2866, "step": 6502 }, { "epoch": 0.65, "learning_rate": 5.721194939961912e-06, "loss": 2.3067, "step": 6503 }, { "epoch": 0.65, "learning_rate": 5.718262118744527e-06, "loss": 2.3443, "step": 6504 }, { "epoch": 0.65, "learning_rate": 5.715329748426246e-06, "loss": 2.2532, "step": 6505 }, { "epoch": 0.65, "learning_rate": 5.7123978293158825e-06, "loss": 2.3697, "step": 6506 }, { "epoch": 0.65, "learning_rate": 5.709466361722182e-06, "loss": 2.3544, "step": 6507 }, { "epoch": 0.65, "learning_rate": 5.7065353459538515e-06, "loss": 2.3648, "step": 6508 }, { "epoch": 0.65, "learning_rate": 5.703604782319549e-06, "loss": 2.2533, "step": 6509 }, { "epoch": 0.65, "learning_rate": 5.700674671127884e-06, "loss": 2.2889, "step": 6510 }, { "epoch": 0.65, "learning_rate": 5.697745012687419e-06, "loss": 2.1952, "step": 6511 }, { "epoch": 0.65, "learning_rate": 5.69481580730667e-06, "loss": 2.32, "step": 6512 }, { "epoch": 0.65, "learning_rate": 5.691887055294105e-06, "loss": 2.3147, "step": 6513 }, { "epoch": 0.65, "learning_rate": 5.688958756958141e-06, "loss": 2.3432, "step": 6514 }, { "epoch": 0.65, "learning_rate": 5.686030912607152e-06, "loss": 2.3872, "step": 6515 }, { "epoch": 0.65, "learning_rate": 5.68310352254946e-06, "loss": 2.2689, "step": 6516 }, { "epoch": 0.65, "learning_rate": 5.680176587093345e-06, "loss": 2.362, "step": 6517 }, { "epoch": 0.65, "learning_rate": 5.67725010654703e-06, "loss": 2.3129, "step": 6518 }, { "epoch": 0.65, "learning_rate": 5.6743240812186984e-06, "loss": 2.2992, "step": 6519 }, { "epoch": 0.65, "learning_rate": 5.671398511416483e-06, "loss": 2.3001, "step": 6520 }, { "epoch": 0.65, "learning_rate": 5.6684733974484675e-06, "loss": 2.3115, "step": 6521 }, { "epoch": 0.65, "learning_rate": 5.665548739622687e-06, "loss": 2.3396, "step": 6522 }, { "epoch": 0.65, "learning_rate": 5.662624538247128e-06, "loss": 2.2089, "step": 6523 }, { "epoch": 0.65, "learning_rate": 5.659700793629738e-06, "loss": 2.3203, "step": 6524 }, { "epoch": 0.65, "learning_rate": 5.656777506078405e-06, "loss": 2.3013, "step": 6525 }, { "epoch": 0.65, "learning_rate": 5.653854675900974e-06, "loss": 2.3681, "step": 6526 }, { "epoch": 0.65, "learning_rate": 5.650932303405239e-06, "loss": 2.2644, "step": 6527 }, { "epoch": 0.65, "learning_rate": 5.648010388898949e-06, "loss": 2.2359, "step": 6528 }, { "epoch": 0.65, "learning_rate": 5.645088932689804e-06, "loss": 2.3072, "step": 6529 }, { "epoch": 0.65, "learning_rate": 5.642167935085454e-06, "loss": 2.3137, "step": 6530 }, { "epoch": 0.65, "learning_rate": 5.639247396393503e-06, "loss": 2.3744, "step": 6531 }, { "epoch": 0.65, "learning_rate": 5.636327316921506e-06, "loss": 2.2775, "step": 6532 }, { "epoch": 0.65, "learning_rate": 5.633407696976969e-06, "loss": 2.3051, "step": 6533 }, { "epoch": 0.65, "learning_rate": 5.630488536867349e-06, "loss": 2.2982, "step": 6534 }, { "epoch": 0.65, "learning_rate": 5.627569836900055e-06, "loss": 2.1943, "step": 6535 }, { "epoch": 0.65, "learning_rate": 5.624651597382449e-06, "loss": 2.2853, "step": 6536 }, { "epoch": 0.65, "learning_rate": 5.621733818621844e-06, "loss": 2.2774, "step": 6537 }, { "epoch": 0.66, "learning_rate": 5.618816500925503e-06, "loss": 2.2865, "step": 6538 }, { "epoch": 0.66, "learning_rate": 5.615899644600643e-06, "loss": 2.3358, "step": 6539 }, { "epoch": 0.66, "learning_rate": 5.612983249954429e-06, "loss": 2.2089, "step": 6540 }, { "epoch": 0.66, "learning_rate": 5.610067317293975e-06, "loss": 2.4312, "step": 6541 }, { "epoch": 0.66, "learning_rate": 5.6071518469263604e-06, "loss": 2.3704, "step": 6542 }, { "epoch": 0.66, "learning_rate": 5.604236839158601e-06, "loss": 2.3038, "step": 6543 }, { "epoch": 0.66, "learning_rate": 5.60132229429767e-06, "loss": 2.3668, "step": 6544 }, { "epoch": 0.66, "learning_rate": 5.598408212650488e-06, "loss": 2.3175, "step": 6545 }, { "epoch": 0.66, "learning_rate": 5.595494594523934e-06, "loss": 2.3079, "step": 6546 }, { "epoch": 0.66, "learning_rate": 5.592581440224829e-06, "loss": 2.4047, "step": 6547 }, { "epoch": 0.66, "learning_rate": 5.589668750059954e-06, "loss": 2.3208, "step": 6548 }, { "epoch": 0.66, "learning_rate": 5.5867565243360365e-06, "loss": 2.3388, "step": 6549 }, { "epoch": 0.66, "learning_rate": 5.583844763359749e-06, "loss": 2.3856, "step": 6550 }, { "epoch": 0.66, "learning_rate": 5.580933467437733e-06, "loss": 2.3229, "step": 6551 }, { "epoch": 0.66, "learning_rate": 5.578022636876563e-06, "loss": 2.3721, "step": 6552 }, { "epoch": 0.66, "learning_rate": 5.575112271982773e-06, "loss": 2.2287, "step": 6553 }, { "epoch": 0.66, "learning_rate": 5.5722023730628505e-06, "loss": 2.2538, "step": 6554 }, { "epoch": 0.66, "learning_rate": 5.569292940423221e-06, "loss": 2.2448, "step": 6555 }, { "epoch": 0.66, "learning_rate": 5.566383974370273e-06, "loss": 2.295, "step": 6556 }, { "epoch": 0.66, "learning_rate": 5.563475475210344e-06, "loss": 2.2199, "step": 6557 }, { "epoch": 0.66, "learning_rate": 5.560567443249718e-06, "loss": 2.2573, "step": 6558 }, { "epoch": 0.66, "learning_rate": 5.557659878794633e-06, "loss": 2.3341, "step": 6559 }, { "epoch": 0.66, "learning_rate": 5.5547527821512815e-06, "loss": 2.3001, "step": 6560 }, { "epoch": 0.66, "learning_rate": 5.5518461536258e-06, "loss": 2.2833, "step": 6561 }, { "epoch": 0.66, "learning_rate": 5.548939993524278e-06, "loss": 2.3214, "step": 6562 }, { "epoch": 0.66, "learning_rate": 5.5460343021527565e-06, "loss": 2.2444, "step": 6563 }, { "epoch": 0.66, "learning_rate": 5.543129079817226e-06, "loss": 2.3232, "step": 6564 }, { "epoch": 0.66, "learning_rate": 5.540224326823629e-06, "loss": 2.2964, "step": 6565 }, { "epoch": 0.66, "learning_rate": 5.5373200434778565e-06, "loss": 2.3574, "step": 6566 }, { "epoch": 0.66, "learning_rate": 5.534416230085751e-06, "loss": 2.2859, "step": 6567 }, { "epoch": 0.66, "learning_rate": 5.531512886953104e-06, "loss": 2.3537, "step": 6568 }, { "epoch": 0.66, "learning_rate": 5.528610014385667e-06, "loss": 2.3143, "step": 6569 }, { "epoch": 0.66, "learning_rate": 5.525707612689128e-06, "loss": 2.3468, "step": 6570 }, { "epoch": 0.66, "learning_rate": 5.522805682169132e-06, "loss": 2.1427, "step": 6571 }, { "epoch": 0.66, "learning_rate": 5.519904223131278e-06, "loss": 2.4102, "step": 6572 }, { "epoch": 0.66, "learning_rate": 5.517003235881106e-06, "loss": 2.2907, "step": 6573 }, { "epoch": 0.66, "learning_rate": 5.514102720724116e-06, "loss": 2.2459, "step": 6574 }, { "epoch": 0.66, "learning_rate": 5.5112026779657515e-06, "loss": 2.3481, "step": 6575 }, { "epoch": 0.66, "learning_rate": 5.508303107911409e-06, "loss": 2.3399, "step": 6576 }, { "epoch": 0.66, "learning_rate": 5.505404010866435e-06, "loss": 2.248, "step": 6577 }, { "epoch": 0.66, "learning_rate": 5.502505387136128e-06, "loss": 2.3518, "step": 6578 }, { "epoch": 0.66, "learning_rate": 5.4996072370257326e-06, "loss": 2.2424, "step": 6579 }, { "epoch": 0.66, "learning_rate": 5.4967095608404475e-06, "loss": 2.2352, "step": 6580 }, { "epoch": 0.66, "learning_rate": 5.493812358885418e-06, "loss": 2.2605, "step": 6581 }, { "epoch": 0.66, "learning_rate": 5.490915631465742e-06, "loss": 2.325, "step": 6582 }, { "epoch": 0.66, "learning_rate": 5.488019378886467e-06, "loss": 2.28, "step": 6583 }, { "epoch": 0.66, "learning_rate": 5.485123601452589e-06, "loss": 2.2509, "step": 6584 }, { "epoch": 0.66, "learning_rate": 5.482228299469056e-06, "loss": 2.3637, "step": 6585 }, { "epoch": 0.66, "learning_rate": 5.479333473240761e-06, "loss": 2.2481, "step": 6586 }, { "epoch": 0.66, "learning_rate": 5.476439123072559e-06, "loss": 2.4683, "step": 6587 }, { "epoch": 0.66, "learning_rate": 5.473545249269242e-06, "loss": 2.3359, "step": 6588 }, { "epoch": 0.66, "learning_rate": 5.470651852135558e-06, "loss": 2.3303, "step": 6589 }, { "epoch": 0.66, "learning_rate": 5.467758931976202e-06, "loss": 2.349, "step": 6590 }, { "epoch": 0.66, "learning_rate": 5.464866489095819e-06, "loss": 2.2753, "step": 6591 }, { "epoch": 0.66, "learning_rate": 5.461974523799008e-06, "loss": 2.3387, "step": 6592 }, { "epoch": 0.66, "learning_rate": 5.4590830363903135e-06, "loss": 2.3036, "step": 6593 }, { "epoch": 0.66, "learning_rate": 5.456192027174232e-06, "loss": 2.3037, "step": 6594 }, { "epoch": 0.66, "learning_rate": 5.453301496455206e-06, "loss": 2.3465, "step": 6595 }, { "epoch": 0.66, "learning_rate": 5.450411444537629e-06, "loss": 2.3886, "step": 6596 }, { "epoch": 0.66, "learning_rate": 5.447521871725849e-06, "loss": 2.3007, "step": 6597 }, { "epoch": 0.66, "learning_rate": 5.444632778324159e-06, "loss": 2.3, "step": 6598 }, { "epoch": 0.66, "learning_rate": 5.4417441646368e-06, "loss": 2.2909, "step": 6599 }, { "epoch": 0.66, "learning_rate": 5.438856030967965e-06, "loss": 2.3096, "step": 6600 }, { "epoch": 0.66, "learning_rate": 5.4359683776217985e-06, "loss": 2.2699, "step": 6601 }, { "epoch": 0.66, "learning_rate": 5.43308120490239e-06, "loss": 2.2752, "step": 6602 }, { "epoch": 0.66, "learning_rate": 5.43019451311378e-06, "loss": 2.2524, "step": 6603 }, { "epoch": 0.66, "learning_rate": 5.427308302559957e-06, "loss": 2.3599, "step": 6604 }, { "epoch": 0.66, "learning_rate": 5.424422573544867e-06, "loss": 2.2901, "step": 6605 }, { "epoch": 0.66, "learning_rate": 5.421537326372394e-06, "loss": 2.3907, "step": 6606 }, { "epoch": 0.66, "learning_rate": 5.41865256134638e-06, "loss": 2.3338, "step": 6607 }, { "epoch": 0.66, "learning_rate": 5.415768278770608e-06, "loss": 2.3055, "step": 6608 }, { "epoch": 0.66, "learning_rate": 5.412884478948817e-06, "loss": 2.2022, "step": 6609 }, { "epoch": 0.66, "learning_rate": 5.410001162184693e-06, "loss": 2.4016, "step": 6610 }, { "epoch": 0.66, "learning_rate": 5.407118328781869e-06, "loss": 2.3298, "step": 6611 }, { "epoch": 0.66, "learning_rate": 5.404235979043929e-06, "loss": 2.2459, "step": 6612 }, { "epoch": 0.66, "learning_rate": 5.401354113274404e-06, "loss": 2.3475, "step": 6613 }, { "epoch": 0.66, "learning_rate": 5.398472731776784e-06, "loss": 2.3248, "step": 6614 }, { "epoch": 0.66, "learning_rate": 5.395591834854495e-06, "loss": 2.3674, "step": 6615 }, { "epoch": 0.66, "learning_rate": 5.3927114228109165e-06, "loss": 2.3132, "step": 6616 }, { "epoch": 0.66, "learning_rate": 5.389831495949378e-06, "loss": 2.4363, "step": 6617 }, { "epoch": 0.66, "learning_rate": 5.386952054573162e-06, "loss": 2.4532, "step": 6618 }, { "epoch": 0.66, "learning_rate": 5.3840730989854875e-06, "loss": 2.331, "step": 6619 }, { "epoch": 0.66, "learning_rate": 5.3811946294895335e-06, "loss": 2.3369, "step": 6620 }, { "epoch": 0.66, "learning_rate": 5.378316646388424e-06, "loss": 2.3662, "step": 6621 }, { "epoch": 0.66, "learning_rate": 5.375439149985229e-06, "loss": 2.3363, "step": 6622 }, { "epoch": 0.66, "learning_rate": 5.3725621405829775e-06, "loss": 2.1748, "step": 6623 }, { "epoch": 0.66, "learning_rate": 5.369685618484638e-06, "loss": 2.3434, "step": 6624 }, { "epoch": 0.66, "learning_rate": 5.366809583993128e-06, "loss": 2.3057, "step": 6625 }, { "epoch": 0.66, "learning_rate": 5.363934037411316e-06, "loss": 2.3229, "step": 6626 }, { "epoch": 0.66, "learning_rate": 5.361058979042019e-06, "loss": 2.2976, "step": 6627 }, { "epoch": 0.66, "learning_rate": 5.358184409188002e-06, "loss": 2.3278, "step": 6628 }, { "epoch": 0.66, "learning_rate": 5.355310328151979e-06, "loss": 2.3766, "step": 6629 }, { "epoch": 0.66, "learning_rate": 5.35243673623661e-06, "loss": 2.3235, "step": 6630 }, { "epoch": 0.66, "learning_rate": 5.3495636337445065e-06, "loss": 2.3468, "step": 6631 }, { "epoch": 0.66, "learning_rate": 5.346691020978232e-06, "loss": 2.4169, "step": 6632 }, { "epoch": 0.66, "learning_rate": 5.3438188982402915e-06, "loss": 2.3908, "step": 6633 }, { "epoch": 0.66, "learning_rate": 5.3409472658331406e-06, "loss": 2.2804, "step": 6634 }, { "epoch": 0.66, "learning_rate": 5.338076124059184e-06, "loss": 2.295, "step": 6635 }, { "epoch": 0.66, "learning_rate": 5.335205473220773e-06, "loss": 2.2506, "step": 6636 }, { "epoch": 0.66, "learning_rate": 5.332335313620211e-06, "loss": 2.3305, "step": 6637 }, { "epoch": 0.67, "learning_rate": 5.329465645559748e-06, "loss": 2.3245, "step": 6638 }, { "epoch": 0.67, "learning_rate": 5.3265964693415785e-06, "loss": 2.2606, "step": 6639 }, { "epoch": 0.67, "learning_rate": 5.3237277852678494e-06, "loss": 2.2957, "step": 6640 }, { "epoch": 0.67, "learning_rate": 5.320859593640655e-06, "loss": 2.3742, "step": 6641 }, { "epoch": 0.67, "learning_rate": 5.317991894762038e-06, "loss": 2.3167, "step": 6642 }, { "epoch": 0.67, "learning_rate": 5.3151246889339884e-06, "loss": 2.3528, "step": 6643 }, { "epoch": 0.67, "learning_rate": 5.312257976458442e-06, "loss": 2.3953, "step": 6644 }, { "epoch": 0.67, "learning_rate": 5.309391757637289e-06, "loss": 2.3298, "step": 6645 }, { "epoch": 0.67, "learning_rate": 5.306526032772361e-06, "loss": 2.2783, "step": 6646 }, { "epoch": 0.67, "learning_rate": 5.303660802165441e-06, "loss": 2.2422, "step": 6647 }, { "epoch": 0.67, "learning_rate": 5.30079606611826e-06, "loss": 2.2732, "step": 6648 }, { "epoch": 0.67, "learning_rate": 5.297931824932492e-06, "loss": 2.2778, "step": 6649 }, { "epoch": 0.67, "learning_rate": 5.295068078909771e-06, "loss": 2.3649, "step": 6650 }, { "epoch": 0.67, "learning_rate": 5.292204828351666e-06, "loss": 2.2799, "step": 6651 }, { "epoch": 0.67, "learning_rate": 5.289342073559698e-06, "loss": 2.3877, "step": 6652 }, { "epoch": 0.67, "learning_rate": 5.286479814835339e-06, "loss": 2.4127, "step": 6653 }, { "epoch": 0.67, "learning_rate": 5.283618052480006e-06, "loss": 2.3613, "step": 6654 }, { "epoch": 0.67, "learning_rate": 5.2807567867950625e-06, "loss": 2.2045, "step": 6655 }, { "epoch": 0.67, "learning_rate": 5.277896018081823e-06, "loss": 2.2374, "step": 6656 }, { "epoch": 0.67, "learning_rate": 5.275035746641547e-06, "loss": 2.3357, "step": 6657 }, { "epoch": 0.67, "learning_rate": 5.2721759727754415e-06, "loss": 2.3382, "step": 6658 }, { "epoch": 0.67, "learning_rate": 5.269316696784664e-06, "loss": 2.2271, "step": 6659 }, { "epoch": 0.67, "learning_rate": 5.266457918970317e-06, "loss": 2.3349, "step": 6660 }, { "epoch": 0.67, "learning_rate": 5.26359963963345e-06, "loss": 2.3013, "step": 6661 }, { "epoch": 0.67, "learning_rate": 5.260741859075062e-06, "loss": 2.2406, "step": 6662 }, { "epoch": 0.67, "learning_rate": 5.2578845775961015e-06, "loss": 2.357, "step": 6663 }, { "epoch": 0.67, "learning_rate": 5.255027795497457e-06, "loss": 2.3554, "step": 6664 }, { "epoch": 0.67, "learning_rate": 5.252171513079972e-06, "loss": 2.3276, "step": 6665 }, { "epoch": 0.67, "learning_rate": 5.249315730644433e-06, "loss": 2.3407, "step": 6666 }, { "epoch": 0.67, "learning_rate": 5.246460448491574e-06, "loss": 2.2929, "step": 6667 }, { "epoch": 0.67, "learning_rate": 5.243605666922083e-06, "loss": 2.3564, "step": 6668 }, { "epoch": 0.67, "learning_rate": 5.240751386236585e-06, "loss": 2.3379, "step": 6669 }, { "epoch": 0.67, "learning_rate": 5.23789760673566e-06, "loss": 2.3791, "step": 6670 }, { "epoch": 0.67, "learning_rate": 5.235044328719831e-06, "loss": 2.3234, "step": 6671 }, { "epoch": 0.67, "learning_rate": 5.232191552489569e-06, "loss": 2.3348, "step": 6672 }, { "epoch": 0.67, "learning_rate": 5.229339278345296e-06, "loss": 2.2615, "step": 6673 }, { "epoch": 0.67, "learning_rate": 5.2264875065873725e-06, "loss": 2.3447, "step": 6674 }, { "epoch": 0.67, "learning_rate": 5.223636237516112e-06, "loss": 2.2961, "step": 6675 }, { "epoch": 0.67, "learning_rate": 5.22078547143178e-06, "loss": 2.3147, "step": 6676 }, { "epoch": 0.67, "learning_rate": 5.2179352086345804e-06, "loss": 2.3666, "step": 6677 }, { "epoch": 0.67, "learning_rate": 5.215085449424666e-06, "loss": 2.3655, "step": 6678 }, { "epoch": 0.67, "learning_rate": 5.212236194102141e-06, "loss": 2.2983, "step": 6679 }, { "epoch": 0.67, "learning_rate": 5.209387442967051e-06, "loss": 2.2917, "step": 6680 }, { "epoch": 0.67, "learning_rate": 5.206539196319394e-06, "loss": 2.261, "step": 6681 }, { "epoch": 0.67, "learning_rate": 5.203691454459106e-06, "loss": 2.179, "step": 6682 }, { "epoch": 0.67, "learning_rate": 5.200844217686078e-06, "loss": 2.395, "step": 6683 }, { "epoch": 0.67, "learning_rate": 5.197997486300142e-06, "loss": 2.3387, "step": 6684 }, { "epoch": 0.67, "learning_rate": 5.195151260601088e-06, "loss": 2.3618, "step": 6685 }, { "epoch": 0.67, "learning_rate": 5.192305540888642e-06, "loss": 2.3194, "step": 6686 }, { "epoch": 0.67, "learning_rate": 5.189460327462478e-06, "loss": 2.1893, "step": 6687 }, { "epoch": 0.67, "learning_rate": 5.1866156206222185e-06, "loss": 2.2828, "step": 6688 }, { "epoch": 0.67, "learning_rate": 5.183771420667433e-06, "loss": 2.2845, "step": 6689 }, { "epoch": 0.67, "learning_rate": 5.1809277278976365e-06, "loss": 2.3416, "step": 6690 }, { "epoch": 0.67, "learning_rate": 5.178084542612293e-06, "loss": 2.2124, "step": 6691 }, { "epoch": 0.67, "learning_rate": 5.1752418651108094e-06, "loss": 2.3614, "step": 6692 }, { "epoch": 0.67, "learning_rate": 5.172399695692536e-06, "loss": 2.2599, "step": 6693 }, { "epoch": 0.67, "learning_rate": 5.169558034656786e-06, "loss": 2.3521, "step": 6694 }, { "epoch": 0.67, "learning_rate": 5.1667168823028e-06, "loss": 2.4106, "step": 6695 }, { "epoch": 0.67, "learning_rate": 5.163876238929775e-06, "loss": 2.321, "step": 6696 }, { "epoch": 0.67, "learning_rate": 5.1610361048368515e-06, "loss": 2.2532, "step": 6697 }, { "epoch": 0.67, "learning_rate": 5.158196480323117e-06, "loss": 2.2182, "step": 6698 }, { "epoch": 0.67, "learning_rate": 5.1553573656876045e-06, "loss": 2.3425, "step": 6699 }, { "epoch": 0.67, "learning_rate": 5.152518761229295e-06, "loss": 2.327, "step": 6700 }, { "epoch": 0.67, "learning_rate": 5.149680667247114e-06, "loss": 2.2017, "step": 6701 }, { "epoch": 0.67, "learning_rate": 5.146843084039934e-06, "loss": 2.383, "step": 6702 }, { "epoch": 0.67, "learning_rate": 5.144006011906575e-06, "loss": 2.3682, "step": 6703 }, { "epoch": 0.67, "learning_rate": 5.141169451145801e-06, "loss": 2.3396, "step": 6704 }, { "epoch": 0.67, "learning_rate": 5.138333402056324e-06, "loss": 2.2608, "step": 6705 }, { "epoch": 0.67, "learning_rate": 5.135497864936799e-06, "loss": 2.2681, "step": 6706 }, { "epoch": 0.67, "learning_rate": 5.1326628400858314e-06, "loss": 2.3847, "step": 6707 }, { "epoch": 0.67, "learning_rate": 5.129828327801971e-06, "loss": 2.3279, "step": 6708 }, { "epoch": 0.67, "learning_rate": 5.126994328383712e-06, "loss": 2.3087, "step": 6709 }, { "epoch": 0.67, "learning_rate": 5.124160842129495e-06, "loss": 2.2885, "step": 6710 }, { "epoch": 0.67, "learning_rate": 5.121327869337707e-06, "loss": 2.2026, "step": 6711 }, { "epoch": 0.67, "learning_rate": 5.1184954103066855e-06, "loss": 2.2992, "step": 6712 }, { "epoch": 0.67, "learning_rate": 5.115663465334706e-06, "loss": 2.2826, "step": 6713 }, { "epoch": 0.67, "learning_rate": 5.1128320347199945e-06, "loss": 2.304, "step": 6714 }, { "epoch": 0.67, "learning_rate": 5.110001118760723e-06, "loss": 2.3403, "step": 6715 }, { "epoch": 0.67, "learning_rate": 5.107170717755006e-06, "loss": 2.2796, "step": 6716 }, { "epoch": 0.67, "learning_rate": 5.104340832000907e-06, "loss": 2.2732, "step": 6717 }, { "epoch": 0.67, "learning_rate": 5.101511461796436e-06, "loss": 2.4196, "step": 6718 }, { "epoch": 0.67, "learning_rate": 5.0986826074395424e-06, "loss": 2.2407, "step": 6719 }, { "epoch": 0.67, "learning_rate": 5.095854269228127e-06, "loss": 2.2781, "step": 6720 }, { "epoch": 0.67, "learning_rate": 5.093026447460042e-06, "loss": 2.4084, "step": 6721 }, { "epoch": 0.67, "learning_rate": 5.09019914243307e-06, "loss": 2.2632, "step": 6722 }, { "epoch": 0.67, "learning_rate": 5.087372354444951e-06, "loss": 2.3728, "step": 6723 }, { "epoch": 0.67, "learning_rate": 5.084546083793364e-06, "loss": 2.2647, "step": 6724 }, { "epoch": 0.67, "learning_rate": 5.081720330775939e-06, "loss": 2.326, "step": 6725 }, { "epoch": 0.67, "learning_rate": 5.078895095690249e-06, "loss": 2.2794, "step": 6726 }, { "epoch": 0.67, "learning_rate": 5.076070378833813e-06, "loss": 2.3862, "step": 6727 }, { "epoch": 0.67, "learning_rate": 5.073246180504092e-06, "loss": 2.3765, "step": 6728 }, { "epoch": 0.67, "learning_rate": 5.070422500998496e-06, "loss": 2.2773, "step": 6729 }, { "epoch": 0.67, "learning_rate": 5.067599340614382e-06, "loss": 2.3151, "step": 6730 }, { "epoch": 0.67, "learning_rate": 5.06477669964905e-06, "loss": 2.34, "step": 6731 }, { "epoch": 0.67, "learning_rate": 5.061954578399744e-06, "loss": 2.4239, "step": 6732 }, { "epoch": 0.67, "learning_rate": 5.0591329771636545e-06, "loss": 2.345, "step": 6733 }, { "epoch": 0.67, "learning_rate": 5.056311896237917e-06, "loss": 2.3453, "step": 6734 }, { "epoch": 0.67, "learning_rate": 5.053491335919614e-06, "loss": 2.3018, "step": 6735 }, { "epoch": 0.67, "learning_rate": 5.050671296505769e-06, "loss": 2.2382, "step": 6736 }, { "epoch": 0.67, "learning_rate": 5.047851778293355e-06, "loss": 2.2986, "step": 6737 }, { "epoch": 0.68, "learning_rate": 5.045032781579284e-06, "loss": 2.2355, "step": 6738 }, { "epoch": 0.68, "learning_rate": 5.042214306660427e-06, "loss": 2.2687, "step": 6739 }, { "epoch": 0.68, "learning_rate": 5.039396353833583e-06, "loss": 2.2707, "step": 6740 }, { "epoch": 0.68, "learning_rate": 5.036578923395508e-06, "loss": 2.3405, "step": 6741 }, { "epoch": 0.68, "learning_rate": 5.033762015642895e-06, "loss": 2.342, "step": 6742 }, { "epoch": 0.68, "learning_rate": 5.030945630872388e-06, "loss": 2.2368, "step": 6743 }, { "epoch": 0.68, "learning_rate": 5.028129769380572e-06, "loss": 2.2874, "step": 6744 }, { "epoch": 0.68, "learning_rate": 5.025314431463981e-06, "loss": 2.3203, "step": 6745 }, { "epoch": 0.68, "learning_rate": 5.022499617419085e-06, "loss": 2.2563, "step": 6746 }, { "epoch": 0.68, "learning_rate": 5.019685327542307e-06, "loss": 2.4154, "step": 6747 }, { "epoch": 0.68, "learning_rate": 5.016871562130017e-06, "loss": 2.286, "step": 6748 }, { "epoch": 0.68, "learning_rate": 5.0140583214785235e-06, "loss": 2.3351, "step": 6749 }, { "epoch": 0.68, "learning_rate": 5.011245605884083e-06, "loss": 2.3406, "step": 6750 }, { "epoch": 0.68, "learning_rate": 5.008433415642893e-06, "loss": 2.3048, "step": 6751 }, { "epoch": 0.68, "learning_rate": 5.005621751051099e-06, "loss": 2.3245, "step": 6752 }, { "epoch": 0.68, "learning_rate": 5.00281061240479e-06, "loss": 2.2101, "step": 6753 }, { "epoch": 0.68, "learning_rate": 5.000000000000003e-06, "loss": 2.3069, "step": 6754 }, { "epoch": 0.68, "learning_rate": 4.997189914132713e-06, "loss": 2.1894, "step": 6755 }, { "epoch": 0.68, "learning_rate": 4.99438035509884e-06, "loss": 2.3515, "step": 6756 }, { "epoch": 0.68, "learning_rate": 4.991571323194261e-06, "loss": 2.3029, "step": 6757 }, { "epoch": 0.68, "learning_rate": 4.9887628187147815e-06, "loss": 2.288, "step": 6758 }, { "epoch": 0.68, "learning_rate": 4.985954841956162e-06, "loss": 2.3432, "step": 6759 }, { "epoch": 0.68, "learning_rate": 4.9831473932141e-06, "loss": 2.3495, "step": 6760 }, { "epoch": 0.68, "learning_rate": 4.980340472784242e-06, "loss": 2.2762, "step": 6761 }, { "epoch": 0.68, "learning_rate": 4.977534080962179e-06, "loss": 2.4098, "step": 6762 }, { "epoch": 0.68, "learning_rate": 4.974728218043443e-06, "loss": 2.2381, "step": 6763 }, { "epoch": 0.68, "learning_rate": 4.971922884323514e-06, "loss": 2.35, "step": 6764 }, { "epoch": 0.68, "learning_rate": 4.9691180800978145e-06, "loss": 2.2959, "step": 6765 }, { "epoch": 0.68, "learning_rate": 4.96631380566171e-06, "loss": 2.3372, "step": 6766 }, { "epoch": 0.68, "learning_rate": 4.963510061310514e-06, "loss": 2.4145, "step": 6767 }, { "epoch": 0.68, "learning_rate": 4.9607068473394795e-06, "loss": 2.3015, "step": 6768 }, { "epoch": 0.68, "learning_rate": 4.957904164043807e-06, "loss": 2.3049, "step": 6769 }, { "epoch": 0.68, "learning_rate": 4.95510201171864e-06, "loss": 2.3556, "step": 6770 }, { "epoch": 0.68, "learning_rate": 4.952300390659066e-06, "loss": 2.2764, "step": 6771 }, { "epoch": 0.68, "learning_rate": 4.949499301160118e-06, "loss": 2.2722, "step": 6772 }, { "epoch": 0.68, "learning_rate": 4.94669874351677e-06, "loss": 2.2786, "step": 6773 }, { "epoch": 0.68, "learning_rate": 4.943898718023938e-06, "loss": 2.3047, "step": 6774 }, { "epoch": 0.68, "learning_rate": 4.941099224976494e-06, "loss": 2.3717, "step": 6775 }, { "epoch": 0.68, "learning_rate": 4.938300264669242e-06, "loss": 2.2328, "step": 6776 }, { "epoch": 0.68, "learning_rate": 4.935501837396933e-06, "loss": 2.3472, "step": 6777 }, { "epoch": 0.68, "learning_rate": 4.932703943454264e-06, "loss": 2.2934, "step": 6778 }, { "epoch": 0.68, "learning_rate": 4.929906583135871e-06, "loss": 2.317, "step": 6779 }, { "epoch": 0.68, "learning_rate": 4.927109756736338e-06, "loss": 2.3117, "step": 6780 }, { "epoch": 0.68, "learning_rate": 4.924313464550195e-06, "loss": 2.0985, "step": 6781 }, { "epoch": 0.68, "learning_rate": 4.921517706871908e-06, "loss": 2.3151, "step": 6782 }, { "epoch": 0.68, "learning_rate": 4.91872248399589e-06, "loss": 2.2886, "step": 6783 }, { "epoch": 0.68, "learning_rate": 4.915927796216506e-06, "loss": 2.3535, "step": 6784 }, { "epoch": 0.68, "learning_rate": 4.913133643828058e-06, "loss": 2.2481, "step": 6785 }, { "epoch": 0.68, "learning_rate": 4.910340027124784e-06, "loss": 2.2751, "step": 6786 }, { "epoch": 0.68, "learning_rate": 4.907546946400875e-06, "loss": 2.4012, "step": 6787 }, { "epoch": 0.68, "learning_rate": 4.904754401950464e-06, "loss": 2.3263, "step": 6788 }, { "epoch": 0.68, "learning_rate": 4.9019623940676275e-06, "loss": 2.1945, "step": 6789 }, { "epoch": 0.68, "learning_rate": 4.8991709230463845e-06, "loss": 2.3529, "step": 6790 }, { "epoch": 0.68, "learning_rate": 4.896379989180697e-06, "loss": 2.3211, "step": 6791 }, { "epoch": 0.68, "learning_rate": 4.89358959276447e-06, "loss": 2.311, "step": 6792 }, { "epoch": 0.68, "learning_rate": 4.8907997340915566e-06, "loss": 2.3204, "step": 6793 }, { "epoch": 0.68, "learning_rate": 4.88801041345575e-06, "loss": 2.2748, "step": 6794 }, { "epoch": 0.68, "learning_rate": 4.885221631150785e-06, "loss": 2.2513, "step": 6795 }, { "epoch": 0.68, "learning_rate": 4.8824333874703414e-06, "loss": 2.3212, "step": 6796 }, { "epoch": 0.68, "learning_rate": 4.879645682708042e-06, "loss": 2.404, "step": 6797 }, { "epoch": 0.68, "learning_rate": 4.876858517157453e-06, "loss": 2.3672, "step": 6798 }, { "epoch": 0.68, "learning_rate": 4.874071891112083e-06, "loss": 2.3218, "step": 6799 }, { "epoch": 0.68, "learning_rate": 4.871285804865387e-06, "loss": 2.3518, "step": 6800 }, { "epoch": 0.68, "learning_rate": 4.8685002587107554e-06, "loss": 2.3298, "step": 6801 }, { "epoch": 0.68, "learning_rate": 4.865715252941534e-06, "loss": 2.4005, "step": 6802 }, { "epoch": 0.68, "learning_rate": 4.862930787851003e-06, "loss": 2.252, "step": 6803 }, { "epoch": 0.68, "learning_rate": 4.860146863732386e-06, "loss": 2.3237, "step": 6804 }, { "epoch": 0.68, "learning_rate": 4.857363480878851e-06, "loss": 2.2677, "step": 6805 }, { "epoch": 0.68, "learning_rate": 4.854580639583509e-06, "loss": 2.3552, "step": 6806 }, { "epoch": 0.68, "learning_rate": 4.851798340139415e-06, "loss": 2.2706, "step": 6807 }, { "epoch": 0.68, "learning_rate": 4.849016582839565e-06, "loss": 2.2896, "step": 6808 }, { "epoch": 0.68, "learning_rate": 4.846235367976905e-06, "loss": 2.3066, "step": 6809 }, { "epoch": 0.68, "learning_rate": 4.843454695844303e-06, "loss": 2.3346, "step": 6810 }, { "epoch": 0.68, "learning_rate": 4.840674566734598e-06, "loss": 2.3082, "step": 6811 }, { "epoch": 0.68, "learning_rate": 4.837894980940554e-06, "loss": 2.2827, "step": 6812 }, { "epoch": 0.68, "learning_rate": 4.835115938754883e-06, "loss": 2.3684, "step": 6813 }, { "epoch": 0.68, "learning_rate": 4.8323374404702386e-06, "loss": 2.2809, "step": 6814 }, { "epoch": 0.68, "learning_rate": 4.829559486379218e-06, "loss": 2.304, "step": 6815 }, { "epoch": 0.68, "learning_rate": 4.826782076774359e-06, "loss": 2.3277, "step": 6816 }, { "epoch": 0.68, "learning_rate": 4.824005211948144e-06, "loss": 2.3217, "step": 6817 }, { "epoch": 0.68, "learning_rate": 4.821228892193e-06, "loss": 2.2931, "step": 6818 }, { "epoch": 0.68, "learning_rate": 4.818453117801289e-06, "loss": 2.2689, "step": 6819 }, { "epoch": 0.68, "learning_rate": 4.815677889065327e-06, "loss": 2.3481, "step": 6820 }, { "epoch": 0.68, "learning_rate": 4.812903206277364e-06, "loss": 2.2238, "step": 6821 }, { "epoch": 0.68, "learning_rate": 4.8101290697295954e-06, "loss": 2.2429, "step": 6822 }, { "epoch": 0.68, "learning_rate": 4.807355479714158e-06, "loss": 2.2739, "step": 6823 }, { "epoch": 0.68, "learning_rate": 4.804582436523132e-06, "loss": 2.2432, "step": 6824 }, { "epoch": 0.68, "learning_rate": 4.801809940448538e-06, "loss": 2.3726, "step": 6825 }, { "epoch": 0.68, "learning_rate": 4.799037991782343e-06, "loss": 2.3032, "step": 6826 }, { "epoch": 0.68, "learning_rate": 4.796266590816453e-06, "loss": 2.1713, "step": 6827 }, { "epoch": 0.68, "learning_rate": 4.793495737842716e-06, "loss": 2.337, "step": 6828 }, { "epoch": 0.68, "learning_rate": 4.790725433152927e-06, "loss": 2.3216, "step": 6829 }, { "epoch": 0.68, "learning_rate": 4.787955677038816e-06, "loss": 2.3518, "step": 6830 }, { "epoch": 0.68, "learning_rate": 4.78518646979206e-06, "loss": 2.3326, "step": 6831 }, { "epoch": 0.68, "learning_rate": 4.78241781170428e-06, "loss": 2.3044, "step": 6832 }, { "epoch": 0.68, "learning_rate": 4.779649703067033e-06, "loss": 2.2866, "step": 6833 }, { "epoch": 0.68, "learning_rate": 4.776882144171824e-06, "loss": 2.2099, "step": 6834 }, { "epoch": 0.68, "learning_rate": 4.774115135310096e-06, "loss": 2.3025, "step": 6835 }, { "epoch": 0.68, "learning_rate": 4.771348676773239e-06, "loss": 2.2598, "step": 6836 }, { "epoch": 0.69, "learning_rate": 4.768582768852573e-06, "loss": 2.3459, "step": 6837 }, { "epoch": 0.69, "learning_rate": 4.76581741183938e-06, "loss": 2.298, "step": 6838 }, { "epoch": 0.69, "learning_rate": 4.7630526060248685e-06, "loss": 2.3576, "step": 6839 }, { "epoch": 0.69, "learning_rate": 4.760288351700192e-06, "loss": 2.4532, "step": 6840 }, { "epoch": 0.69, "learning_rate": 4.757524649156448e-06, "loss": 2.3316, "step": 6841 }, { "epoch": 0.69, "learning_rate": 4.754761498684676e-06, "loss": 2.2506, "step": 6842 }, { "epoch": 0.69, "learning_rate": 4.751998900575856e-06, "loss": 2.4147, "step": 6843 }, { "epoch": 0.69, "learning_rate": 4.749236855120909e-06, "loss": 2.2301, "step": 6844 }, { "epoch": 0.69, "learning_rate": 4.746475362610696e-06, "loss": 2.2903, "step": 6845 }, { "epoch": 0.69, "learning_rate": 4.743714423336032e-06, "loss": 2.3169, "step": 6846 }, { "epoch": 0.69, "learning_rate": 4.74095403758766e-06, "loss": 2.3168, "step": 6847 }, { "epoch": 0.69, "learning_rate": 4.7381942056562666e-06, "loss": 2.2988, "step": 6848 }, { "epoch": 0.69, "learning_rate": 4.735434927832491e-06, "loss": 2.3264, "step": 6849 }, { "epoch": 0.69, "learning_rate": 4.732676204406895e-06, "loss": 2.2331, "step": 6850 }, { "epoch": 0.69, "learning_rate": 4.729918035669998e-06, "loss": 2.3457, "step": 6851 }, { "epoch": 0.69, "learning_rate": 4.727160421912256e-06, "loss": 2.3254, "step": 6852 }, { "epoch": 0.69, "learning_rate": 4.724403363424066e-06, "loss": 2.3475, "step": 6853 }, { "epoch": 0.69, "learning_rate": 4.721646860495763e-06, "loss": 2.2434, "step": 6854 }, { "epoch": 0.69, "learning_rate": 4.718890913417635e-06, "loss": 2.3299, "step": 6855 }, { "epoch": 0.69, "learning_rate": 4.716135522479901e-06, "loss": 2.3057, "step": 6856 }, { "epoch": 0.69, "learning_rate": 4.713380687972723e-06, "loss": 2.2231, "step": 6857 }, { "epoch": 0.69, "learning_rate": 4.710626410186208e-06, "loss": 2.3491, "step": 6858 }, { "epoch": 0.69, "learning_rate": 4.707872689410399e-06, "loss": 2.2888, "step": 6859 }, { "epoch": 0.69, "learning_rate": 4.705119525935284e-06, "loss": 2.2862, "step": 6860 }, { "epoch": 0.69, "learning_rate": 4.702366920050795e-06, "loss": 2.4374, "step": 6861 }, { "epoch": 0.69, "learning_rate": 4.699614872046798e-06, "loss": 2.3603, "step": 6862 }, { "epoch": 0.69, "learning_rate": 4.696863382213103e-06, "loss": 2.3093, "step": 6863 }, { "epoch": 0.69, "learning_rate": 4.694112450839469e-06, "loss": 2.344, "step": 6864 }, { "epoch": 0.69, "learning_rate": 4.691362078215586e-06, "loss": 2.3764, "step": 6865 }, { "epoch": 0.69, "learning_rate": 4.68861226463109e-06, "loss": 2.3101, "step": 6866 }, { "epoch": 0.69, "learning_rate": 4.685863010375556e-06, "loss": 2.2696, "step": 6867 }, { "epoch": 0.69, "learning_rate": 4.6831143157385005e-06, "loss": 2.2111, "step": 6868 }, { "epoch": 0.69, "learning_rate": 4.680366181009384e-06, "loss": 2.3419, "step": 6869 }, { "epoch": 0.69, "learning_rate": 4.677618606477602e-06, "loss": 2.3979, "step": 6870 }, { "epoch": 0.69, "learning_rate": 4.674871592432499e-06, "loss": 2.3214, "step": 6871 }, { "epoch": 0.69, "learning_rate": 4.6721251391633515e-06, "loss": 2.3833, "step": 6872 }, { "epoch": 0.69, "learning_rate": 4.669379246959386e-06, "loss": 2.3337, "step": 6873 }, { "epoch": 0.69, "learning_rate": 4.666633916109763e-06, "loss": 2.2499, "step": 6874 }, { "epoch": 0.69, "learning_rate": 4.6638891469035865e-06, "loss": 2.3742, "step": 6875 }, { "epoch": 0.69, "learning_rate": 4.661144939629903e-06, "loss": 2.3455, "step": 6876 }, { "epoch": 0.69, "learning_rate": 4.658401294577696e-06, "loss": 2.3648, "step": 6877 }, { "epoch": 0.69, "learning_rate": 4.655658212035893e-06, "loss": 2.3661, "step": 6878 }, { "epoch": 0.69, "learning_rate": 4.65291569229336e-06, "loss": 2.3121, "step": 6879 }, { "epoch": 0.69, "learning_rate": 4.650173735638908e-06, "loss": 2.3201, "step": 6880 }, { "epoch": 0.69, "learning_rate": 4.647432342361279e-06, "loss": 2.3685, "step": 6881 }, { "epoch": 0.69, "learning_rate": 4.64469151274917e-06, "loss": 2.2772, "step": 6882 }, { "epoch": 0.69, "learning_rate": 4.641951247091207e-06, "loss": 2.2797, "step": 6883 }, { "epoch": 0.69, "learning_rate": 4.639211545675963e-06, "loss": 2.2629, "step": 6884 }, { "epoch": 0.69, "learning_rate": 4.6364724087919464e-06, "loss": 2.218, "step": 6885 }, { "epoch": 0.69, "learning_rate": 4.6337338367276095e-06, "loss": 2.3276, "step": 6886 }, { "epoch": 0.69, "learning_rate": 4.630995829771346e-06, "loss": 2.1912, "step": 6887 }, { "epoch": 0.69, "learning_rate": 4.628258388211486e-06, "loss": 2.2647, "step": 6888 }, { "epoch": 0.69, "learning_rate": 4.625521512336304e-06, "loss": 2.4321, "step": 6889 }, { "epoch": 0.69, "learning_rate": 4.622785202434015e-06, "loss": 2.3209, "step": 6890 }, { "epoch": 0.69, "learning_rate": 4.620049458792771e-06, "loss": 2.299, "step": 6891 }, { "epoch": 0.69, "learning_rate": 4.617314281700664e-06, "loss": 2.3035, "step": 6892 }, { "epoch": 0.69, "learning_rate": 4.6145796714457345e-06, "loss": 2.3209, "step": 6893 }, { "epoch": 0.69, "learning_rate": 4.611845628315954e-06, "loss": 2.2038, "step": 6894 }, { "epoch": 0.69, "learning_rate": 4.609112152599237e-06, "loss": 2.3917, "step": 6895 }, { "epoch": 0.69, "learning_rate": 4.606379244583441e-06, "loss": 2.2363, "step": 6896 }, { "epoch": 0.69, "learning_rate": 4.60364690455636e-06, "loss": 2.3567, "step": 6897 }, { "epoch": 0.69, "learning_rate": 4.600915132805732e-06, "loss": 2.3212, "step": 6898 }, { "epoch": 0.69, "learning_rate": 4.598183929619228e-06, "loss": 2.2524, "step": 6899 }, { "epoch": 0.69, "learning_rate": 4.595453295284471e-06, "loss": 2.2938, "step": 6900 }, { "epoch": 0.69, "learning_rate": 4.5927232300890146e-06, "loss": 2.2184, "step": 6901 }, { "epoch": 0.69, "learning_rate": 4.589993734320353e-06, "loss": 2.419, "step": 6902 }, { "epoch": 0.69, "learning_rate": 4.587264808265928e-06, "loss": 2.3707, "step": 6903 }, { "epoch": 0.69, "learning_rate": 4.58453645221311e-06, "loss": 2.3523, "step": 6904 }, { "epoch": 0.69, "learning_rate": 4.581808666449218e-06, "loss": 2.2782, "step": 6905 }, { "epoch": 0.69, "learning_rate": 4.5790814512615075e-06, "loss": 2.3451, "step": 6906 }, { "epoch": 0.69, "learning_rate": 4.576354806937176e-06, "loss": 2.3028, "step": 6907 }, { "epoch": 0.69, "learning_rate": 4.573628733763356e-06, "loss": 2.3317, "step": 6908 }, { "epoch": 0.69, "learning_rate": 4.570903232027128e-06, "loss": 2.2807, "step": 6909 }, { "epoch": 0.69, "learning_rate": 4.568178302015507e-06, "loss": 2.3852, "step": 6910 }, { "epoch": 0.69, "learning_rate": 4.565453944015448e-06, "loss": 2.3111, "step": 6911 }, { "epoch": 0.69, "learning_rate": 4.562730158313845e-06, "loss": 2.4155, "step": 6912 }, { "epoch": 0.69, "learning_rate": 4.560006945197538e-06, "loss": 2.3154, "step": 6913 }, { "epoch": 0.69, "learning_rate": 4.557284304953294e-06, "loss": 2.2927, "step": 6914 }, { "epoch": 0.69, "learning_rate": 4.554562237867832e-06, "loss": 2.2671, "step": 6915 }, { "epoch": 0.69, "learning_rate": 4.551840744227804e-06, "loss": 2.3164, "step": 6916 }, { "epoch": 0.69, "learning_rate": 4.549119824319803e-06, "loss": 2.4179, "step": 6917 }, { "epoch": 0.69, "learning_rate": 4.546399478430367e-06, "loss": 2.3714, "step": 6918 }, { "epoch": 0.69, "learning_rate": 4.543679706845966e-06, "loss": 2.2914, "step": 6919 }, { "epoch": 0.69, "learning_rate": 4.540960509853012e-06, "loss": 2.3453, "step": 6920 }, { "epoch": 0.69, "learning_rate": 4.538241887737857e-06, "loss": 2.3142, "step": 6921 }, { "epoch": 0.69, "learning_rate": 4.535523840786794e-06, "loss": 2.308, "step": 6922 }, { "epoch": 0.69, "learning_rate": 4.532806369286051e-06, "loss": 2.2235, "step": 6923 }, { "epoch": 0.69, "learning_rate": 4.5300894735218005e-06, "loss": 2.5145, "step": 6924 }, { "epoch": 0.69, "learning_rate": 4.52737315378015e-06, "loss": 2.2629, "step": 6925 }, { "epoch": 0.69, "learning_rate": 4.524657410347145e-06, "loss": 2.3048, "step": 6926 }, { "epoch": 0.69, "learning_rate": 4.521942243508784e-06, "loss": 2.2477, "step": 6927 }, { "epoch": 0.69, "learning_rate": 4.519227653550986e-06, "loss": 2.2427, "step": 6928 }, { "epoch": 0.69, "learning_rate": 4.51651364075962e-06, "loss": 2.3371, "step": 6929 }, { "epoch": 0.69, "learning_rate": 4.513800205420493e-06, "loss": 2.2645, "step": 6930 }, { "epoch": 0.69, "learning_rate": 4.511087347819348e-06, "loss": 2.3891, "step": 6931 }, { "epoch": 0.69, "learning_rate": 4.508375068241872e-06, "loss": 2.3396, "step": 6932 }, { "epoch": 0.69, "learning_rate": 4.505663366973685e-06, "loss": 2.2507, "step": 6933 }, { "epoch": 0.69, "learning_rate": 4.502952244300352e-06, "loss": 2.2344, "step": 6934 }, { "epoch": 0.69, "learning_rate": 4.5002417005073725e-06, "loss": 2.3341, "step": 6935 }, { "epoch": 0.69, "learning_rate": 4.4975317358801885e-06, "loss": 2.2977, "step": 6936 }, { "epoch": 0.7, "learning_rate": 4.49482235070418e-06, "loss": 2.3359, "step": 6937 }, { "epoch": 0.7, "learning_rate": 4.492113545264665e-06, "loss": 2.3183, "step": 6938 }, { "epoch": 0.7, "learning_rate": 4.4894053198469e-06, "loss": 2.2752, "step": 6939 }, { "epoch": 0.7, "learning_rate": 4.486697674736084e-06, "loss": 2.2752, "step": 6940 }, { "epoch": 0.7, "learning_rate": 4.483990610217349e-06, "loss": 2.3215, "step": 6941 }, { "epoch": 0.7, "learning_rate": 4.481284126575772e-06, "loss": 2.3044, "step": 6942 }, { "epoch": 0.7, "learning_rate": 4.478578224096365e-06, "loss": 2.3051, "step": 6943 }, { "epoch": 0.7, "learning_rate": 4.475872903064076e-06, "loss": 2.3672, "step": 6944 }, { "epoch": 0.7, "learning_rate": 4.473168163763802e-06, "loss": 2.3146, "step": 6945 }, { "epoch": 0.7, "learning_rate": 4.470464006480371e-06, "loss": 2.3077, "step": 6946 }, { "epoch": 0.7, "learning_rate": 4.467760431498549e-06, "loss": 2.3479, "step": 6947 }, { "epoch": 0.7, "learning_rate": 4.465057439103044e-06, "loss": 2.2608, "step": 6948 }, { "epoch": 0.7, "learning_rate": 4.4623550295785e-06, "loss": 2.3559, "step": 6949 }, { "epoch": 0.7, "learning_rate": 4.459653203209503e-06, "loss": 2.3183, "step": 6950 }, { "epoch": 0.7, "learning_rate": 4.456951960280573e-06, "loss": 2.2791, "step": 6951 }, { "epoch": 0.7, "learning_rate": 4.454251301076175e-06, "loss": 2.3322, "step": 6952 }, { "epoch": 0.7, "learning_rate": 4.451551225880704e-06, "loss": 2.3834, "step": 6953 }, { "epoch": 0.7, "learning_rate": 4.448851734978501e-06, "loss": 2.3336, "step": 6954 }, { "epoch": 0.7, "learning_rate": 4.446152828653841e-06, "loss": 2.361, "step": 6955 }, { "epoch": 0.7, "learning_rate": 4.443454507190942e-06, "loss": 2.2755, "step": 6956 }, { "epoch": 0.7, "learning_rate": 4.440756770873954e-06, "loss": 2.3203, "step": 6957 }, { "epoch": 0.7, "learning_rate": 4.438059619986972e-06, "loss": 2.3277, "step": 6958 }, { "epoch": 0.7, "learning_rate": 4.435363054814024e-06, "loss": 2.3622, "step": 6959 }, { "epoch": 0.7, "learning_rate": 4.432667075639079e-06, "loss": 2.3367, "step": 6960 }, { "epoch": 0.7, "learning_rate": 4.429971682746044e-06, "loss": 2.2556, "step": 6961 }, { "epoch": 0.7, "learning_rate": 4.42727687641876e-06, "loss": 2.3228, "step": 6962 }, { "epoch": 0.7, "learning_rate": 4.424582656941019e-06, "loss": 2.3375, "step": 6963 }, { "epoch": 0.7, "learning_rate": 4.421889024596537e-06, "loss": 2.2512, "step": 6964 }, { "epoch": 0.7, "learning_rate": 4.4191959796689755e-06, "loss": 2.3379, "step": 6965 }, { "epoch": 0.7, "learning_rate": 4.416503522441931e-06, "loss": 2.2164, "step": 6966 }, { "epoch": 0.7, "learning_rate": 4.413811653198939e-06, "loss": 2.3307, "step": 6967 }, { "epoch": 0.7, "learning_rate": 4.411120372223477e-06, "loss": 2.338, "step": 6968 }, { "epoch": 0.7, "learning_rate": 4.408429679798953e-06, "loss": 2.2407, "step": 6969 }, { "epoch": 0.7, "learning_rate": 4.405739576208717e-06, "loss": 2.3869, "step": 6970 }, { "epoch": 0.7, "learning_rate": 4.4030500617360575e-06, "loss": 2.2641, "step": 6971 }, { "epoch": 0.7, "learning_rate": 4.400361136664204e-06, "loss": 2.4108, "step": 6972 }, { "epoch": 0.7, "learning_rate": 4.397672801276318e-06, "loss": 2.3619, "step": 6973 }, { "epoch": 0.7, "learning_rate": 4.394985055855503e-06, "loss": 2.3195, "step": 6974 }, { "epoch": 0.7, "learning_rate": 4.392297900684796e-06, "loss": 2.25, "step": 6975 }, { "epoch": 0.7, "learning_rate": 4.389611336047177e-06, "loss": 2.2421, "step": 6976 }, { "epoch": 0.7, "learning_rate": 4.386925362225563e-06, "loss": 2.4125, "step": 6977 }, { "epoch": 0.7, "learning_rate": 4.384239979502801e-06, "loss": 2.2902, "step": 6978 }, { "epoch": 0.7, "learning_rate": 4.381555188161686e-06, "loss": 2.3365, "step": 6979 }, { "epoch": 0.7, "learning_rate": 4.378870988484942e-06, "loss": 2.2939, "step": 6980 }, { "epoch": 0.7, "learning_rate": 4.3761873807552435e-06, "loss": 2.3282, "step": 6981 }, { "epoch": 0.7, "learning_rate": 4.37350436525519e-06, "loss": 2.3477, "step": 6982 }, { "epoch": 0.7, "learning_rate": 4.3708219422673235e-06, "loss": 2.3694, "step": 6983 }, { "epoch": 0.7, "learning_rate": 4.368140112074124e-06, "loss": 2.2537, "step": 6984 }, { "epoch": 0.7, "learning_rate": 4.3654588749580075e-06, "loss": 2.2504, "step": 6985 }, { "epoch": 0.7, "learning_rate": 4.362778231201328e-06, "loss": 2.3855, "step": 6986 }, { "epoch": 0.7, "learning_rate": 4.360098181086379e-06, "loss": 2.3237, "step": 6987 }, { "epoch": 0.7, "learning_rate": 4.357418724895388e-06, "loss": 2.3192, "step": 6988 }, { "epoch": 0.7, "learning_rate": 4.35473986291052e-06, "loss": 2.292, "step": 6989 }, { "epoch": 0.7, "learning_rate": 4.352061595413885e-06, "loss": 2.2854, "step": 6990 }, { "epoch": 0.7, "learning_rate": 4.3493839226875215e-06, "loss": 2.2437, "step": 6991 }, { "epoch": 0.7, "learning_rate": 4.346706845013409e-06, "loss": 2.2956, "step": 6992 }, { "epoch": 0.7, "learning_rate": 4.344030362673462e-06, "loss": 2.1386, "step": 6993 }, { "epoch": 0.7, "learning_rate": 4.341354475949537e-06, "loss": 2.2486, "step": 6994 }, { "epoch": 0.7, "learning_rate": 4.338679185123424e-06, "loss": 2.3107, "step": 6995 }, { "epoch": 0.7, "learning_rate": 4.33600449047685e-06, "loss": 2.3577, "step": 6996 }, { "epoch": 0.7, "learning_rate": 4.333330392291482e-06, "loss": 2.3294, "step": 6997 }, { "epoch": 0.7, "learning_rate": 4.330656890848921e-06, "loss": 2.3556, "step": 6998 }, { "epoch": 0.7, "learning_rate": 4.327983986430709e-06, "loss": 2.2489, "step": 6999 }, { "epoch": 0.7, "learning_rate": 4.325311679318319e-06, "loss": 2.231, "step": 7000 }, { "epoch": 0.7, "learning_rate": 4.322639969793169e-06, "loss": 2.2464, "step": 7001 }, { "epoch": 0.7, "learning_rate": 4.319968858136607e-06, "loss": 2.3375, "step": 7002 }, { "epoch": 0.7, "learning_rate": 4.317298344629924e-06, "loss": 2.2997, "step": 7003 }, { "epoch": 0.7, "learning_rate": 4.314628429554343e-06, "loss": 2.3496, "step": 7004 }, { "epoch": 0.7, "learning_rate": 4.311959113191027e-06, "loss": 2.2619, "step": 7005 }, { "epoch": 0.7, "learning_rate": 4.309290395821075e-06, "loss": 2.3824, "step": 7006 }, { "epoch": 0.7, "learning_rate": 4.306622277725518e-06, "loss": 2.3804, "step": 7007 }, { "epoch": 0.7, "learning_rate": 4.303954759185338e-06, "loss": 2.2894, "step": 7008 }, { "epoch": 0.7, "learning_rate": 4.3012878404814406e-06, "loss": 2.33, "step": 7009 }, { "epoch": 0.7, "learning_rate": 4.298621521894671e-06, "loss": 2.2959, "step": 7010 }, { "epoch": 0.7, "learning_rate": 4.295955803705815e-06, "loss": 2.3732, "step": 7011 }, { "epoch": 0.7, "learning_rate": 4.2932906861955896e-06, "loss": 2.2907, "step": 7012 }, { "epoch": 0.7, "learning_rate": 4.2906261696446535e-06, "loss": 2.3205, "step": 7013 }, { "epoch": 0.7, "learning_rate": 4.2879622543336005e-06, "loss": 2.3728, "step": 7014 }, { "epoch": 0.7, "learning_rate": 4.285298940542958e-06, "loss": 2.3416, "step": 7015 }, { "epoch": 0.7, "learning_rate": 4.282636228553201e-06, "loss": 2.3182, "step": 7016 }, { "epoch": 0.7, "learning_rate": 4.279974118644724e-06, "loss": 2.2845, "step": 7017 }, { "epoch": 0.7, "learning_rate": 4.277312611097871e-06, "loss": 2.3596, "step": 7018 }, { "epoch": 0.7, "learning_rate": 4.274651706192918e-06, "loss": 2.2815, "step": 7019 }, { "epoch": 0.7, "learning_rate": 4.271991404210078e-06, "loss": 2.2999, "step": 7020 }, { "epoch": 0.7, "learning_rate": 4.2693317054295025e-06, "loss": 2.3136, "step": 7021 }, { "epoch": 0.7, "learning_rate": 4.266672610131276e-06, "loss": 2.2742, "step": 7022 }, { "epoch": 0.7, "learning_rate": 4.264014118595422e-06, "loss": 2.3538, "step": 7023 }, { "epoch": 0.7, "learning_rate": 4.261356231101894e-06, "loss": 2.3517, "step": 7024 }, { "epoch": 0.7, "learning_rate": 4.258698947930599e-06, "loss": 2.3462, "step": 7025 }, { "epoch": 0.7, "learning_rate": 4.25604226936136e-06, "loss": 2.2532, "step": 7026 }, { "epoch": 0.7, "learning_rate": 4.253386195673948e-06, "loss": 2.2915, "step": 7027 }, { "epoch": 0.7, "learning_rate": 4.250730727148069e-06, "loss": 2.2309, "step": 7028 }, { "epoch": 0.7, "learning_rate": 4.248075864063361e-06, "loss": 2.3089, "step": 7029 }, { "epoch": 0.7, "learning_rate": 4.245421606699402e-06, "loss": 2.2818, "step": 7030 }, { "epoch": 0.7, "learning_rate": 4.242767955335705e-06, "loss": 2.3371, "step": 7031 }, { "epoch": 0.7, "learning_rate": 4.24011491025172e-06, "loss": 2.336, "step": 7032 }, { "epoch": 0.7, "learning_rate": 4.2374624717268275e-06, "loss": 2.3262, "step": 7033 }, { "epoch": 0.7, "learning_rate": 4.234810640040359e-06, "loss": 2.3266, "step": 7034 }, { "epoch": 0.7, "learning_rate": 4.232159415471566e-06, "loss": 2.3601, "step": 7035 }, { "epoch": 0.7, "learning_rate": 4.229508798299643e-06, "loss": 2.2532, "step": 7036 }, { "epoch": 0.71, "learning_rate": 4.226858788803722e-06, "loss": 2.3321, "step": 7037 }, { "epoch": 0.71, "learning_rate": 4.224209387262865e-06, "loss": 2.2702, "step": 7038 }, { "epoch": 0.71, "learning_rate": 4.2215605939560775e-06, "loss": 2.3043, "step": 7039 }, { "epoch": 0.71, "learning_rate": 4.218912409162295e-06, "loss": 2.4261, "step": 7040 }, { "epoch": 0.71, "learning_rate": 4.216264833160396e-06, "loss": 2.3224, "step": 7041 }, { "epoch": 0.71, "learning_rate": 4.213617866229178e-06, "loss": 2.3933, "step": 7042 }, { "epoch": 0.71, "learning_rate": 4.210971508647399e-06, "loss": 2.3216, "step": 7043 }, { "epoch": 0.71, "learning_rate": 4.208325760693736e-06, "loss": 2.3202, "step": 7044 }, { "epoch": 0.71, "learning_rate": 4.205680622646806e-06, "loss": 2.3758, "step": 7045 }, { "epoch": 0.71, "learning_rate": 4.2030360947851615e-06, "loss": 2.2928, "step": 7046 }, { "epoch": 0.71, "learning_rate": 4.200392177387291e-06, "loss": 2.2813, "step": 7047 }, { "epoch": 0.71, "learning_rate": 4.1977488707316206e-06, "loss": 2.3849, "step": 7048 }, { "epoch": 0.71, "learning_rate": 4.195106175096508e-06, "loss": 2.3256, "step": 7049 }, { "epoch": 0.71, "learning_rate": 4.19246409076025e-06, "loss": 2.2547, "step": 7050 }, { "epoch": 0.71, "learning_rate": 4.189822618001075e-06, "loss": 2.4066, "step": 7051 }, { "epoch": 0.71, "learning_rate": 4.187181757097155e-06, "loss": 2.3608, "step": 7052 }, { "epoch": 0.71, "learning_rate": 4.18454150832659e-06, "loss": 2.2662, "step": 7053 }, { "epoch": 0.71, "learning_rate": 4.1819018719674195e-06, "loss": 2.3148, "step": 7054 }, { "epoch": 0.71, "learning_rate": 4.179262848297615e-06, "loss": 2.263, "step": 7055 }, { "epoch": 0.71, "learning_rate": 4.176624437595086e-06, "loss": 2.2927, "step": 7056 }, { "epoch": 0.71, "learning_rate": 4.173986640137678e-06, "loss": 2.4111, "step": 7057 }, { "epoch": 0.71, "learning_rate": 4.1713494562031685e-06, "loss": 2.2142, "step": 7058 }, { "epoch": 0.71, "learning_rate": 4.1687128860692745e-06, "loss": 2.3349, "step": 7059 }, { "epoch": 0.71, "learning_rate": 4.166076930013647e-06, "loss": 2.3123, "step": 7060 }, { "epoch": 0.71, "learning_rate": 4.16344158831387e-06, "loss": 2.2808, "step": 7061 }, { "epoch": 0.71, "learning_rate": 4.160806861247467e-06, "loss": 2.2707, "step": 7062 }, { "epoch": 0.71, "learning_rate": 4.158172749091893e-06, "loss": 2.2483, "step": 7063 }, { "epoch": 0.71, "learning_rate": 4.155539252124541e-06, "loss": 2.3698, "step": 7064 }, { "epoch": 0.71, "learning_rate": 4.152906370622736e-06, "loss": 2.3568, "step": 7065 }, { "epoch": 0.71, "learning_rate": 4.1502741048637415e-06, "loss": 2.3322, "step": 7066 }, { "epoch": 0.71, "learning_rate": 4.1476424551247555e-06, "loss": 2.3362, "step": 7067 }, { "epoch": 0.71, "learning_rate": 4.145011421682909e-06, "loss": 2.2556, "step": 7068 }, { "epoch": 0.71, "learning_rate": 4.142381004815267e-06, "loss": 2.2395, "step": 7069 }, { "epoch": 0.71, "learning_rate": 4.139751204798839e-06, "loss": 2.3861, "step": 7070 }, { "epoch": 0.71, "learning_rate": 4.137122021910559e-06, "loss": 2.3475, "step": 7071 }, { "epoch": 0.71, "learning_rate": 4.1344934564272984e-06, "loss": 2.2385, "step": 7072 }, { "epoch": 0.71, "learning_rate": 4.131865508625868e-06, "loss": 2.3298, "step": 7073 }, { "epoch": 0.71, "learning_rate": 4.129238178783007e-06, "loss": 2.3205, "step": 7074 }, { "epoch": 0.71, "learning_rate": 4.126611467175396e-06, "loss": 2.3209, "step": 7075 }, { "epoch": 0.71, "learning_rate": 4.123985374079644e-06, "loss": 2.3648, "step": 7076 }, { "epoch": 0.71, "learning_rate": 4.121359899772302e-06, "loss": 2.248, "step": 7077 }, { "epoch": 0.71, "learning_rate": 4.118735044529846e-06, "loss": 2.2964, "step": 7078 }, { "epoch": 0.71, "learning_rate": 4.116110808628701e-06, "loss": 2.3102, "step": 7079 }, { "epoch": 0.71, "learning_rate": 4.113487192345219e-06, "loss": 2.2752, "step": 7080 }, { "epoch": 0.71, "learning_rate": 4.110864195955678e-06, "loss": 2.3276, "step": 7081 }, { "epoch": 0.71, "learning_rate": 4.108241819736304e-06, "loss": 2.2743, "step": 7082 }, { "epoch": 0.71, "learning_rate": 4.105620063963252e-06, "loss": 2.373, "step": 7083 }, { "epoch": 0.71, "learning_rate": 4.102998928912615e-06, "loss": 2.2649, "step": 7084 }, { "epoch": 0.71, "learning_rate": 4.100378414860416e-06, "loss": 2.2915, "step": 7085 }, { "epoch": 0.71, "learning_rate": 4.097758522082613e-06, "loss": 2.2808, "step": 7086 }, { "epoch": 0.71, "learning_rate": 4.0951392508551e-06, "loss": 2.3065, "step": 7087 }, { "epoch": 0.71, "learning_rate": 4.092520601453712e-06, "loss": 2.3832, "step": 7088 }, { "epoch": 0.71, "learning_rate": 4.089902574154209e-06, "loss": 2.208, "step": 7089 }, { "epoch": 0.71, "learning_rate": 4.087285169232288e-06, "loss": 2.2645, "step": 7090 }, { "epoch": 0.71, "learning_rate": 4.084668386963582e-06, "loss": 2.2768, "step": 7091 }, { "epoch": 0.71, "learning_rate": 4.082052227623658e-06, "loss": 2.2901, "step": 7092 }, { "epoch": 0.71, "learning_rate": 4.079436691488017e-06, "loss": 2.3769, "step": 7093 }, { "epoch": 0.71, "learning_rate": 4.076821778832095e-06, "loss": 2.3427, "step": 7094 }, { "epoch": 0.71, "learning_rate": 4.074207489931261e-06, "loss": 2.3736, "step": 7095 }, { "epoch": 0.71, "learning_rate": 4.071593825060817e-06, "loss": 2.2749, "step": 7096 }, { "epoch": 0.71, "learning_rate": 4.0689807844960065e-06, "loss": 2.2397, "step": 7097 }, { "epoch": 0.71, "learning_rate": 4.066368368512e-06, "loss": 2.3028, "step": 7098 }, { "epoch": 0.71, "learning_rate": 4.063756577383906e-06, "loss": 2.3102, "step": 7099 }, { "epoch": 0.71, "learning_rate": 4.061145411386763e-06, "loss": 2.3037, "step": 7100 }, { "epoch": 0.71, "learning_rate": 4.0585348707955484e-06, "loss": 2.3352, "step": 7101 }, { "epoch": 0.71, "learning_rate": 4.05592495588517e-06, "loss": 2.2663, "step": 7102 }, { "epoch": 0.71, "learning_rate": 4.053315666930473e-06, "loss": 2.368, "step": 7103 }, { "epoch": 0.71, "learning_rate": 4.050707004206234e-06, "loss": 2.2909, "step": 7104 }, { "epoch": 0.71, "learning_rate": 4.048098967987165e-06, "loss": 2.3097, "step": 7105 }, { "epoch": 0.71, "learning_rate": 4.045491558547912e-06, "loss": 2.3914, "step": 7106 }, { "epoch": 0.71, "learning_rate": 4.042884776163055e-06, "loss": 2.3409, "step": 7107 }, { "epoch": 0.71, "learning_rate": 4.040278621107108e-06, "loss": 2.2886, "step": 7108 }, { "epoch": 0.71, "learning_rate": 4.037673093654516e-06, "loss": 2.2383, "step": 7109 }, { "epoch": 0.71, "learning_rate": 4.0350681940796645e-06, "loss": 2.1724, "step": 7110 }, { "epoch": 0.71, "learning_rate": 4.0324639226568666e-06, "loss": 2.4345, "step": 7111 }, { "epoch": 0.71, "learning_rate": 4.029860279660371e-06, "loss": 2.2966, "step": 7112 }, { "epoch": 0.71, "learning_rate": 4.027257265364364e-06, "loss": 2.2957, "step": 7113 }, { "epoch": 0.71, "learning_rate": 4.024654880042955e-06, "loss": 2.3794, "step": 7114 }, { "epoch": 0.71, "learning_rate": 4.022053123970205e-06, "loss": 2.2347, "step": 7115 }, { "epoch": 0.71, "learning_rate": 4.019451997420093e-06, "loss": 2.3168, "step": 7116 }, { "epoch": 0.71, "learning_rate": 4.016851500666539e-06, "loss": 2.3004, "step": 7117 }, { "epoch": 0.71, "learning_rate": 4.014251633983392e-06, "loss": 2.2529, "step": 7118 }, { "epoch": 0.71, "learning_rate": 4.011652397644439e-06, "loss": 2.3064, "step": 7119 }, { "epoch": 0.71, "learning_rate": 4.0090537919234e-06, "loss": 2.2437, "step": 7120 }, { "epoch": 0.71, "learning_rate": 4.0064558170939264e-06, "loss": 2.3999, "step": 7121 }, { "epoch": 0.71, "learning_rate": 4.003858473429605e-06, "loss": 2.2337, "step": 7122 }, { "epoch": 0.71, "learning_rate": 4.001261761203955e-06, "loss": 2.2592, "step": 7123 }, { "epoch": 0.71, "learning_rate": 3.99866568069043e-06, "loss": 2.2904, "step": 7124 }, { "epoch": 0.71, "learning_rate": 3.996070232162417e-06, "loss": 2.3637, "step": 7125 }, { "epoch": 0.71, "learning_rate": 3.9934754158932355e-06, "loss": 2.3954, "step": 7126 }, { "epoch": 0.71, "learning_rate": 3.990881232156141e-06, "loss": 2.2882, "step": 7127 }, { "epoch": 0.71, "learning_rate": 3.988287681224317e-06, "loss": 2.1912, "step": 7128 }, { "epoch": 0.71, "learning_rate": 3.985694763370887e-06, "loss": 2.3528, "step": 7129 }, { "epoch": 0.71, "learning_rate": 3.983102478868904e-06, "loss": 2.2765, "step": 7130 }, { "epoch": 0.71, "learning_rate": 3.980510827991354e-06, "loss": 2.3917, "step": 7131 }, { "epoch": 0.71, "learning_rate": 3.977919811011155e-06, "loss": 2.3176, "step": 7132 }, { "epoch": 0.71, "learning_rate": 3.975329428201166e-06, "loss": 2.3308, "step": 7133 }, { "epoch": 0.71, "learning_rate": 3.972739679834173e-06, "loss": 2.2271, "step": 7134 }, { "epoch": 0.71, "learning_rate": 3.970150566182893e-06, "loss": 2.3324, "step": 7135 }, { "epoch": 0.71, "learning_rate": 3.96756208751998e-06, "loss": 2.3117, "step": 7136 }, { "epoch": 0.72, "learning_rate": 3.964974244118021e-06, "loss": 2.3082, "step": 7137 }, { "epoch": 0.72, "learning_rate": 3.962387036249535e-06, "loss": 2.2941, "step": 7138 }, { "epoch": 0.72, "learning_rate": 3.959800464186972e-06, "loss": 2.2753, "step": 7139 }, { "epoch": 0.72, "learning_rate": 3.957214528202722e-06, "loss": 2.342, "step": 7140 }, { "epoch": 0.72, "learning_rate": 3.954629228569096e-06, "loss": 2.3531, "step": 7141 }, { "epoch": 0.72, "learning_rate": 3.952044565558354e-06, "loss": 2.3035, "step": 7142 }, { "epoch": 0.72, "learning_rate": 3.949460539442677e-06, "loss": 2.1427, "step": 7143 }, { "epoch": 0.72, "learning_rate": 3.946877150494186e-06, "loss": 2.2501, "step": 7144 }, { "epoch": 0.72, "learning_rate": 3.944294398984925e-06, "loss": 2.3647, "step": 7145 }, { "epoch": 0.72, "learning_rate": 3.941712285186879e-06, "loss": 2.3508, "step": 7146 }, { "epoch": 0.72, "learning_rate": 3.939130809371963e-06, "loss": 2.2385, "step": 7147 }, { "epoch": 0.72, "learning_rate": 3.936549971812028e-06, "loss": 2.3426, "step": 7148 }, { "epoch": 0.72, "learning_rate": 3.933969772778855e-06, "loss": 2.3007, "step": 7149 }, { "epoch": 0.72, "learning_rate": 3.931390212544154e-06, "loss": 2.2937, "step": 7150 }, { "epoch": 0.72, "learning_rate": 3.928811291379579e-06, "loss": 2.3229, "step": 7151 }, { "epoch": 0.72, "learning_rate": 3.926233009556709e-06, "loss": 2.2819, "step": 7152 }, { "epoch": 0.72, "learning_rate": 3.923655367347054e-06, "loss": 2.2125, "step": 7153 }, { "epoch": 0.72, "learning_rate": 3.921078365022057e-06, "loss": 2.3479, "step": 7154 }, { "epoch": 0.72, "learning_rate": 3.9185020028530995e-06, "loss": 2.2462, "step": 7155 }, { "epoch": 0.72, "learning_rate": 3.915926281111491e-06, "loss": 2.3009, "step": 7156 }, { "epoch": 0.72, "learning_rate": 3.913351200068473e-06, "loss": 2.2935, "step": 7157 }, { "epoch": 0.72, "learning_rate": 3.9107767599952205e-06, "loss": 2.3712, "step": 7158 }, { "epoch": 0.72, "learning_rate": 3.908202961162839e-06, "loss": 2.303, "step": 7159 }, { "epoch": 0.72, "learning_rate": 3.905629803842377e-06, "loss": 2.3674, "step": 7160 }, { "epoch": 0.72, "learning_rate": 3.9030572883048014e-06, "loss": 2.3008, "step": 7161 }, { "epoch": 0.72, "learning_rate": 3.900485414821018e-06, "loss": 2.2852, "step": 7162 }, { "epoch": 0.72, "learning_rate": 3.897914183661865e-06, "loss": 2.341, "step": 7163 }, { "epoch": 0.72, "learning_rate": 3.895343595098112e-06, "loss": 2.376, "step": 7164 }, { "epoch": 0.72, "learning_rate": 3.892773649400462e-06, "loss": 2.25, "step": 7165 }, { "epoch": 0.72, "learning_rate": 3.890204346839548e-06, "loss": 2.3467, "step": 7166 }, { "epoch": 0.72, "learning_rate": 3.887635687685938e-06, "loss": 2.2107, "step": 7167 }, { "epoch": 0.72, "learning_rate": 3.88506767221013e-06, "loss": 2.2743, "step": 7168 }, { "epoch": 0.72, "learning_rate": 3.8825003006825564e-06, "loss": 2.4392, "step": 7169 }, { "epoch": 0.72, "learning_rate": 3.879933573373581e-06, "loss": 2.3092, "step": 7170 }, { "epoch": 0.72, "learning_rate": 3.877367490553498e-06, "loss": 2.3436, "step": 7171 }, { "epoch": 0.72, "learning_rate": 3.874802052492535e-06, "loss": 2.2966, "step": 7172 }, { "epoch": 0.72, "learning_rate": 3.872237259460855e-06, "loss": 2.3388, "step": 7173 }, { "epoch": 0.72, "learning_rate": 3.8696731117285465e-06, "loss": 2.3211, "step": 7174 }, { "epoch": 0.72, "learning_rate": 3.8671096095656344e-06, "loss": 2.3783, "step": 7175 }, { "epoch": 0.72, "learning_rate": 3.864546753242076e-06, "loss": 2.3012, "step": 7176 }, { "epoch": 0.72, "learning_rate": 3.861984543027754e-06, "loss": 2.3531, "step": 7177 }, { "epoch": 0.72, "learning_rate": 3.859422979192496e-06, "loss": 2.2291, "step": 7178 }, { "epoch": 0.72, "learning_rate": 3.8568620620060505e-06, "loss": 2.2542, "step": 7179 }, { "epoch": 0.72, "learning_rate": 3.854301791738102e-06, "loss": 2.4081, "step": 7180 }, { "epoch": 0.72, "learning_rate": 3.8517421686582644e-06, "loss": 2.3363, "step": 7181 }, { "epoch": 0.72, "learning_rate": 3.849183193036088e-06, "loss": 2.3648, "step": 7182 }, { "epoch": 0.72, "learning_rate": 3.846624865141048e-06, "loss": 2.314, "step": 7183 }, { "epoch": 0.72, "learning_rate": 3.844067185242561e-06, "loss": 2.3112, "step": 7184 }, { "epoch": 0.72, "learning_rate": 3.841510153609964e-06, "loss": 2.3129, "step": 7185 }, { "epoch": 0.72, "learning_rate": 3.838953770512536e-06, "loss": 2.2584, "step": 7186 }, { "epoch": 0.72, "learning_rate": 3.836398036219481e-06, "loss": 2.3506, "step": 7187 }, { "epoch": 0.72, "learning_rate": 3.833842950999937e-06, "loss": 2.3361, "step": 7188 }, { "epoch": 0.72, "learning_rate": 3.8312885151229765e-06, "loss": 2.3658, "step": 7189 }, { "epoch": 0.72, "learning_rate": 3.828734728857596e-06, "loss": 2.3658, "step": 7190 }, { "epoch": 0.72, "learning_rate": 3.826181592472733e-06, "loss": 2.2709, "step": 7191 }, { "epoch": 0.72, "learning_rate": 3.8236291062372485e-06, "loss": 2.386, "step": 7192 }, { "epoch": 0.72, "learning_rate": 3.821077270419941e-06, "loss": 2.3036, "step": 7193 }, { "epoch": 0.72, "learning_rate": 3.818526085289532e-06, "loss": 2.2758, "step": 7194 }, { "epoch": 0.72, "learning_rate": 3.815975551114689e-06, "loss": 2.3427, "step": 7195 }, { "epoch": 0.72, "learning_rate": 3.8134256681639993e-06, "loss": 2.4262, "step": 7196 }, { "epoch": 0.72, "learning_rate": 3.8108764367059836e-06, "loss": 2.242, "step": 7197 }, { "epoch": 0.72, "learning_rate": 3.8083278570090943e-06, "loss": 2.2986, "step": 7198 }, { "epoch": 0.72, "learning_rate": 3.8057799293417185e-06, "loss": 2.314, "step": 7199 }, { "epoch": 0.72, "learning_rate": 3.80323265397217e-06, "loss": 2.2673, "step": 7200 }, { "epoch": 0.72, "learning_rate": 3.8006860311686965e-06, "loss": 2.2669, "step": 7201 }, { "epoch": 0.72, "learning_rate": 3.7981400611994767e-06, "loss": 2.3447, "step": 7202 }, { "epoch": 0.72, "learning_rate": 3.795594744332618e-06, "loss": 2.2087, "step": 7203 }, { "epoch": 0.72, "learning_rate": 3.793050080836166e-06, "loss": 2.3017, "step": 7204 }, { "epoch": 0.72, "learning_rate": 3.7905060709780907e-06, "loss": 2.3393, "step": 7205 }, { "epoch": 0.72, "learning_rate": 3.7879627150262952e-06, "loss": 2.2916, "step": 7206 }, { "epoch": 0.72, "learning_rate": 3.785420013248614e-06, "loss": 2.4476, "step": 7207 }, { "epoch": 0.72, "learning_rate": 3.7828779659128155e-06, "loss": 2.3335, "step": 7208 }, { "epoch": 0.72, "learning_rate": 3.7803365732865915e-06, "loss": 2.2223, "step": 7209 }, { "epoch": 0.72, "learning_rate": 3.77779583563757e-06, "loss": 2.3875, "step": 7210 }, { "epoch": 0.72, "learning_rate": 3.7752557532333123e-06, "loss": 2.4322, "step": 7211 }, { "epoch": 0.72, "learning_rate": 3.7727163263413035e-06, "loss": 2.3205, "step": 7212 }, { "epoch": 0.72, "learning_rate": 3.770177555228972e-06, "loss": 2.2777, "step": 7213 }, { "epoch": 0.72, "learning_rate": 3.767639440163665e-06, "loss": 2.2041, "step": 7214 }, { "epoch": 0.72, "learning_rate": 3.7651019814126656e-06, "loss": 2.3552, "step": 7215 }, { "epoch": 0.72, "learning_rate": 3.762565179243187e-06, "loss": 2.3369, "step": 7216 }, { "epoch": 0.72, "learning_rate": 3.7600290339223746e-06, "loss": 2.2896, "step": 7217 }, { "epoch": 0.72, "learning_rate": 3.757493545717301e-06, "loss": 2.265, "step": 7218 }, { "epoch": 0.72, "learning_rate": 3.754958714894975e-06, "loss": 2.3977, "step": 7219 }, { "epoch": 0.72, "learning_rate": 3.7524245417223313e-06, "loss": 2.3589, "step": 7220 }, { "epoch": 0.72, "learning_rate": 3.7498910264662346e-06, "loss": 2.252, "step": 7221 }, { "epoch": 0.72, "learning_rate": 3.74735816939349e-06, "loss": 2.2751, "step": 7222 }, { "epoch": 0.72, "learning_rate": 3.7448259707708234e-06, "loss": 2.2726, "step": 7223 }, { "epoch": 0.72, "learning_rate": 3.7422944308648935e-06, "loss": 2.3145, "step": 7224 }, { "epoch": 0.72, "learning_rate": 3.7397635499422903e-06, "loss": 2.3682, "step": 7225 }, { "epoch": 0.72, "learning_rate": 3.737233328269535e-06, "loss": 2.285, "step": 7226 }, { "epoch": 0.72, "learning_rate": 3.7347037661130792e-06, "loss": 2.2601, "step": 7227 }, { "epoch": 0.72, "learning_rate": 3.732174863739304e-06, "loss": 2.2518, "step": 7228 }, { "epoch": 0.72, "learning_rate": 3.7296466214145234e-06, "loss": 2.3786, "step": 7229 }, { "epoch": 0.72, "learning_rate": 3.727119039404977e-06, "loss": 2.4028, "step": 7230 }, { "epoch": 0.72, "learning_rate": 3.724592117976842e-06, "loss": 2.2413, "step": 7231 }, { "epoch": 0.72, "learning_rate": 3.72206585739622e-06, "loss": 2.2534, "step": 7232 }, { "epoch": 0.72, "learning_rate": 3.719540257929145e-06, "loss": 2.3095, "step": 7233 }, { "epoch": 0.72, "learning_rate": 3.7170153198415826e-06, "loss": 2.3434, "step": 7234 }, { "epoch": 0.72, "learning_rate": 3.7144910433994264e-06, "loss": 2.3046, "step": 7235 }, { "epoch": 0.72, "learning_rate": 3.7119674288685037e-06, "loss": 2.365, "step": 7236 }, { "epoch": 0.73, "learning_rate": 3.7094444765145674e-06, "loss": 2.3883, "step": 7237 }, { "epoch": 0.73, "learning_rate": 3.7069221866033067e-06, "loss": 2.3557, "step": 7238 }, { "epoch": 0.73, "learning_rate": 3.7044005594003307e-06, "loss": 2.2944, "step": 7239 }, { "epoch": 0.73, "learning_rate": 3.701879595171195e-06, "loss": 2.1854, "step": 7240 }, { "epoch": 0.73, "learning_rate": 3.6993592941813705e-06, "loss": 2.3605, "step": 7241 }, { "epoch": 0.73, "learning_rate": 3.696839656696266e-06, "loss": 2.3112, "step": 7242 }, { "epoch": 0.73, "learning_rate": 3.694320682981217e-06, "loss": 2.2851, "step": 7243 }, { "epoch": 0.73, "learning_rate": 3.6918023733014908e-06, "loss": 2.1924, "step": 7244 }, { "epoch": 0.73, "learning_rate": 3.689284727922283e-06, "loss": 2.154, "step": 7245 }, { "epoch": 0.73, "learning_rate": 3.6867677471087226e-06, "loss": 2.2927, "step": 7246 }, { "epoch": 0.73, "learning_rate": 3.684251431125865e-06, "loss": 2.2053, "step": 7247 }, { "epoch": 0.73, "learning_rate": 3.6817357802386977e-06, "loss": 2.3027, "step": 7248 }, { "epoch": 0.73, "learning_rate": 3.679220794712137e-06, "loss": 2.2835, "step": 7249 }, { "epoch": 0.73, "learning_rate": 3.6767064748110314e-06, "loss": 2.3702, "step": 7250 }, { "epoch": 0.73, "learning_rate": 3.6741928208001566e-06, "loss": 2.3857, "step": 7251 }, { "epoch": 0.73, "learning_rate": 3.671679832944218e-06, "loss": 2.3288, "step": 7252 }, { "epoch": 0.73, "learning_rate": 3.669167511507854e-06, "loss": 2.3666, "step": 7253 }, { "epoch": 0.73, "learning_rate": 3.66665585675563e-06, "loss": 2.301, "step": 7254 }, { "epoch": 0.73, "learning_rate": 3.664144868952042e-06, "loss": 2.3127, "step": 7255 }, { "epoch": 0.73, "learning_rate": 3.661634548361517e-06, "loss": 2.2829, "step": 7256 }, { "epoch": 0.73, "learning_rate": 3.6591248952484047e-06, "loss": 2.3616, "step": 7257 }, { "epoch": 0.73, "learning_rate": 3.6566159098770004e-06, "loss": 2.3917, "step": 7258 }, { "epoch": 0.73, "learning_rate": 3.654107592511512e-06, "loss": 2.2623, "step": 7259 }, { "epoch": 0.73, "learning_rate": 3.651599943416088e-06, "loss": 2.2484, "step": 7260 }, { "epoch": 0.73, "learning_rate": 3.6490929628548e-06, "loss": 2.2853, "step": 7261 }, { "epoch": 0.73, "learning_rate": 3.6465866510916527e-06, "loss": 2.3553, "step": 7262 }, { "epoch": 0.73, "learning_rate": 3.6440810083905797e-06, "loss": 2.2983, "step": 7263 }, { "epoch": 0.73, "learning_rate": 3.6415760350154427e-06, "loss": 2.2479, "step": 7264 }, { "epoch": 0.73, "learning_rate": 3.639071731230036e-06, "loss": 2.3572, "step": 7265 }, { "epoch": 0.73, "learning_rate": 3.6365680972980775e-06, "loss": 2.3606, "step": 7266 }, { "epoch": 0.73, "learning_rate": 3.6340651334832256e-06, "loss": 2.3227, "step": 7267 }, { "epoch": 0.73, "learning_rate": 3.6315628400490567e-06, "loss": 2.2913, "step": 7268 }, { "epoch": 0.73, "learning_rate": 3.6290612172590823e-06, "loss": 2.3622, "step": 7269 }, { "epoch": 0.73, "learning_rate": 3.626560265376742e-06, "loss": 2.338, "step": 7270 }, { "epoch": 0.73, "learning_rate": 3.6240599846654035e-06, "loss": 2.3227, "step": 7271 }, { "epoch": 0.73, "learning_rate": 3.62156037538837e-06, "loss": 2.2592, "step": 7272 }, { "epoch": 0.73, "learning_rate": 3.619061437808862e-06, "loss": 2.2794, "step": 7273 }, { "epoch": 0.73, "learning_rate": 3.6165631721900387e-06, "loss": 2.3005, "step": 7274 }, { "epoch": 0.73, "learning_rate": 3.614065578794983e-06, "loss": 2.2472, "step": 7275 }, { "epoch": 0.73, "learning_rate": 3.611568657886718e-06, "loss": 2.3574, "step": 7276 }, { "epoch": 0.73, "learning_rate": 3.609072409728186e-06, "loss": 2.3587, "step": 7277 }, { "epoch": 0.73, "learning_rate": 3.606576834582257e-06, "loss": 2.2994, "step": 7278 }, { "epoch": 0.73, "learning_rate": 3.6040819327117373e-06, "loss": 2.2964, "step": 7279 }, { "epoch": 0.73, "learning_rate": 3.601587704379356e-06, "loss": 2.3576, "step": 7280 }, { "epoch": 0.73, "learning_rate": 3.599094149847776e-06, "loss": 2.3527, "step": 7281 }, { "epoch": 0.73, "learning_rate": 3.596601269379586e-06, "loss": 2.2897, "step": 7282 }, { "epoch": 0.73, "learning_rate": 3.5941090632373064e-06, "loss": 2.2683, "step": 7283 }, { "epoch": 0.73, "learning_rate": 3.5916175316833813e-06, "loss": 2.2138, "step": 7284 }, { "epoch": 0.73, "learning_rate": 3.5891266749801934e-06, "loss": 2.2984, "step": 7285 }, { "epoch": 0.73, "learning_rate": 3.5866364933900466e-06, "loss": 2.2518, "step": 7286 }, { "epoch": 0.73, "learning_rate": 3.5841469871751745e-06, "loss": 2.4084, "step": 7287 }, { "epoch": 0.73, "learning_rate": 3.5816581565977416e-06, "loss": 2.3895, "step": 7288 }, { "epoch": 0.73, "learning_rate": 3.5791700019198404e-06, "loss": 2.4264, "step": 7289 }, { "epoch": 0.73, "learning_rate": 3.576682523403492e-06, "loss": 2.2294, "step": 7290 }, { "epoch": 0.73, "learning_rate": 3.574195721310646e-06, "loss": 2.3835, "step": 7291 }, { "epoch": 0.73, "learning_rate": 3.571709595903182e-06, "loss": 2.3187, "step": 7292 }, { "epoch": 0.73, "learning_rate": 3.5692241474429077e-06, "loss": 2.3201, "step": 7293 }, { "epoch": 0.73, "learning_rate": 3.5667393761915592e-06, "loss": 2.2727, "step": 7294 }, { "epoch": 0.73, "learning_rate": 3.564255282410802e-06, "loss": 2.2846, "step": 7295 }, { "epoch": 0.73, "learning_rate": 3.561771866362229e-06, "loss": 2.271, "step": 7296 }, { "epoch": 0.73, "learning_rate": 3.559289128307364e-06, "loss": 2.3619, "step": 7297 }, { "epoch": 0.73, "learning_rate": 3.5568070685076563e-06, "loss": 2.375, "step": 7298 }, { "epoch": 0.73, "learning_rate": 3.554325687224486e-06, "loss": 2.2992, "step": 7299 }, { "epoch": 0.73, "learning_rate": 3.5518449847191603e-06, "loss": 2.2344, "step": 7300 }, { "epoch": 0.73, "learning_rate": 3.549364961252918e-06, "loss": 2.4192, "step": 7301 }, { "epoch": 0.73, "learning_rate": 3.5468856170869192e-06, "loss": 2.3258, "step": 7302 }, { "epoch": 0.73, "learning_rate": 3.5444069524822643e-06, "loss": 2.3802, "step": 7303 }, { "epoch": 0.73, "learning_rate": 3.541928967699971e-06, "loss": 2.3809, "step": 7304 }, { "epoch": 0.73, "learning_rate": 3.539451663000992e-06, "loss": 2.2958, "step": 7305 }, { "epoch": 0.73, "learning_rate": 3.5369750386462045e-06, "loss": 2.2001, "step": 7306 }, { "epoch": 0.73, "learning_rate": 3.5344990948964163e-06, "loss": 2.3453, "step": 7307 }, { "epoch": 0.73, "learning_rate": 3.532023832012361e-06, "loss": 2.3917, "step": 7308 }, { "epoch": 0.73, "learning_rate": 3.5295492502547057e-06, "loss": 2.3587, "step": 7309 }, { "epoch": 0.73, "learning_rate": 3.5270753498840393e-06, "loss": 2.398, "step": 7310 }, { "epoch": 0.73, "learning_rate": 3.5246021311608802e-06, "loss": 2.2684, "step": 7311 }, { "epoch": 0.73, "learning_rate": 3.522129594345687e-06, "loss": 2.2885, "step": 7312 }, { "epoch": 0.73, "learning_rate": 3.519657739698825e-06, "loss": 2.1801, "step": 7313 }, { "epoch": 0.73, "learning_rate": 3.517186567480605e-06, "loss": 2.2638, "step": 7314 }, { "epoch": 0.73, "learning_rate": 3.5147160779512567e-06, "loss": 2.3463, "step": 7315 }, { "epoch": 0.73, "learning_rate": 3.512246271370944e-06, "loss": 2.2511, "step": 7316 }, { "epoch": 0.73, "learning_rate": 3.5097771479997543e-06, "loss": 2.2065, "step": 7317 }, { "epoch": 0.73, "learning_rate": 3.5073087080977054e-06, "loss": 2.3136, "step": 7318 }, { "epoch": 0.73, "learning_rate": 3.504840951924743e-06, "loss": 2.2755, "step": 7319 }, { "epoch": 0.73, "learning_rate": 3.5023738797407357e-06, "loss": 2.2489, "step": 7320 }, { "epoch": 0.73, "learning_rate": 3.4999074918054922e-06, "loss": 2.2928, "step": 7321 }, { "epoch": 0.73, "learning_rate": 3.4974417883787382e-06, "loss": 2.2767, "step": 7322 }, { "epoch": 0.73, "learning_rate": 3.494976769720132e-06, "loss": 2.2106, "step": 7323 }, { "epoch": 0.73, "learning_rate": 3.492512436089256e-06, "loss": 2.2816, "step": 7324 }, { "epoch": 0.73, "learning_rate": 3.490048787745626e-06, "loss": 2.2792, "step": 7325 }, { "epoch": 0.73, "learning_rate": 3.4875858249486796e-06, "loss": 2.3597, "step": 7326 }, { "epoch": 0.73, "learning_rate": 3.485123547957787e-06, "loss": 2.2997, "step": 7327 }, { "epoch": 0.73, "learning_rate": 3.482661957032244e-06, "loss": 2.345, "step": 7328 }, { "epoch": 0.73, "learning_rate": 3.4802010524312725e-06, "loss": 2.3814, "step": 7329 }, { "epoch": 0.73, "learning_rate": 3.4777408344140283e-06, "loss": 2.2198, "step": 7330 }, { "epoch": 0.73, "learning_rate": 3.4752813032395905e-06, "loss": 2.4845, "step": 7331 }, { "epoch": 0.73, "learning_rate": 3.4728224591669636e-06, "loss": 2.4064, "step": 7332 }, { "epoch": 0.73, "learning_rate": 3.470364302455084e-06, "loss": 2.2589, "step": 7333 }, { "epoch": 0.73, "learning_rate": 3.4679068333628117e-06, "loss": 2.3201, "step": 7334 }, { "epoch": 0.73, "learning_rate": 3.46545005214894e-06, "loss": 2.2272, "step": 7335 }, { "epoch": 0.73, "learning_rate": 3.4629939590721883e-06, "loss": 2.2627, "step": 7336 }, { "epoch": 0.74, "learning_rate": 3.460538554391194e-06, "loss": 2.3629, "step": 7337 }, { "epoch": 0.74, "learning_rate": 3.45808383836453e-06, "loss": 2.3016, "step": 7338 }, { "epoch": 0.74, "learning_rate": 3.455629811250704e-06, "loss": 2.2912, "step": 7339 }, { "epoch": 0.74, "learning_rate": 3.4531764733081386e-06, "loss": 2.3837, "step": 7340 }, { "epoch": 0.74, "learning_rate": 3.45072382479519e-06, "loss": 2.266, "step": 7341 }, { "epoch": 0.74, "learning_rate": 3.44827186597014e-06, "loss": 2.3176, "step": 7342 }, { "epoch": 0.74, "learning_rate": 3.4458205970911973e-06, "loss": 2.305, "step": 7343 }, { "epoch": 0.74, "learning_rate": 3.4433700184165007e-06, "loss": 2.3309, "step": 7344 }, { "epoch": 0.74, "learning_rate": 3.440920130204114e-06, "loss": 2.2567, "step": 7345 }, { "epoch": 0.74, "learning_rate": 3.438470932712028e-06, "loss": 2.3008, "step": 7346 }, { "epoch": 0.74, "learning_rate": 3.4360224261981587e-06, "loss": 2.2799, "step": 7347 }, { "epoch": 0.74, "learning_rate": 3.4335746109203594e-06, "loss": 2.215, "step": 7348 }, { "epoch": 0.74, "learning_rate": 3.4311274871363985e-06, "loss": 2.3269, "step": 7349 }, { "epoch": 0.74, "learning_rate": 3.4286810551039783e-06, "loss": 2.2561, "step": 7350 }, { "epoch": 0.74, "learning_rate": 3.426235315080725e-06, "loss": 2.3158, "step": 7351 }, { "epoch": 0.74, "learning_rate": 3.423790267324194e-06, "loss": 2.2671, "step": 7352 }, { "epoch": 0.74, "learning_rate": 3.4213459120918678e-06, "loss": 2.3093, "step": 7353 }, { "epoch": 0.74, "learning_rate": 3.418902249641155e-06, "loss": 2.3703, "step": 7354 }, { "epoch": 0.74, "learning_rate": 3.4164592802293904e-06, "loss": 2.31, "step": 7355 }, { "epoch": 0.74, "learning_rate": 3.414017004113839e-06, "loss": 2.4082, "step": 7356 }, { "epoch": 0.74, "learning_rate": 3.4115754215516884e-06, "loss": 2.3295, "step": 7357 }, { "epoch": 0.74, "learning_rate": 3.409134532800057e-06, "loss": 2.391, "step": 7358 }, { "epoch": 0.74, "learning_rate": 3.406694338115989e-06, "loss": 2.3116, "step": 7359 }, { "epoch": 0.74, "learning_rate": 3.4042548377564543e-06, "loss": 2.3359, "step": 7360 }, { "epoch": 0.74, "learning_rate": 3.4018160319783523e-06, "loss": 2.1934, "step": 7361 }, { "epoch": 0.74, "learning_rate": 3.3993779210385047e-06, "loss": 2.3859, "step": 7362 }, { "epoch": 0.74, "learning_rate": 3.3969405051936655e-06, "loss": 2.1936, "step": 7363 }, { "epoch": 0.74, "learning_rate": 3.394503784700508e-06, "loss": 2.2928, "step": 7364 }, { "epoch": 0.74, "learning_rate": 3.3920677598156437e-06, "loss": 2.3197, "step": 7365 }, { "epoch": 0.74, "learning_rate": 3.3896324307956018e-06, "loss": 2.319, "step": 7366 }, { "epoch": 0.74, "learning_rate": 3.3871977978968405e-06, "loss": 2.3854, "step": 7367 }, { "epoch": 0.74, "learning_rate": 3.384763861375746e-06, "loss": 2.3279, "step": 7368 }, { "epoch": 0.74, "learning_rate": 3.3823306214886277e-06, "loss": 2.3289, "step": 7369 }, { "epoch": 0.74, "learning_rate": 3.3798980784917255e-06, "loss": 2.3563, "step": 7370 }, { "epoch": 0.74, "learning_rate": 3.3774662326412045e-06, "loss": 2.2231, "step": 7371 }, { "epoch": 0.74, "learning_rate": 3.3750350841931558e-06, "loss": 2.2157, "step": 7372 }, { "epoch": 0.74, "learning_rate": 3.3726046334035933e-06, "loss": 2.3092, "step": 7373 }, { "epoch": 0.74, "learning_rate": 3.3701748805284705e-06, "loss": 2.1776, "step": 7374 }, { "epoch": 0.74, "learning_rate": 3.367745825823654e-06, "loss": 2.3162, "step": 7375 }, { "epoch": 0.74, "learning_rate": 3.3653174695449454e-06, "loss": 2.2981, "step": 7376 }, { "epoch": 0.74, "learning_rate": 3.362889811948061e-06, "loss": 2.2023, "step": 7377 }, { "epoch": 0.74, "learning_rate": 3.360462853288656e-06, "loss": 2.3158, "step": 7378 }, { "epoch": 0.74, "learning_rate": 3.358036593822306e-06, "loss": 2.3199, "step": 7379 }, { "epoch": 0.74, "learning_rate": 3.3556110338045168e-06, "loss": 2.3155, "step": 7380 }, { "epoch": 0.74, "learning_rate": 3.3531861734907146e-06, "loss": 2.2136, "step": 7381 }, { "epoch": 0.74, "learning_rate": 3.350762013136255e-06, "loss": 2.3794, "step": 7382 }, { "epoch": 0.74, "learning_rate": 3.3483385529964253e-06, "loss": 2.2581, "step": 7383 }, { "epoch": 0.74, "learning_rate": 3.345915793326431e-06, "loss": 2.2552, "step": 7384 }, { "epoch": 0.74, "learning_rate": 3.343493734381407e-06, "loss": 2.2461, "step": 7385 }, { "epoch": 0.74, "learning_rate": 3.3410723764164143e-06, "loss": 2.3022, "step": 7386 }, { "epoch": 0.74, "learning_rate": 3.3386517196864408e-06, "loss": 2.2678, "step": 7387 }, { "epoch": 0.74, "learning_rate": 3.336231764446398e-06, "loss": 2.3575, "step": 7388 }, { "epoch": 0.74, "learning_rate": 3.333812510951128e-06, "loss": 2.3357, "step": 7389 }, { "epoch": 0.74, "learning_rate": 3.3313939594553922e-06, "loss": 2.2628, "step": 7390 }, { "epoch": 0.74, "learning_rate": 3.328976110213884e-06, "loss": 2.1694, "step": 7391 }, { "epoch": 0.74, "learning_rate": 3.3265589634812235e-06, "loss": 2.3119, "step": 7392 }, { "epoch": 0.74, "learning_rate": 3.3241425195119525e-06, "loss": 2.1858, "step": 7393 }, { "epoch": 0.74, "learning_rate": 3.321726778560542e-06, "loss": 2.2815, "step": 7394 }, { "epoch": 0.74, "learning_rate": 3.3193117408813856e-06, "loss": 2.1898, "step": 7395 }, { "epoch": 0.74, "learning_rate": 3.3168974067288063e-06, "loss": 2.3801, "step": 7396 }, { "epoch": 0.74, "learning_rate": 3.3144837763570513e-06, "loss": 2.355, "step": 7397 }, { "epoch": 0.74, "learning_rate": 3.3120708500202923e-06, "loss": 2.3022, "step": 7398 }, { "epoch": 0.74, "learning_rate": 3.3096586279726316e-06, "loss": 2.3652, "step": 7399 }, { "epoch": 0.74, "learning_rate": 3.3072471104680927e-06, "loss": 2.312, "step": 7400 }, { "epoch": 0.74, "learning_rate": 3.3048362977606254e-06, "loss": 2.3392, "step": 7401 }, { "epoch": 0.74, "learning_rate": 3.302426190104108e-06, "loss": 2.4214, "step": 7402 }, { "epoch": 0.74, "learning_rate": 3.3000167877523416e-06, "loss": 2.2648, "step": 7403 }, { "epoch": 0.74, "learning_rate": 3.297608090959056e-06, "loss": 2.3063, "step": 7404 }, { "epoch": 0.74, "learning_rate": 3.295200099977903e-06, "loss": 2.219, "step": 7405 }, { "epoch": 0.74, "learning_rate": 3.292792815062463e-06, "loss": 2.3681, "step": 7406 }, { "epoch": 0.74, "learning_rate": 3.2903862364662433e-06, "loss": 2.3446, "step": 7407 }, { "epoch": 0.74, "learning_rate": 3.2879803644426713e-06, "loss": 2.3266, "step": 7408 }, { "epoch": 0.74, "learning_rate": 3.285575199245101e-06, "loss": 2.302, "step": 7409 }, { "epoch": 0.74, "learning_rate": 3.2831707411268222e-06, "loss": 2.2564, "step": 7410 }, { "epoch": 0.74, "learning_rate": 3.2807669903410387e-06, "loss": 2.2763, "step": 7411 }, { "epoch": 0.74, "learning_rate": 3.2783639471408823e-06, "loss": 2.287, "step": 7412 }, { "epoch": 0.74, "learning_rate": 3.2759616117794124e-06, "loss": 2.3229, "step": 7413 }, { "epoch": 0.74, "learning_rate": 3.2735599845096123e-06, "loss": 2.343, "step": 7414 }, { "epoch": 0.74, "learning_rate": 3.2711590655843928e-06, "loss": 2.3424, "step": 7415 }, { "epoch": 0.74, "learning_rate": 3.2687588552565873e-06, "loss": 2.3388, "step": 7416 }, { "epoch": 0.74, "learning_rate": 3.266359353778956e-06, "loss": 2.3577, "step": 7417 }, { "epoch": 0.74, "learning_rate": 3.2639605614041846e-06, "loss": 2.3446, "step": 7418 }, { "epoch": 0.74, "learning_rate": 3.2615624783848853e-06, "loss": 2.3879, "step": 7419 }, { "epoch": 0.74, "learning_rate": 3.2591651049735916e-06, "loss": 2.2612, "step": 7420 }, { "epoch": 0.74, "learning_rate": 3.2567684414227673e-06, "loss": 2.2988, "step": 7421 }, { "epoch": 0.74, "learning_rate": 3.254372487984798e-06, "loss": 2.314, "step": 7422 }, { "epoch": 0.74, "learning_rate": 3.2519772449119944e-06, "loss": 2.2421, "step": 7423 }, { "epoch": 0.74, "learning_rate": 3.249582712456596e-06, "loss": 2.2624, "step": 7424 }, { "epoch": 0.74, "learning_rate": 3.247188890870764e-06, "loss": 2.2711, "step": 7425 }, { "epoch": 0.74, "learning_rate": 3.2447957804065845e-06, "loss": 2.3132, "step": 7426 }, { "epoch": 0.74, "learning_rate": 3.242403381316068e-06, "loss": 2.4004, "step": 7427 }, { "epoch": 0.74, "learning_rate": 3.2400116938511595e-06, "loss": 2.3503, "step": 7428 }, { "epoch": 0.74, "learning_rate": 3.2376207182637166e-06, "loss": 2.2265, "step": 7429 }, { "epoch": 0.74, "learning_rate": 3.2352304548055267e-06, "loss": 2.3301, "step": 7430 }, { "epoch": 0.74, "learning_rate": 3.232840903728305e-06, "loss": 2.2467, "step": 7431 }, { "epoch": 0.74, "learning_rate": 3.230452065283687e-06, "loss": 2.2597, "step": 7432 }, { "epoch": 0.74, "learning_rate": 3.228063939723235e-06, "loss": 2.3932, "step": 7433 }, { "epoch": 0.74, "learning_rate": 3.225676527298438e-06, "loss": 2.3419, "step": 7434 }, { "epoch": 0.74, "learning_rate": 3.223289828260707e-06, "loss": 2.3044, "step": 7435 }, { "epoch": 0.75, "learning_rate": 3.220903842861377e-06, "loss": 2.2549, "step": 7436 }, { "epoch": 0.75, "learning_rate": 3.2185185713517176e-06, "loss": 2.3724, "step": 7437 }, { "epoch": 0.75, "learning_rate": 3.216134013982911e-06, "loss": 2.3245, "step": 7438 }, { "epoch": 0.75, "learning_rate": 3.2137501710060726e-06, "loss": 2.2345, "step": 7439 }, { "epoch": 0.75, "learning_rate": 3.211367042672232e-06, "loss": 2.234, "step": 7440 }, { "epoch": 0.75, "learning_rate": 3.2089846292323544e-06, "loss": 2.2916, "step": 7441 }, { "epoch": 0.75, "learning_rate": 3.206602930937326e-06, "loss": 2.2039, "step": 7442 }, { "epoch": 0.75, "learning_rate": 3.2042219480379566e-06, "loss": 2.329, "step": 7443 }, { "epoch": 0.75, "learning_rate": 3.2018416807849827e-06, "loss": 2.3141, "step": 7444 }, { "epoch": 0.75, "learning_rate": 3.1994621294290596e-06, "loss": 2.2423, "step": 7445 }, { "epoch": 0.75, "learning_rate": 3.1970832942207796e-06, "loss": 2.2975, "step": 7446 }, { "epoch": 0.75, "learning_rate": 3.1947051754106483e-06, "loss": 2.361, "step": 7447 }, { "epoch": 0.75, "learning_rate": 3.1923277732491e-06, "loss": 2.2572, "step": 7448 }, { "epoch": 0.75, "learning_rate": 3.1899510879864928e-06, "loss": 2.3729, "step": 7449 }, { "epoch": 0.75, "learning_rate": 3.1875751198731074e-06, "loss": 2.3098, "step": 7450 }, { "epoch": 0.75, "learning_rate": 3.1851998691591535e-06, "loss": 2.3487, "step": 7451 }, { "epoch": 0.75, "learning_rate": 3.1828253360947625e-06, "loss": 2.3775, "step": 7452 }, { "epoch": 0.75, "learning_rate": 3.180451520929989e-06, "loss": 2.328, "step": 7453 }, { "epoch": 0.75, "learning_rate": 3.178078423914812e-06, "loss": 2.3036, "step": 7454 }, { "epoch": 0.75, "learning_rate": 3.175706045299143e-06, "loss": 2.1968, "step": 7455 }, { "epoch": 0.75, "learning_rate": 3.1733343853328067e-06, "loss": 2.3081, "step": 7456 }, { "epoch": 0.75, "learning_rate": 3.170963444265557e-06, "loss": 2.3313, "step": 7457 }, { "epoch": 0.75, "learning_rate": 3.168593222347073e-06, "loss": 2.3908, "step": 7458 }, { "epoch": 0.75, "learning_rate": 3.166223719826954e-06, "loss": 2.3157, "step": 7459 }, { "epoch": 0.75, "learning_rate": 3.16385493695473e-06, "loss": 2.2624, "step": 7460 }, { "epoch": 0.75, "learning_rate": 3.1614868739798497e-06, "loss": 2.2289, "step": 7461 }, { "epoch": 0.75, "learning_rate": 3.1591195311516877e-06, "loss": 2.2455, "step": 7462 }, { "epoch": 0.75, "learning_rate": 3.1567529087195437e-06, "loss": 2.2743, "step": 7463 }, { "epoch": 0.75, "learning_rate": 3.15438700693264e-06, "loss": 2.3316, "step": 7464 }, { "epoch": 0.75, "learning_rate": 3.1520218260401238e-06, "loss": 2.3019, "step": 7465 }, { "epoch": 0.75, "learning_rate": 3.149657366291068e-06, "loss": 2.3277, "step": 7466 }, { "epoch": 0.75, "learning_rate": 3.1472936279344656e-06, "loss": 2.2035, "step": 7467 }, { "epoch": 0.75, "learning_rate": 3.144930611219238e-06, "loss": 2.3018, "step": 7468 }, { "epoch": 0.75, "learning_rate": 3.1425683163942265e-06, "loss": 2.3441, "step": 7469 }, { "epoch": 0.75, "learning_rate": 3.1402067437082005e-06, "loss": 2.3809, "step": 7470 }, { "epoch": 0.75, "learning_rate": 3.137845893409851e-06, "loss": 2.2653, "step": 7471 }, { "epoch": 0.75, "learning_rate": 3.135485765747789e-06, "loss": 2.3317, "step": 7472 }, { "epoch": 0.75, "learning_rate": 3.133126360970561e-06, "loss": 2.3979, "step": 7473 }, { "epoch": 0.75, "learning_rate": 3.130767679326626e-06, "loss": 2.2156, "step": 7474 }, { "epoch": 0.75, "learning_rate": 3.1284097210643715e-06, "loss": 2.2294, "step": 7475 }, { "epoch": 0.75, "learning_rate": 3.1260524864321073e-06, "loss": 2.2063, "step": 7476 }, { "epoch": 0.75, "learning_rate": 3.1236959756780695e-06, "loss": 2.3177, "step": 7477 }, { "epoch": 0.75, "learning_rate": 3.1213401890504146e-06, "loss": 2.3286, "step": 7478 }, { "epoch": 0.75, "learning_rate": 3.118985126797226e-06, "loss": 2.2607, "step": 7479 }, { "epoch": 0.75, "learning_rate": 3.116630789166508e-06, "loss": 2.2641, "step": 7480 }, { "epoch": 0.75, "learning_rate": 3.114277176406192e-06, "loss": 2.2812, "step": 7481 }, { "epoch": 0.75, "learning_rate": 3.1119242887641286e-06, "loss": 2.3746, "step": 7482 }, { "epoch": 0.75, "learning_rate": 3.109572126488096e-06, "loss": 2.2706, "step": 7483 }, { "epoch": 0.75, "learning_rate": 3.107220689825795e-06, "loss": 2.3397, "step": 7484 }, { "epoch": 0.75, "learning_rate": 3.104869979024849e-06, "loss": 2.2645, "step": 7485 }, { "epoch": 0.75, "learning_rate": 3.102519994332804e-06, "loss": 2.3121, "step": 7486 }, { "epoch": 0.75, "learning_rate": 3.1001707359971346e-06, "loss": 2.2811, "step": 7487 }, { "epoch": 0.75, "learning_rate": 3.0978222042652317e-06, "loss": 2.223, "step": 7488 }, { "epoch": 0.75, "learning_rate": 3.095474399384414e-06, "loss": 2.4416, "step": 7489 }, { "epoch": 0.75, "learning_rate": 3.0931273216019207e-06, "loss": 2.245, "step": 7490 }, { "epoch": 0.75, "learning_rate": 3.090780971164924e-06, "loss": 2.275, "step": 7491 }, { "epoch": 0.75, "learning_rate": 3.0884353483205065e-06, "loss": 2.2814, "step": 7492 }, { "epoch": 0.75, "learning_rate": 3.086090453315682e-06, "loss": 2.3218, "step": 7493 }, { "epoch": 0.75, "learning_rate": 3.0837462863973844e-06, "loss": 2.2948, "step": 7494 }, { "epoch": 0.75, "learning_rate": 3.0814028478124724e-06, "loss": 2.2398, "step": 7495 }, { "epoch": 0.75, "learning_rate": 3.0790601378077277e-06, "loss": 2.1282, "step": 7496 }, { "epoch": 0.75, "learning_rate": 3.0767181566298553e-06, "loss": 2.3399, "step": 7497 }, { "epoch": 0.75, "learning_rate": 3.0743769045254834e-06, "loss": 2.3287, "step": 7498 }, { "epoch": 0.75, "learning_rate": 3.072036381741159e-06, "loss": 2.2497, "step": 7499 }, { "epoch": 0.75, "learning_rate": 3.0696965885233655e-06, "loss": 2.275, "step": 7500 }, { "epoch": 0.75, "learning_rate": 3.067357525118495e-06, "loss": 2.2812, "step": 7501 }, { "epoch": 0.75, "learning_rate": 3.065019191772871e-06, "loss": 2.2563, "step": 7502 }, { "epoch": 0.75, "learning_rate": 3.0626815887327378e-06, "loss": 2.3849, "step": 7503 }, { "epoch": 0.75, "learning_rate": 3.060344716244259e-06, "loss": 2.3736, "step": 7504 }, { "epoch": 0.75, "learning_rate": 3.058008574553526e-06, "loss": 2.2315, "step": 7505 }, { "epoch": 0.75, "learning_rate": 3.055673163906552e-06, "loss": 2.202, "step": 7506 }, { "epoch": 0.75, "learning_rate": 3.053338484549274e-06, "loss": 2.3499, "step": 7507 }, { "epoch": 0.75, "learning_rate": 3.051004536727549e-06, "loss": 2.2276, "step": 7508 }, { "epoch": 0.75, "learning_rate": 3.0486713206871642e-06, "loss": 2.3438, "step": 7509 }, { "epoch": 0.75, "learning_rate": 3.0463388366738213e-06, "loss": 2.3752, "step": 7510 }, { "epoch": 0.75, "learning_rate": 3.0440070849331494e-06, "loss": 2.2674, "step": 7511 }, { "epoch": 0.75, "learning_rate": 3.041676065710699e-06, "loss": 2.372, "step": 7512 }, { "epoch": 0.75, "learning_rate": 3.0393457792519444e-06, "loss": 2.2915, "step": 7513 }, { "epoch": 0.75, "learning_rate": 3.0370162258022806e-06, "loss": 2.3485, "step": 7514 }, { "epoch": 0.75, "learning_rate": 3.03468740560703e-06, "loss": 2.3365, "step": 7515 }, { "epoch": 0.75, "learning_rate": 3.0323593189114307e-06, "loss": 2.2584, "step": 7516 }, { "epoch": 0.75, "learning_rate": 3.0300319659606493e-06, "loss": 2.3462, "step": 7517 }, { "epoch": 0.75, "learning_rate": 3.0277053469997754e-06, "loss": 2.3049, "step": 7518 }, { "epoch": 0.75, "learning_rate": 3.0253794622738196e-06, "loss": 2.2706, "step": 7519 }, { "epoch": 0.75, "learning_rate": 3.0230543120277134e-06, "loss": 2.304, "step": 7520 }, { "epoch": 0.75, "learning_rate": 3.0207298965063124e-06, "loss": 2.3156, "step": 7521 }, { "epoch": 0.75, "learning_rate": 3.018406215954396e-06, "loss": 2.1374, "step": 7522 }, { "epoch": 0.75, "learning_rate": 3.0160832706166644e-06, "loss": 2.2472, "step": 7523 }, { "epoch": 0.75, "learning_rate": 3.013761060737741e-06, "loss": 2.2255, "step": 7524 }, { "epoch": 0.75, "learning_rate": 3.0114395865621727e-06, "loss": 2.2913, "step": 7525 }, { "epoch": 0.75, "learning_rate": 3.009118848334428e-06, "loss": 2.2102, "step": 7526 }, { "epoch": 0.75, "learning_rate": 3.006798846298897e-06, "loss": 2.3027, "step": 7527 }, { "epoch": 0.75, "learning_rate": 3.004479580699895e-06, "loss": 2.2968, "step": 7528 }, { "epoch": 0.75, "learning_rate": 3.002161051781657e-06, "loss": 2.3315, "step": 7529 }, { "epoch": 0.75, "learning_rate": 2.9998432597883407e-06, "loss": 2.2286, "step": 7530 }, { "epoch": 0.75, "learning_rate": 2.9975262049640297e-06, "loss": 2.3628, "step": 7531 }, { "epoch": 0.75, "learning_rate": 2.9952098875527247e-06, "loss": 2.2358, "step": 7532 }, { "epoch": 0.75, "learning_rate": 2.992894307798351e-06, "loss": 2.3163, "step": 7533 }, { "epoch": 0.75, "learning_rate": 2.9905794659447553e-06, "loss": 2.2407, "step": 7534 }, { "epoch": 0.75, "learning_rate": 2.9882653622357138e-06, "loss": 2.4086, "step": 7535 }, { "epoch": 0.76, "learning_rate": 2.9859519969149144e-06, "loss": 2.3819, "step": 7536 }, { "epoch": 0.76, "learning_rate": 2.9836393702259723e-06, "loss": 2.3321, "step": 7537 }, { "epoch": 0.76, "learning_rate": 2.981327482412426e-06, "loss": 2.2945, "step": 7538 }, { "epoch": 0.76, "learning_rate": 2.9790163337177334e-06, "loss": 2.337, "step": 7539 }, { "epoch": 0.76, "learning_rate": 2.9767059243852748e-06, "loss": 2.2745, "step": 7540 }, { "epoch": 0.76, "learning_rate": 2.974396254658356e-06, "loss": 2.3078, "step": 7541 }, { "epoch": 0.76, "learning_rate": 2.9720873247801996e-06, "loss": 2.2644, "step": 7542 }, { "epoch": 0.76, "learning_rate": 2.9697791349939566e-06, "loss": 2.2494, "step": 7543 }, { "epoch": 0.76, "learning_rate": 2.9674716855426932e-06, "loss": 2.2749, "step": 7544 }, { "epoch": 0.76, "learning_rate": 2.9651649766694034e-06, "loss": 2.2041, "step": 7545 }, { "epoch": 0.76, "learning_rate": 2.9628590086170017e-06, "loss": 2.2799, "step": 7546 }, { "epoch": 0.76, "learning_rate": 2.9605537816283214e-06, "loss": 2.2968, "step": 7547 }, { "epoch": 0.76, "learning_rate": 2.958249295946122e-06, "loss": 2.1896, "step": 7548 }, { "epoch": 0.76, "learning_rate": 2.955945551813081e-06, "loss": 2.3511, "step": 7549 }, { "epoch": 0.76, "learning_rate": 2.9536425494718025e-06, "loss": 2.4095, "step": 7550 }, { "epoch": 0.76, "learning_rate": 2.9513402891648093e-06, "loss": 2.3989, "step": 7551 }, { "epoch": 0.76, "learning_rate": 2.9490387711345412e-06, "loss": 2.3266, "step": 7552 }, { "epoch": 0.76, "learning_rate": 2.9467379956233756e-06, "loss": 2.3215, "step": 7553 }, { "epoch": 0.76, "learning_rate": 2.9444379628735955e-06, "loss": 2.2993, "step": 7554 }, { "epoch": 0.76, "learning_rate": 2.9421386731274117e-06, "loss": 2.3902, "step": 7555 }, { "epoch": 0.76, "learning_rate": 2.939840126626957e-06, "loss": 2.3793, "step": 7556 }, { "epoch": 0.76, "learning_rate": 2.9375423236142862e-06, "loss": 2.3263, "step": 7557 }, { "epoch": 0.76, "learning_rate": 2.9352452643313743e-06, "loss": 2.2379, "step": 7558 }, { "epoch": 0.76, "learning_rate": 2.9329489490201203e-06, "loss": 2.2673, "step": 7559 }, { "epoch": 0.76, "learning_rate": 2.9306533779223413e-06, "loss": 2.2428, "step": 7560 }, { "epoch": 0.76, "learning_rate": 2.928358551279776e-06, "loss": 2.3161, "step": 7561 }, { "epoch": 0.76, "learning_rate": 2.9260644693340944e-06, "loss": 2.2326, "step": 7562 }, { "epoch": 0.76, "learning_rate": 2.9237711323268757e-06, "loss": 2.3629, "step": 7563 }, { "epoch": 0.76, "learning_rate": 2.921478540499627e-06, "loss": 2.3476, "step": 7564 }, { "epoch": 0.76, "learning_rate": 2.919186694093773e-06, "loss": 2.3641, "step": 7565 }, { "epoch": 0.76, "learning_rate": 2.916895593350665e-06, "loss": 2.1911, "step": 7566 }, { "epoch": 0.76, "learning_rate": 2.914605238511574e-06, "loss": 2.2812, "step": 7567 }, { "epoch": 0.76, "learning_rate": 2.912315629817687e-06, "loss": 2.2799, "step": 7568 }, { "epoch": 0.76, "learning_rate": 2.910026767510119e-06, "loss": 2.3372, "step": 7569 }, { "epoch": 0.76, "learning_rate": 2.9077386518299024e-06, "loss": 2.3416, "step": 7570 }, { "epoch": 0.76, "learning_rate": 2.905451283017997e-06, "loss": 2.3227, "step": 7571 }, { "epoch": 0.76, "learning_rate": 2.903164661315279e-06, "loss": 2.4046, "step": 7572 }, { "epoch": 0.76, "learning_rate": 2.9008787869625466e-06, "loss": 2.2537, "step": 7573 }, { "epoch": 0.76, "learning_rate": 2.898593660200518e-06, "loss": 2.4141, "step": 7574 }, { "epoch": 0.76, "learning_rate": 2.8963092812698357e-06, "loss": 2.209, "step": 7575 }, { "epoch": 0.76, "learning_rate": 2.8940256504110607e-06, "loss": 2.1998, "step": 7576 }, { "epoch": 0.76, "learning_rate": 2.891742767864677e-06, "loss": 2.3157, "step": 7577 }, { "epoch": 0.76, "learning_rate": 2.8894606338710906e-06, "loss": 2.2771, "step": 7578 }, { "epoch": 0.76, "learning_rate": 2.887179248670622e-06, "loss": 2.2776, "step": 7579 }, { "epoch": 0.76, "learning_rate": 2.884898612503525e-06, "loss": 2.3526, "step": 7580 }, { "epoch": 0.76, "learning_rate": 2.882618725609966e-06, "loss": 2.3234, "step": 7581 }, { "epoch": 0.76, "learning_rate": 2.8803395882300323e-06, "loss": 2.2764, "step": 7582 }, { "epoch": 0.76, "learning_rate": 2.8780612006037345e-06, "loss": 2.2383, "step": 7583 }, { "epoch": 0.76, "learning_rate": 2.875783562971005e-06, "loss": 2.2839, "step": 7584 }, { "epoch": 0.76, "learning_rate": 2.8735066755716967e-06, "loss": 2.2975, "step": 7585 }, { "epoch": 0.76, "learning_rate": 2.8712305386455795e-06, "loss": 2.3423, "step": 7586 }, { "epoch": 0.76, "learning_rate": 2.8689551524323522e-06, "loss": 2.3568, "step": 7587 }, { "epoch": 0.76, "learning_rate": 2.866680517171626e-06, "loss": 2.3224, "step": 7588 }, { "epoch": 0.76, "learning_rate": 2.8644066331029398e-06, "loss": 2.3086, "step": 7589 }, { "epoch": 0.76, "learning_rate": 2.862133500465749e-06, "loss": 2.3288, "step": 7590 }, { "epoch": 0.76, "learning_rate": 2.859861119499432e-06, "loss": 2.2866, "step": 7591 }, { "epoch": 0.76, "learning_rate": 2.857589490443289e-06, "loss": 2.2288, "step": 7592 }, { "epoch": 0.76, "learning_rate": 2.8553186135365374e-06, "loss": 2.2382, "step": 7593 }, { "epoch": 0.76, "learning_rate": 2.8530484890183176e-06, "loss": 2.3163, "step": 7594 }, { "epoch": 0.76, "learning_rate": 2.8507791171276934e-06, "loss": 2.3361, "step": 7595 }, { "epoch": 0.76, "learning_rate": 2.848510498103644e-06, "loss": 2.2693, "step": 7596 }, { "epoch": 0.76, "learning_rate": 2.846242632185069e-06, "loss": 2.2527, "step": 7597 }, { "epoch": 0.76, "learning_rate": 2.8439755196107997e-06, "loss": 2.3622, "step": 7598 }, { "epoch": 0.76, "learning_rate": 2.841709160619576e-06, "loss": 2.3276, "step": 7599 }, { "epoch": 0.76, "learning_rate": 2.8394435554500612e-06, "loss": 2.2593, "step": 7600 }, { "epoch": 0.76, "learning_rate": 2.8371787043408426e-06, "loss": 2.2139, "step": 7601 }, { "epoch": 0.76, "learning_rate": 2.8349146075304255e-06, "loss": 2.3736, "step": 7602 }, { "epoch": 0.76, "learning_rate": 2.8326512652572356e-06, "loss": 2.2871, "step": 7603 }, { "epoch": 0.76, "learning_rate": 2.83038867775962e-06, "loss": 2.3322, "step": 7604 }, { "epoch": 0.76, "learning_rate": 2.828126845275846e-06, "loss": 2.2122, "step": 7605 }, { "epoch": 0.76, "learning_rate": 2.8258657680440993e-06, "loss": 2.1878, "step": 7606 }, { "epoch": 0.76, "learning_rate": 2.8236054463024967e-06, "loss": 2.3505, "step": 7607 }, { "epoch": 0.76, "learning_rate": 2.821345880289058e-06, "loss": 2.2763, "step": 7608 }, { "epoch": 0.76, "learning_rate": 2.819087070241736e-06, "loss": 2.2854, "step": 7609 }, { "epoch": 0.76, "learning_rate": 2.816829016398399e-06, "loss": 2.3101, "step": 7610 }, { "epoch": 0.76, "learning_rate": 2.814571718996838e-06, "loss": 2.2185, "step": 7611 }, { "epoch": 0.76, "learning_rate": 2.812315178274764e-06, "loss": 2.3349, "step": 7612 }, { "epoch": 0.76, "learning_rate": 2.8100593944698063e-06, "loss": 2.3815, "step": 7613 }, { "epoch": 0.76, "learning_rate": 2.8078043678195165e-06, "loss": 2.2419, "step": 7614 }, { "epoch": 0.76, "learning_rate": 2.805550098561364e-06, "loss": 2.2679, "step": 7615 }, { "epoch": 0.76, "learning_rate": 2.8032965869327434e-06, "loss": 2.3303, "step": 7616 }, { "epoch": 0.76, "learning_rate": 2.8010438331709656e-06, "loss": 2.2805, "step": 7617 }, { "epoch": 0.76, "learning_rate": 2.798791837513262e-06, "loss": 2.2412, "step": 7618 }, { "epoch": 0.76, "learning_rate": 2.796540600196784e-06, "loss": 2.3029, "step": 7619 }, { "epoch": 0.76, "learning_rate": 2.794290121458605e-06, "loss": 2.2998, "step": 7620 }, { "epoch": 0.76, "learning_rate": 2.792040401535716e-06, "loss": 2.3123, "step": 7621 }, { "epoch": 0.76, "learning_rate": 2.789791440665031e-06, "loss": 2.4086, "step": 7622 }, { "epoch": 0.76, "learning_rate": 2.78754323908338e-06, "loss": 2.3687, "step": 7623 }, { "epoch": 0.76, "learning_rate": 2.785295797027514e-06, "loss": 2.3305, "step": 7624 }, { "epoch": 0.76, "learning_rate": 2.783049114734112e-06, "loss": 2.3148, "step": 7625 }, { "epoch": 0.76, "learning_rate": 2.780803192439763e-06, "loss": 2.3408, "step": 7626 }, { "epoch": 0.76, "learning_rate": 2.778558030380979e-06, "loss": 2.2765, "step": 7627 }, { "epoch": 0.76, "learning_rate": 2.776313628794193e-06, "loss": 2.3437, "step": 7628 }, { "epoch": 0.76, "learning_rate": 2.7740699879157573e-06, "loss": 2.2269, "step": 7629 }, { "epoch": 0.76, "learning_rate": 2.7718271079819437e-06, "loss": 2.3709, "step": 7630 }, { "epoch": 0.76, "learning_rate": 2.7695849892289473e-06, "loss": 2.3558, "step": 7631 }, { "epoch": 0.76, "learning_rate": 2.7673436318928737e-06, "loss": 2.2833, "step": 7632 }, { "epoch": 0.76, "learning_rate": 2.7651030362097554e-06, "loss": 2.2442, "step": 7633 }, { "epoch": 0.76, "learning_rate": 2.76286320241555e-06, "loss": 2.389, "step": 7634 }, { "epoch": 0.76, "learning_rate": 2.760624130746126e-06, "loss": 2.2434, "step": 7635 }, { "epoch": 0.77, "learning_rate": 2.7583858214372726e-06, "loss": 2.3714, "step": 7636 }, { "epoch": 0.77, "learning_rate": 2.7561482747247025e-06, "loss": 2.3367, "step": 7637 }, { "epoch": 0.77, "learning_rate": 2.7539114908440446e-06, "loss": 2.2462, "step": 7638 }, { "epoch": 0.77, "learning_rate": 2.751675470030851e-06, "loss": 2.3312, "step": 7639 }, { "epoch": 0.77, "learning_rate": 2.74944021252059e-06, "loss": 2.3672, "step": 7640 }, { "epoch": 0.77, "learning_rate": 2.747205718548651e-06, "loss": 2.3445, "step": 7641 }, { "epoch": 0.77, "learning_rate": 2.7449719883503413e-06, "loss": 2.327, "step": 7642 }, { "epoch": 0.77, "learning_rate": 2.742739022160893e-06, "loss": 2.2074, "step": 7643 }, { "epoch": 0.77, "learning_rate": 2.740506820215454e-06, "loss": 2.2153, "step": 7644 }, { "epoch": 0.77, "learning_rate": 2.7382753827490892e-06, "loss": 2.4162, "step": 7645 }, { "epoch": 0.77, "learning_rate": 2.7360447099967892e-06, "loss": 2.2804, "step": 7646 }, { "epoch": 0.77, "learning_rate": 2.7338148021934565e-06, "loss": 2.2184, "step": 7647 }, { "epoch": 0.77, "learning_rate": 2.73158565957392e-06, "loss": 2.2715, "step": 7648 }, { "epoch": 0.77, "learning_rate": 2.729357282372923e-06, "loss": 2.2606, "step": 7649 }, { "epoch": 0.77, "learning_rate": 2.727129670825133e-06, "loss": 2.3098, "step": 7650 }, { "epoch": 0.77, "learning_rate": 2.724902825165131e-06, "loss": 2.3166, "step": 7651 }, { "epoch": 0.77, "learning_rate": 2.722676745627424e-06, "loss": 2.3706, "step": 7652 }, { "epoch": 0.77, "learning_rate": 2.7204514324464326e-06, "loss": 2.2424, "step": 7653 }, { "epoch": 0.77, "learning_rate": 2.7182268858564986e-06, "loss": 2.2069, "step": 7654 }, { "epoch": 0.77, "learning_rate": 2.7160031060918857e-06, "loss": 2.2752, "step": 7655 }, { "epoch": 0.77, "learning_rate": 2.713780093386772e-06, "loss": 2.385, "step": 7656 }, { "epoch": 0.77, "learning_rate": 2.711557847975259e-06, "loss": 2.3274, "step": 7657 }, { "epoch": 0.77, "learning_rate": 2.7093363700913657e-06, "loss": 2.3152, "step": 7658 }, { "epoch": 0.77, "learning_rate": 2.7071156599690294e-06, "loss": 2.3471, "step": 7659 }, { "epoch": 0.77, "learning_rate": 2.7048957178421063e-06, "loss": 2.3085, "step": 7660 }, { "epoch": 0.77, "learning_rate": 2.702676543944377e-06, "loss": 2.2781, "step": 7661 }, { "epoch": 0.77, "learning_rate": 2.7004581385095363e-06, "loss": 2.3472, "step": 7662 }, { "epoch": 0.77, "learning_rate": 2.6982405017711965e-06, "loss": 2.2315, "step": 7663 }, { "epoch": 0.77, "learning_rate": 2.6960236339628933e-06, "loss": 2.3529, "step": 7664 }, { "epoch": 0.77, "learning_rate": 2.693807535318078e-06, "loss": 2.2929, "step": 7665 }, { "epoch": 0.77, "learning_rate": 2.691592206070124e-06, "loss": 2.327, "step": 7666 }, { "epoch": 0.77, "learning_rate": 2.6893776464523203e-06, "loss": 2.2632, "step": 7667 }, { "epoch": 0.77, "learning_rate": 2.6871638566978777e-06, "loss": 2.3279, "step": 7668 }, { "epoch": 0.77, "learning_rate": 2.6849508370399223e-06, "loss": 2.3508, "step": 7669 }, { "epoch": 0.77, "learning_rate": 2.6827385877115073e-06, "loss": 2.2418, "step": 7670 }, { "epoch": 0.77, "learning_rate": 2.6805271089455984e-06, "loss": 2.3242, "step": 7671 }, { "epoch": 0.77, "learning_rate": 2.678316400975076e-06, "loss": 2.2362, "step": 7672 }, { "epoch": 0.77, "learning_rate": 2.676106464032746e-06, "loss": 2.1819, "step": 7673 }, { "epoch": 0.77, "learning_rate": 2.6738972983513333e-06, "loss": 2.3269, "step": 7674 }, { "epoch": 0.77, "learning_rate": 2.6716889041634775e-06, "loss": 2.3146, "step": 7675 }, { "epoch": 0.77, "learning_rate": 2.669481281701739e-06, "loss": 2.3457, "step": 7676 }, { "epoch": 0.77, "learning_rate": 2.6672744311986e-06, "loss": 2.3254, "step": 7677 }, { "epoch": 0.77, "learning_rate": 2.665068352886452e-06, "loss": 2.3152, "step": 7678 }, { "epoch": 0.77, "learning_rate": 2.6628630469976193e-06, "loss": 2.3319, "step": 7679 }, { "epoch": 0.77, "learning_rate": 2.6606585137643324e-06, "loss": 2.3119, "step": 7680 }, { "epoch": 0.77, "learning_rate": 2.6584547534187487e-06, "loss": 2.2979, "step": 7681 }, { "epoch": 0.77, "learning_rate": 2.6562517661929376e-06, "loss": 2.2546, "step": 7682 }, { "epoch": 0.77, "learning_rate": 2.6540495523188915e-06, "loss": 2.2135, "step": 7683 }, { "epoch": 0.77, "learning_rate": 2.651848112028519e-06, "loss": 2.2353, "step": 7684 }, { "epoch": 0.77, "learning_rate": 2.649647445553649e-06, "loss": 2.3657, "step": 7685 }, { "epoch": 0.77, "learning_rate": 2.6474475531260278e-06, "loss": 2.2293, "step": 7686 }, { "epoch": 0.77, "learning_rate": 2.6452484349773187e-06, "loss": 2.3919, "step": 7687 }, { "epoch": 0.77, "learning_rate": 2.64305009133911e-06, "loss": 2.3262, "step": 7688 }, { "epoch": 0.77, "learning_rate": 2.6408525224429016e-06, "loss": 2.2142, "step": 7689 }, { "epoch": 0.77, "learning_rate": 2.6386557285201144e-06, "loss": 2.2241, "step": 7690 }, { "epoch": 0.77, "learning_rate": 2.636459709802085e-06, "loss": 2.252, "step": 7691 }, { "epoch": 0.77, "learning_rate": 2.6342644665200736e-06, "loss": 2.3027, "step": 7692 }, { "epoch": 0.77, "learning_rate": 2.6320699989052533e-06, "loss": 2.3647, "step": 7693 }, { "epoch": 0.77, "learning_rate": 2.62987630718872e-06, "loss": 2.2884, "step": 7694 }, { "epoch": 0.77, "learning_rate": 2.6276833916014843e-06, "loss": 2.3222, "step": 7695 }, { "epoch": 0.77, "learning_rate": 2.625491252374477e-06, "loss": 2.2283, "step": 7696 }, { "epoch": 0.77, "learning_rate": 2.6232998897385474e-06, "loss": 2.2903, "step": 7697 }, { "epoch": 0.77, "learning_rate": 2.621109303924463e-06, "loss": 2.3108, "step": 7698 }, { "epoch": 0.77, "learning_rate": 2.618919495162907e-06, "loss": 2.2205, "step": 7699 }, { "epoch": 0.77, "learning_rate": 2.6167304636844847e-06, "loss": 2.149, "step": 7700 }, { "epoch": 0.77, "learning_rate": 2.614542209719716e-06, "loss": 2.3006, "step": 7701 }, { "epoch": 0.77, "learning_rate": 2.6123547334990407e-06, "loss": 2.3042, "step": 7702 }, { "epoch": 0.77, "learning_rate": 2.610168035252817e-06, "loss": 2.2969, "step": 7703 }, { "epoch": 0.77, "learning_rate": 2.6079821152113172e-06, "loss": 2.2884, "step": 7704 }, { "epoch": 0.77, "learning_rate": 2.6057969736047417e-06, "loss": 2.4097, "step": 7705 }, { "epoch": 0.77, "learning_rate": 2.6036126106631986e-06, "loss": 2.3649, "step": 7706 }, { "epoch": 0.77, "learning_rate": 2.6014290266167186e-06, "loss": 2.256, "step": 7707 }, { "epoch": 0.77, "learning_rate": 2.5992462216952483e-06, "loss": 2.3679, "step": 7708 }, { "epoch": 0.77, "learning_rate": 2.597064196128655e-06, "loss": 2.3107, "step": 7709 }, { "epoch": 0.77, "learning_rate": 2.5948829501467198e-06, "loss": 2.326, "step": 7710 }, { "epoch": 0.77, "learning_rate": 2.592702483979146e-06, "loss": 2.2285, "step": 7711 }, { "epoch": 0.77, "learning_rate": 2.5905227978555537e-06, "loss": 2.3388, "step": 7712 }, { "epoch": 0.77, "learning_rate": 2.588343892005478e-06, "loss": 2.2459, "step": 7713 }, { "epoch": 0.77, "learning_rate": 2.586165766658377e-06, "loss": 2.3574, "step": 7714 }, { "epoch": 0.77, "learning_rate": 2.583988422043621e-06, "loss": 2.359, "step": 7715 }, { "epoch": 0.77, "learning_rate": 2.5818118583905017e-06, "loss": 2.3648, "step": 7716 }, { "epoch": 0.77, "learning_rate": 2.5796360759282278e-06, "loss": 2.2339, "step": 7717 }, { "epoch": 0.77, "learning_rate": 2.5774610748859252e-06, "loss": 2.3, "step": 7718 }, { "epoch": 0.77, "learning_rate": 2.575286855492638e-06, "loss": 2.3813, "step": 7719 }, { "epoch": 0.77, "learning_rate": 2.573113417977329e-06, "loss": 2.2378, "step": 7720 }, { "epoch": 0.77, "learning_rate": 2.570940762568874e-06, "loss": 2.2592, "step": 7721 }, { "epoch": 0.77, "learning_rate": 2.5687688894960703e-06, "loss": 2.3158, "step": 7722 }, { "epoch": 0.77, "learning_rate": 2.5665977989876366e-06, "loss": 2.304, "step": 7723 }, { "epoch": 0.77, "learning_rate": 2.564427491272203e-06, "loss": 2.2637, "step": 7724 }, { "epoch": 0.77, "learning_rate": 2.56225796657832e-06, "loss": 2.3356, "step": 7725 }, { "epoch": 0.77, "learning_rate": 2.560089225134452e-06, "loss": 2.29, "step": 7726 }, { "epoch": 0.77, "learning_rate": 2.557921267168986e-06, "loss": 2.3291, "step": 7727 }, { "epoch": 0.77, "learning_rate": 2.555754092910223e-06, "loss": 2.3494, "step": 7728 }, { "epoch": 0.77, "learning_rate": 2.553587702586384e-06, "loss": 2.2434, "step": 7729 }, { "epoch": 0.77, "learning_rate": 2.551422096425605e-06, "loss": 2.4806, "step": 7730 }, { "epoch": 0.77, "learning_rate": 2.5492572746559386e-06, "loss": 2.323, "step": 7731 }, { "epoch": 0.77, "learning_rate": 2.5470932375053624e-06, "loss": 2.2596, "step": 7732 }, { "epoch": 0.77, "learning_rate": 2.5449299852017618e-06, "loss": 2.3064, "step": 7733 }, { "epoch": 0.77, "learning_rate": 2.542767517972945e-06, "loss": 2.2399, "step": 7734 }, { "epoch": 0.77, "learning_rate": 2.5406058360466366e-06, "loss": 2.3563, "step": 7735 }, { "epoch": 0.78, "learning_rate": 2.538444939650475e-06, "loss": 2.3669, "step": 7736 }, { "epoch": 0.78, "learning_rate": 2.53628482901202e-06, "loss": 2.2244, "step": 7737 }, { "epoch": 0.78, "learning_rate": 2.5341255043587487e-06, "loss": 2.3593, "step": 7738 }, { "epoch": 0.78, "learning_rate": 2.5319669659180524e-06, "loss": 2.2623, "step": 7739 }, { "epoch": 0.78, "learning_rate": 2.529809213917239e-06, "loss": 2.3383, "step": 7740 }, { "epoch": 0.78, "learning_rate": 2.527652248583543e-06, "loss": 2.3159, "step": 7741 }, { "epoch": 0.78, "learning_rate": 2.5254960701441046e-06, "loss": 2.3538, "step": 7742 }, { "epoch": 0.78, "learning_rate": 2.5233406788259863e-06, "loss": 2.1741, "step": 7743 }, { "epoch": 0.78, "learning_rate": 2.521186074856168e-06, "loss": 2.3577, "step": 7744 }, { "epoch": 0.78, "learning_rate": 2.5190322584615434e-06, "loss": 2.3556, "step": 7745 }, { "epoch": 0.78, "learning_rate": 2.516879229868927e-06, "loss": 2.3338, "step": 7746 }, { "epoch": 0.78, "learning_rate": 2.5147269893050485e-06, "loss": 2.2943, "step": 7747 }, { "epoch": 0.78, "learning_rate": 2.5125755369965555e-06, "loss": 2.2619, "step": 7748 }, { "epoch": 0.78, "learning_rate": 2.5104248731700076e-06, "loss": 2.3203, "step": 7749 }, { "epoch": 0.78, "learning_rate": 2.508274998051894e-06, "loss": 2.2599, "step": 7750 }, { "epoch": 0.78, "learning_rate": 2.506125911868608e-06, "loss": 2.2941, "step": 7751 }, { "epoch": 0.78, "learning_rate": 2.5039776148464646e-06, "loss": 2.299, "step": 7752 }, { "epoch": 0.78, "learning_rate": 2.5018301072116955e-06, "loss": 2.1746, "step": 7753 }, { "epoch": 0.78, "learning_rate": 2.4996833891904513e-06, "loss": 2.3957, "step": 7754 }, { "epoch": 0.78, "learning_rate": 2.4975374610087957e-06, "loss": 2.2354, "step": 7755 }, { "epoch": 0.78, "learning_rate": 2.4953923228927102e-06, "loss": 2.2052, "step": 7756 }, { "epoch": 0.78, "learning_rate": 2.493247975068096e-06, "loss": 2.2673, "step": 7757 }, { "epoch": 0.78, "learning_rate": 2.491104417760768e-06, "loss": 2.2829, "step": 7758 }, { "epoch": 0.78, "learning_rate": 2.488961651196459e-06, "loss": 2.2835, "step": 7759 }, { "epoch": 0.78, "learning_rate": 2.486819675600818e-06, "loss": 2.1595, "step": 7760 }, { "epoch": 0.78, "learning_rate": 2.4846784911994116e-06, "loss": 2.221, "step": 7761 }, { "epoch": 0.78, "learning_rate": 2.482538098217723e-06, "loss": 2.2975, "step": 7762 }, { "epoch": 0.78, "learning_rate": 2.4803984968811502e-06, "loss": 2.2331, "step": 7763 }, { "epoch": 0.78, "learning_rate": 2.47825968741501e-06, "loss": 2.2299, "step": 7764 }, { "epoch": 0.78, "learning_rate": 2.4761216700445357e-06, "loss": 2.2372, "step": 7765 }, { "epoch": 0.78, "learning_rate": 2.4739844449948756e-06, "loss": 2.2372, "step": 7766 }, { "epoch": 0.78, "learning_rate": 2.471848012491094e-06, "loss": 2.3358, "step": 7767 }, { "epoch": 0.78, "learning_rate": 2.4697123727581773e-06, "loss": 2.2053, "step": 7768 }, { "epoch": 0.78, "learning_rate": 2.4675775260210232e-06, "loss": 2.3275, "step": 7769 }, { "epoch": 0.78, "learning_rate": 2.4654434725044453e-06, "loss": 2.4767, "step": 7770 }, { "epoch": 0.78, "learning_rate": 2.4633102124331764e-06, "loss": 2.2309, "step": 7771 }, { "epoch": 0.78, "learning_rate": 2.461177746031865e-06, "loss": 2.3639, "step": 7772 }, { "epoch": 0.78, "learning_rate": 2.4590460735250764e-06, "loss": 2.459, "step": 7773 }, { "epoch": 0.78, "learning_rate": 2.4569151951372895e-06, "loss": 2.3037, "step": 7774 }, { "epoch": 0.78, "learning_rate": 2.4547851110929035e-06, "loss": 2.2922, "step": 7775 }, { "epoch": 0.78, "learning_rate": 2.452655821616232e-06, "loss": 2.2865, "step": 7776 }, { "epoch": 0.78, "learning_rate": 2.4505273269315053e-06, "loss": 2.3878, "step": 7777 }, { "epoch": 0.78, "learning_rate": 2.4483996272628684e-06, "loss": 2.2547, "step": 7778 }, { "epoch": 0.78, "learning_rate": 2.4462727228343865e-06, "loss": 2.2337, "step": 7779 }, { "epoch": 0.78, "learning_rate": 2.4441466138700367e-06, "loss": 2.3917, "step": 7780 }, { "epoch": 0.78, "learning_rate": 2.4420213005937153e-06, "loss": 2.3777, "step": 7781 }, { "epoch": 0.78, "learning_rate": 2.439896783229232e-06, "loss": 2.2304, "step": 7782 }, { "epoch": 0.78, "learning_rate": 2.437773062000317e-06, "loss": 2.2632, "step": 7783 }, { "epoch": 0.78, "learning_rate": 2.4356501371306117e-06, "loss": 2.3257, "step": 7784 }, { "epoch": 0.78, "learning_rate": 2.433528008843674e-06, "loss": 2.2623, "step": 7785 }, { "epoch": 0.78, "learning_rate": 2.4314066773629863e-06, "loss": 2.289, "step": 7786 }, { "epoch": 0.78, "learning_rate": 2.4292861429119374e-06, "loss": 2.2872, "step": 7787 }, { "epoch": 0.78, "learning_rate": 2.4271664057138356e-06, "loss": 2.3097, "step": 7788 }, { "epoch": 0.78, "learning_rate": 2.425047465991904e-06, "loss": 2.2738, "step": 7789 }, { "epoch": 0.78, "learning_rate": 2.422929323969285e-06, "loss": 2.351, "step": 7790 }, { "epoch": 0.78, "learning_rate": 2.4208119798690335e-06, "loss": 2.3548, "step": 7791 }, { "epoch": 0.78, "learning_rate": 2.418695433914121e-06, "loss": 2.3378, "step": 7792 }, { "epoch": 0.78, "learning_rate": 2.416579686327437e-06, "loss": 2.298, "step": 7793 }, { "epoch": 0.78, "learning_rate": 2.414464737331782e-06, "loss": 2.3136, "step": 7794 }, { "epoch": 0.78, "learning_rate": 2.412350587149882e-06, "loss": 2.2752, "step": 7795 }, { "epoch": 0.78, "learning_rate": 2.41023723600437e-06, "loss": 2.2738, "step": 7796 }, { "epoch": 0.78, "learning_rate": 2.4081246841177973e-06, "loss": 2.3135, "step": 7797 }, { "epoch": 0.78, "learning_rate": 2.4060129317126325e-06, "loss": 2.2546, "step": 7798 }, { "epoch": 0.78, "learning_rate": 2.4039019790112605e-06, "loss": 2.234, "step": 7799 }, { "epoch": 0.78, "learning_rate": 2.4017918262359764e-06, "loss": 2.277, "step": 7800 }, { "epoch": 0.78, "learning_rate": 2.3996824736089963e-06, "loss": 2.3977, "step": 7801 }, { "epoch": 0.78, "learning_rate": 2.3975739213524507e-06, "loss": 2.264, "step": 7802 }, { "epoch": 0.78, "learning_rate": 2.395466169688385e-06, "loss": 2.377, "step": 7803 }, { "epoch": 0.78, "learning_rate": 2.3933592188387654e-06, "loss": 2.2451, "step": 7804 }, { "epoch": 0.78, "learning_rate": 2.3912530690254675e-06, "loss": 2.3621, "step": 7805 }, { "epoch": 0.78, "learning_rate": 2.389147720470285e-06, "loss": 2.307, "step": 7806 }, { "epoch": 0.78, "learning_rate": 2.387043173394926e-06, "loss": 2.2489, "step": 7807 }, { "epoch": 0.78, "learning_rate": 2.3849394280210146e-06, "loss": 2.2612, "step": 7808 }, { "epoch": 0.78, "learning_rate": 2.3828364845700922e-06, "loss": 2.3276, "step": 7809 }, { "epoch": 0.78, "learning_rate": 2.380734343263614e-06, "loss": 2.2146, "step": 7810 }, { "epoch": 0.78, "learning_rate": 2.3786330043229523e-06, "loss": 2.3779, "step": 7811 }, { "epoch": 0.78, "learning_rate": 2.376532467969389e-06, "loss": 2.2929, "step": 7812 }, { "epoch": 0.78, "learning_rate": 2.3744327344241336e-06, "loss": 2.3679, "step": 7813 }, { "epoch": 0.78, "learning_rate": 2.3723338039082997e-06, "loss": 2.3393, "step": 7814 }, { "epoch": 0.78, "learning_rate": 2.3702356766429226e-06, "loss": 2.3102, "step": 7815 }, { "epoch": 0.78, "learning_rate": 2.3681383528489477e-06, "loss": 2.2427, "step": 7816 }, { "epoch": 0.78, "learning_rate": 2.3660418327472423e-06, "loss": 2.3639, "step": 7817 }, { "epoch": 0.78, "learning_rate": 2.363946116558583e-06, "loss": 2.2944, "step": 7818 }, { "epoch": 0.78, "learning_rate": 2.3618512045036647e-06, "loss": 2.3446, "step": 7819 }, { "epoch": 0.78, "learning_rate": 2.359757096803099e-06, "loss": 2.2903, "step": 7820 }, { "epoch": 0.78, "learning_rate": 2.3576637936774105e-06, "loss": 2.3244, "step": 7821 }, { "epoch": 0.78, "learning_rate": 2.355571295347039e-06, "loss": 2.2278, "step": 7822 }, { "epoch": 0.78, "learning_rate": 2.3534796020323405e-06, "loss": 2.261, "step": 7823 }, { "epoch": 0.78, "learning_rate": 2.3513887139535864e-06, "loss": 2.2238, "step": 7824 }, { "epoch": 0.78, "learning_rate": 2.3492986313309628e-06, "loss": 2.3621, "step": 7825 }, { "epoch": 0.78, "learning_rate": 2.3472093543845707e-06, "loss": 2.2356, "step": 7826 }, { "epoch": 0.78, "learning_rate": 2.3451208833344262e-06, "loss": 2.2542, "step": 7827 }, { "epoch": 0.78, "learning_rate": 2.3430332184004635e-06, "loss": 2.2795, "step": 7828 }, { "epoch": 0.78, "learning_rate": 2.340946359802526e-06, "loss": 2.3461, "step": 7829 }, { "epoch": 0.78, "learning_rate": 2.3388603077603746e-06, "loss": 2.3054, "step": 7830 }, { "epoch": 0.78, "learning_rate": 2.3367750624936925e-06, "loss": 2.2701, "step": 7831 }, { "epoch": 0.78, "learning_rate": 2.3346906242220668e-06, "loss": 2.3031, "step": 7832 }, { "epoch": 0.78, "learning_rate": 2.3326069931650064e-06, "loss": 2.3669, "step": 7833 }, { "epoch": 0.78, "learning_rate": 2.330524169541931e-06, "loss": 2.328, "step": 7834 }, { "epoch": 0.78, "learning_rate": 2.32844215357218e-06, "loss": 2.2145, "step": 7835 }, { "epoch": 0.79, "learning_rate": 2.3263609454750046e-06, "loss": 2.2099, "step": 7836 }, { "epoch": 0.79, "learning_rate": 2.3242805454695705e-06, "loss": 2.2673, "step": 7837 }, { "epoch": 0.79, "learning_rate": 2.3222009537749614e-06, "loss": 2.3735, "step": 7838 }, { "epoch": 0.79, "learning_rate": 2.320122170610172e-06, "loss": 2.247, "step": 7839 }, { "epoch": 0.79, "learning_rate": 2.318044196194115e-06, "loss": 2.2959, "step": 7840 }, { "epoch": 0.79, "learning_rate": 2.315967030745615e-06, "loss": 2.2454, "step": 7841 }, { "epoch": 0.79, "learning_rate": 2.3138906744834142e-06, "loss": 2.2945, "step": 7842 }, { "epoch": 0.79, "learning_rate": 2.3118151276261703e-06, "loss": 2.3026, "step": 7843 }, { "epoch": 0.79, "learning_rate": 2.309740390392451e-06, "loss": 2.3563, "step": 7844 }, { "epoch": 0.79, "learning_rate": 2.307666463000743e-06, "loss": 2.3182, "step": 7845 }, { "epoch": 0.79, "learning_rate": 2.305593345669447e-06, "loss": 2.2916, "step": 7846 }, { "epoch": 0.79, "learning_rate": 2.3035210386168762e-06, "loss": 2.2605, "step": 7847 }, { "epoch": 0.79, "learning_rate": 2.301449542061259e-06, "loss": 2.2523, "step": 7848 }, { "epoch": 0.79, "learning_rate": 2.2993788562207443e-06, "loss": 2.236, "step": 7849 }, { "epoch": 0.79, "learning_rate": 2.2973089813133877e-06, "loss": 2.3221, "step": 7850 }, { "epoch": 0.79, "learning_rate": 2.2952399175571625e-06, "loss": 2.2402, "step": 7851 }, { "epoch": 0.79, "learning_rate": 2.2931716651699575e-06, "loss": 2.3385, "step": 7852 }, { "epoch": 0.79, "learning_rate": 2.2911042243695745e-06, "loss": 2.3805, "step": 7853 }, { "epoch": 0.79, "learning_rate": 2.289037595373731e-06, "loss": 2.3836, "step": 7854 }, { "epoch": 0.79, "learning_rate": 2.2869717784000577e-06, "loss": 2.3181, "step": 7855 }, { "epoch": 0.79, "learning_rate": 2.2849067736661023e-06, "loss": 2.2495, "step": 7856 }, { "epoch": 0.79, "learning_rate": 2.2828425813893207e-06, "loss": 2.3124, "step": 7857 }, { "epoch": 0.79, "learning_rate": 2.2807792017870944e-06, "loss": 2.4071, "step": 7858 }, { "epoch": 0.79, "learning_rate": 2.2787166350767096e-06, "loss": 2.283, "step": 7859 }, { "epoch": 0.79, "learning_rate": 2.2766548814753696e-06, "loss": 2.2387, "step": 7860 }, { "epoch": 0.79, "learning_rate": 2.274593941200194e-06, "loss": 2.3419, "step": 7861 }, { "epoch": 0.79, "learning_rate": 2.272533814468214e-06, "loss": 2.2845, "step": 7862 }, { "epoch": 0.79, "learning_rate": 2.2704745014963794e-06, "loss": 2.2735, "step": 7863 }, { "epoch": 0.79, "learning_rate": 2.2684160025015456e-06, "loss": 2.3603, "step": 7864 }, { "epoch": 0.79, "learning_rate": 2.2663583177004877e-06, "loss": 2.3538, "step": 7865 }, { "epoch": 0.79, "learning_rate": 2.264301447309902e-06, "loss": 2.3566, "step": 7866 }, { "epoch": 0.79, "learning_rate": 2.2622453915463893e-06, "loss": 2.3336, "step": 7867 }, { "epoch": 0.79, "learning_rate": 2.260190150626467e-06, "loss": 2.2338, "step": 7868 }, { "epoch": 0.79, "learning_rate": 2.2581357247665682e-06, "loss": 2.3003, "step": 7869 }, { "epoch": 0.79, "learning_rate": 2.256082114183038e-06, "loss": 2.3034, "step": 7870 }, { "epoch": 0.79, "learning_rate": 2.2540293190921382e-06, "loss": 2.3055, "step": 7871 }, { "epoch": 0.79, "learning_rate": 2.2519773397100443e-06, "loss": 2.3355, "step": 7872 }, { "epoch": 0.79, "learning_rate": 2.2499261762528422e-06, "loss": 2.286, "step": 7873 }, { "epoch": 0.79, "learning_rate": 2.2478758289365356e-06, "loss": 2.3138, "step": 7874 }, { "epoch": 0.79, "learning_rate": 2.245826297977044e-06, "loss": 2.3247, "step": 7875 }, { "epoch": 0.79, "learning_rate": 2.2437775835901974e-06, "loss": 2.3566, "step": 7876 }, { "epoch": 0.79, "learning_rate": 2.2417296859917406e-06, "loss": 2.3038, "step": 7877 }, { "epoch": 0.79, "learning_rate": 2.239682605397332e-06, "loss": 2.3024, "step": 7878 }, { "epoch": 0.79, "learning_rate": 2.2376363420225445e-06, "loss": 2.2814, "step": 7879 }, { "epoch": 0.79, "learning_rate": 2.2355908960828655e-06, "loss": 2.2415, "step": 7880 }, { "epoch": 0.79, "learning_rate": 2.233546267793696e-06, "loss": 2.3126, "step": 7881 }, { "epoch": 0.79, "learning_rate": 2.231502457370349e-06, "loss": 2.3275, "step": 7882 }, { "epoch": 0.79, "learning_rate": 2.2294594650280552e-06, "loss": 2.2261, "step": 7883 }, { "epoch": 0.79, "learning_rate": 2.2274172909819567e-06, "loss": 2.3849, "step": 7884 }, { "epoch": 0.79, "learning_rate": 2.2253759354471084e-06, "loss": 2.3271, "step": 7885 }, { "epoch": 0.79, "learning_rate": 2.223335398638481e-06, "loss": 2.2623, "step": 7886 }, { "epoch": 0.79, "learning_rate": 2.2212956807709586e-06, "loss": 2.2975, "step": 7887 }, { "epoch": 0.79, "learning_rate": 2.219256782059339e-06, "loss": 2.2103, "step": 7888 }, { "epoch": 0.79, "learning_rate": 2.2172187027183335e-06, "loss": 2.2973, "step": 7889 }, { "epoch": 0.79, "learning_rate": 2.2151814429625663e-06, "loss": 2.3151, "step": 7890 }, { "epoch": 0.79, "learning_rate": 2.213145003006576e-06, "loss": 2.2745, "step": 7891 }, { "epoch": 0.79, "learning_rate": 2.2111093830648134e-06, "loss": 2.2714, "step": 7892 }, { "epoch": 0.79, "learning_rate": 2.209074583351649e-06, "loss": 2.2142, "step": 7893 }, { "epoch": 0.79, "learning_rate": 2.2070406040813606e-06, "loss": 2.3544, "step": 7894 }, { "epoch": 0.79, "learning_rate": 2.2050074454681427e-06, "loss": 2.2591, "step": 7895 }, { "epoch": 0.79, "learning_rate": 2.2029751077260986e-06, "loss": 2.3262, "step": 7896 }, { "epoch": 0.79, "learning_rate": 2.200943591069251e-06, "loss": 2.1992, "step": 7897 }, { "epoch": 0.79, "learning_rate": 2.1989128957115336e-06, "loss": 2.2213, "step": 7898 }, { "epoch": 0.79, "learning_rate": 2.196883021866795e-06, "loss": 2.2325, "step": 7899 }, { "epoch": 0.79, "learning_rate": 2.194853969748794e-06, "loss": 2.3259, "step": 7900 }, { "epoch": 0.79, "learning_rate": 2.1928257395712016e-06, "loss": 2.2977, "step": 7901 }, { "epoch": 0.79, "learning_rate": 2.1907983315476176e-06, "loss": 2.3091, "step": 7902 }, { "epoch": 0.79, "learning_rate": 2.1887717458915327e-06, "loss": 2.2761, "step": 7903 }, { "epoch": 0.79, "learning_rate": 2.186745982816363e-06, "loss": 2.2511, "step": 7904 }, { "epoch": 0.79, "learning_rate": 2.184721042535439e-06, "loss": 2.3169, "step": 7905 }, { "epoch": 0.79, "learning_rate": 2.1826969252620013e-06, "loss": 2.2893, "step": 7906 }, { "epoch": 0.79, "learning_rate": 2.1806736312092047e-06, "loss": 2.326, "step": 7907 }, { "epoch": 0.79, "learning_rate": 2.1786511605901163e-06, "loss": 2.2558, "step": 7908 }, { "epoch": 0.79, "learning_rate": 2.1766295136177185e-06, "loss": 2.3467, "step": 7909 }, { "epoch": 0.79, "learning_rate": 2.1746086905049022e-06, "loss": 2.2511, "step": 7910 }, { "epoch": 0.79, "learning_rate": 2.1725886914644823e-06, "loss": 2.2676, "step": 7911 }, { "epoch": 0.79, "learning_rate": 2.1705695167091758e-06, "loss": 2.3345, "step": 7912 }, { "epoch": 0.79, "learning_rate": 2.1685511664516168e-06, "loss": 2.2412, "step": 7913 }, { "epoch": 0.79, "learning_rate": 2.1665336409043538e-06, "loss": 2.2579, "step": 7914 }, { "epoch": 0.79, "learning_rate": 2.164516940279846e-06, "loss": 2.2753, "step": 7915 }, { "epoch": 0.79, "learning_rate": 2.1625010647904686e-06, "loss": 2.3234, "step": 7916 }, { "epoch": 0.79, "learning_rate": 2.1604860146485073e-06, "loss": 2.2913, "step": 7917 }, { "epoch": 0.79, "learning_rate": 2.1584717900661623e-06, "loss": 2.3068, "step": 7918 }, { "epoch": 0.79, "learning_rate": 2.156458391255544e-06, "loss": 2.2419, "step": 7919 }, { "epoch": 0.79, "learning_rate": 2.154445818428683e-06, "loss": 2.3257, "step": 7920 }, { "epoch": 0.79, "learning_rate": 2.1524340717975166e-06, "loss": 2.335, "step": 7921 }, { "epoch": 0.79, "learning_rate": 2.150423151573897e-06, "loss": 2.3055, "step": 7922 }, { "epoch": 0.79, "learning_rate": 2.1484130579695883e-06, "loss": 2.3482, "step": 7923 }, { "epoch": 0.79, "learning_rate": 2.14640379119627e-06, "loss": 2.3124, "step": 7924 }, { "epoch": 0.79, "learning_rate": 2.14439535146553e-06, "loss": 2.2828, "step": 7925 }, { "epoch": 0.79, "learning_rate": 2.1423877389888748e-06, "loss": 2.311, "step": 7926 }, { "epoch": 0.79, "learning_rate": 2.1403809539777222e-06, "loss": 2.2413, "step": 7927 }, { "epoch": 0.79, "learning_rate": 2.138374996643394e-06, "loss": 2.2778, "step": 7928 }, { "epoch": 0.79, "learning_rate": 2.1363698671971423e-06, "loss": 2.275, "step": 7929 }, { "epoch": 0.79, "learning_rate": 2.134365565850117e-06, "loss": 2.3871, "step": 7930 }, { "epoch": 0.79, "learning_rate": 2.132362092813387e-06, "loss": 2.2575, "step": 7931 }, { "epoch": 0.79, "learning_rate": 2.130359448297934e-06, "loss": 2.3224, "step": 7932 }, { "epoch": 0.79, "learning_rate": 2.1283576325146503e-06, "loss": 2.2112, "step": 7933 }, { "epoch": 0.79, "learning_rate": 2.1263566456743422e-06, "loss": 2.2479, "step": 7934 }, { "epoch": 0.8, "learning_rate": 2.12435648798773e-06, "loss": 2.2792, "step": 7935 }, { "epoch": 0.8, "learning_rate": 2.1223571596654434e-06, "loss": 2.3486, "step": 7936 }, { "epoch": 0.8, "learning_rate": 2.120358660918025e-06, "loss": 2.3108, "step": 7937 }, { "epoch": 0.8, "learning_rate": 2.1183609919559368e-06, "loss": 2.2681, "step": 7938 }, { "epoch": 0.8, "learning_rate": 2.1163641529895464e-06, "loss": 2.3307, "step": 7939 }, { "epoch": 0.8, "learning_rate": 2.1143681442291344e-06, "loss": 2.3495, "step": 7940 }, { "epoch": 0.8, "learning_rate": 2.112372965884897e-06, "loss": 2.3282, "step": 7941 }, { "epoch": 0.8, "learning_rate": 2.1103786181669408e-06, "loss": 2.3721, "step": 7942 }, { "epoch": 0.8, "learning_rate": 2.108385101285284e-06, "loss": 2.2793, "step": 7943 }, { "epoch": 0.8, "learning_rate": 2.1063924154498626e-06, "loss": 2.2775, "step": 7944 }, { "epoch": 0.8, "learning_rate": 2.1044005608705174e-06, "loss": 2.3766, "step": 7945 }, { "epoch": 0.8, "learning_rate": 2.1024095377570088e-06, "loss": 2.3964, "step": 7946 }, { "epoch": 0.8, "learning_rate": 2.100419346319005e-06, "loss": 2.4288, "step": 7947 }, { "epoch": 0.8, "learning_rate": 2.0984299867660873e-06, "loss": 2.3368, "step": 7948 }, { "epoch": 0.8, "learning_rate": 2.096441459307752e-06, "loss": 2.263, "step": 7949 }, { "epoch": 0.8, "learning_rate": 2.0944537641534045e-06, "loss": 2.216, "step": 7950 }, { "epoch": 0.8, "learning_rate": 2.0924669015123643e-06, "loss": 2.1753, "step": 7951 }, { "epoch": 0.8, "learning_rate": 2.090480871593864e-06, "loss": 2.2626, "step": 7952 }, { "epoch": 0.8, "learning_rate": 2.0884956746070463e-06, "loss": 2.3208, "step": 7953 }, { "epoch": 0.8, "learning_rate": 2.0865113107609668e-06, "loss": 2.3125, "step": 7954 }, { "epoch": 0.8, "learning_rate": 2.0845277802645937e-06, "loss": 2.1703, "step": 7955 }, { "epoch": 0.8, "learning_rate": 2.08254508332681e-06, "loss": 2.1679, "step": 7956 }, { "epoch": 0.8, "learning_rate": 2.0805632201564076e-06, "loss": 2.3568, "step": 7957 }, { "epoch": 0.8, "learning_rate": 2.078582190962091e-06, "loss": 2.3027, "step": 7958 }, { "epoch": 0.8, "learning_rate": 2.0766019959524774e-06, "loss": 2.3053, "step": 7959 }, { "epoch": 0.8, "learning_rate": 2.0746226353360977e-06, "loss": 2.2867, "step": 7960 }, { "epoch": 0.8, "learning_rate": 2.072644109321391e-06, "loss": 2.3535, "step": 7961 }, { "epoch": 0.8, "learning_rate": 2.0706664181167125e-06, "loss": 2.3135, "step": 7962 }, { "epoch": 0.8, "learning_rate": 2.068689561930327e-06, "loss": 2.257, "step": 7963 }, { "epoch": 0.8, "learning_rate": 2.0667135409704097e-06, "loss": 2.2285, "step": 7964 }, { "epoch": 0.8, "learning_rate": 2.064738355445057e-06, "loss": 2.2964, "step": 7965 }, { "epoch": 0.8, "learning_rate": 2.06276400556227e-06, "loss": 2.2195, "step": 7966 }, { "epoch": 0.8, "learning_rate": 2.060790491529957e-06, "loss": 2.2976, "step": 7967 }, { "epoch": 0.8, "learning_rate": 2.0588178135559456e-06, "loss": 2.313, "step": 7968 }, { "epoch": 0.8, "learning_rate": 2.056845971847976e-06, "loss": 2.3813, "step": 7969 }, { "epoch": 0.8, "learning_rate": 2.0548749666136957e-06, "loss": 2.3495, "step": 7970 }, { "epoch": 0.8, "learning_rate": 2.0529047980606676e-06, "loss": 2.4214, "step": 7971 }, { "epoch": 0.8, "learning_rate": 2.0509354663963642e-06, "loss": 2.3173, "step": 7972 }, { "epoch": 0.8, "learning_rate": 2.048966971828169e-06, "loss": 2.367, "step": 7973 }, { "epoch": 0.8, "learning_rate": 2.046999314563385e-06, "loss": 2.2824, "step": 7974 }, { "epoch": 0.8, "learning_rate": 2.045032494809217e-06, "loss": 2.3041, "step": 7975 }, { "epoch": 0.8, "learning_rate": 2.0430665127727867e-06, "loss": 2.2506, "step": 7976 }, { "epoch": 0.8, "learning_rate": 2.041101368661128e-06, "loss": 2.2493, "step": 7977 }, { "epoch": 0.8, "learning_rate": 2.0391370626811835e-06, "loss": 2.2451, "step": 7978 }, { "epoch": 0.8, "learning_rate": 2.03717359503981e-06, "loss": 2.373, "step": 7979 }, { "epoch": 0.8, "learning_rate": 2.035210965943776e-06, "loss": 2.2908, "step": 7980 }, { "epoch": 0.8, "learning_rate": 2.0332491755997595e-06, "loss": 2.273, "step": 7981 }, { "epoch": 0.8, "learning_rate": 2.0312882242143506e-06, "loss": 2.1881, "step": 7982 }, { "epoch": 0.8, "learning_rate": 2.0293281119940565e-06, "loss": 2.3314, "step": 7983 }, { "epoch": 0.8, "learning_rate": 2.0273688391452907e-06, "loss": 2.2979, "step": 7984 }, { "epoch": 0.8, "learning_rate": 2.0254104058743774e-06, "loss": 2.2895, "step": 7985 }, { "epoch": 0.8, "learning_rate": 2.0234528123875554e-06, "loss": 2.2951, "step": 7986 }, { "epoch": 0.8, "learning_rate": 2.0214960588909727e-06, "loss": 2.2883, "step": 7987 }, { "epoch": 0.8, "learning_rate": 2.0195401455906917e-06, "loss": 2.3048, "step": 7988 }, { "epoch": 0.8, "learning_rate": 2.017585072692685e-06, "loss": 2.3239, "step": 7989 }, { "epoch": 0.8, "learning_rate": 2.0156308404028335e-06, "loss": 2.2698, "step": 7990 }, { "epoch": 0.8, "learning_rate": 2.0136774489269363e-06, "loss": 2.2219, "step": 7991 }, { "epoch": 0.8, "learning_rate": 2.011724898470697e-06, "loss": 2.2876, "step": 7992 }, { "epoch": 0.8, "learning_rate": 2.0097731892397364e-06, "loss": 2.4172, "step": 7993 }, { "epoch": 0.8, "learning_rate": 2.007822321439583e-06, "loss": 2.2973, "step": 7994 }, { "epoch": 0.8, "learning_rate": 2.005872295275677e-06, "loss": 2.39, "step": 7995 }, { "epoch": 0.8, "learning_rate": 2.0039231109533718e-06, "loss": 2.2879, "step": 7996 }, { "epoch": 0.8, "learning_rate": 2.0019747686779313e-06, "loss": 2.3233, "step": 7997 }, { "epoch": 0.8, "learning_rate": 2.0000272686545296e-06, "loss": 2.2997, "step": 7998 }, { "epoch": 0.8, "learning_rate": 1.9980806110882533e-06, "loss": 2.3483, "step": 7999 }, { "epoch": 0.8, "learning_rate": 1.9961347961840982e-06, "loss": 2.197, "step": 8000 }, { "epoch": 0.8, "learning_rate": 1.9941898241469783e-06, "loss": 2.3963, "step": 8001 }, { "epoch": 0.8, "learning_rate": 1.9922456951817093e-06, "loss": 2.2526, "step": 8002 }, { "epoch": 0.8, "learning_rate": 1.9903024094930257e-06, "loss": 2.2241, "step": 8003 }, { "epoch": 0.8, "learning_rate": 1.988359967285567e-06, "loss": 2.1566, "step": 8004 }, { "epoch": 0.8, "learning_rate": 1.9864183687638893e-06, "loss": 2.3317, "step": 8005 }, { "epoch": 0.8, "learning_rate": 1.984477614132456e-06, "loss": 2.2746, "step": 8006 }, { "epoch": 0.8, "learning_rate": 1.982537703595644e-06, "loss": 2.3276, "step": 8007 }, { "epoch": 0.8, "learning_rate": 1.9805986373577403e-06, "loss": 2.2765, "step": 8008 }, { "epoch": 0.8, "learning_rate": 1.9786604156229418e-06, "loss": 2.1658, "step": 8009 }, { "epoch": 0.8, "learning_rate": 1.9767230385953595e-06, "loss": 2.3149, "step": 8010 }, { "epoch": 0.8, "learning_rate": 1.974786506479013e-06, "loss": 2.3304, "step": 8011 }, { "epoch": 0.8, "learning_rate": 1.972850819477834e-06, "loss": 2.268, "step": 8012 }, { "epoch": 0.8, "learning_rate": 1.9709159777956632e-06, "loss": 2.3216, "step": 8013 }, { "epoch": 0.8, "learning_rate": 1.9689819816362567e-06, "loss": 2.2767, "step": 8014 }, { "epoch": 0.8, "learning_rate": 1.9670488312032775e-06, "loss": 2.3168, "step": 8015 }, { "epoch": 0.8, "learning_rate": 1.9651165267003002e-06, "loss": 2.36, "step": 8016 }, { "epoch": 0.8, "learning_rate": 1.963185068330812e-06, "loss": 2.35, "step": 8017 }, { "epoch": 0.8, "learning_rate": 1.961254456298206e-06, "loss": 2.2576, "step": 8018 }, { "epoch": 0.8, "learning_rate": 1.9593246908057973e-06, "loss": 2.3319, "step": 8019 }, { "epoch": 0.8, "learning_rate": 1.9573957720568003e-06, "loss": 2.3357, "step": 8020 }, { "epoch": 0.8, "learning_rate": 1.9554677002543452e-06, "loss": 2.3156, "step": 8021 }, { "epoch": 0.8, "learning_rate": 1.953540475601473e-06, "loss": 2.2967, "step": 8022 }, { "epoch": 0.8, "learning_rate": 1.9516140983011344e-06, "loss": 2.3215, "step": 8023 }, { "epoch": 0.8, "learning_rate": 1.9496885685561904e-06, "loss": 2.3016, "step": 8024 }, { "epoch": 0.8, "learning_rate": 1.947763886569416e-06, "loss": 2.2037, "step": 8025 }, { "epoch": 0.8, "learning_rate": 1.945840052543493e-06, "loss": 2.2898, "step": 8026 }, { "epoch": 0.8, "learning_rate": 1.9439170666810124e-06, "loss": 2.3525, "step": 8027 }, { "epoch": 0.8, "learning_rate": 1.9419949291844862e-06, "loss": 2.3243, "step": 8028 }, { "epoch": 0.8, "learning_rate": 1.9400736402563257e-06, "loss": 2.2625, "step": 8029 }, { "epoch": 0.8, "learning_rate": 1.938153200098861e-06, "loss": 2.3043, "step": 8030 }, { "epoch": 0.8, "learning_rate": 1.936233608914322e-06, "loss": 2.3583, "step": 8031 }, { "epoch": 0.8, "learning_rate": 1.9343148669048597e-06, "loss": 2.2206, "step": 8032 }, { "epoch": 0.8, "learning_rate": 1.9323969742725313e-06, "loss": 2.27, "step": 8033 }, { "epoch": 0.8, "learning_rate": 1.9304799312193067e-06, "loss": 2.3587, "step": 8034 }, { "epoch": 0.81, "learning_rate": 1.9285637379470613e-06, "loss": 2.2513, "step": 8035 }, { "epoch": 0.81, "learning_rate": 1.9266483946575897e-06, "loss": 2.2561, "step": 8036 }, { "epoch": 0.81, "learning_rate": 1.924733901552589e-06, "loss": 2.3213, "step": 8037 }, { "epoch": 0.81, "learning_rate": 1.922820258833671e-06, "loss": 2.3398, "step": 8038 }, { "epoch": 0.81, "learning_rate": 1.9209074667023554e-06, "loss": 2.3921, "step": 8039 }, { "epoch": 0.81, "learning_rate": 1.9189955253600732e-06, "loss": 2.2917, "step": 8040 }, { "epoch": 0.81, "learning_rate": 1.9170844350081686e-06, "loss": 2.3422, "step": 8041 }, { "epoch": 0.81, "learning_rate": 1.915174195847891e-06, "loss": 2.3308, "step": 8042 }, { "epoch": 0.81, "learning_rate": 1.913264808080404e-06, "loss": 2.2582, "step": 8043 }, { "epoch": 0.81, "learning_rate": 1.911356271906778e-06, "loss": 2.3463, "step": 8044 }, { "epoch": 0.81, "learning_rate": 1.909448587528001e-06, "loss": 2.3393, "step": 8045 }, { "epoch": 0.81, "learning_rate": 1.907541755144965e-06, "loss": 2.2592, "step": 8046 }, { "epoch": 0.81, "learning_rate": 1.905635774958472e-06, "loss": 2.2254, "step": 8047 }, { "epoch": 0.81, "learning_rate": 1.9037306471692374e-06, "loss": 2.2606, "step": 8048 }, { "epoch": 0.81, "learning_rate": 1.9018263719778851e-06, "loss": 2.3243, "step": 8049 }, { "epoch": 0.81, "learning_rate": 1.899922949584948e-06, "loss": 2.2502, "step": 8050 }, { "epoch": 0.81, "learning_rate": 1.8980203801908737e-06, "loss": 2.2559, "step": 8051 }, { "epoch": 0.81, "learning_rate": 1.896118663996015e-06, "loss": 2.3224, "step": 8052 }, { "epoch": 0.81, "learning_rate": 1.8942178012006374e-06, "loss": 2.3198, "step": 8053 }, { "epoch": 0.81, "learning_rate": 1.8923177920049152e-06, "loss": 2.2878, "step": 8054 }, { "epoch": 0.81, "learning_rate": 1.890418636608935e-06, "loss": 2.3772, "step": 8055 }, { "epoch": 0.81, "learning_rate": 1.8885203352126912e-06, "loss": 2.4019, "step": 8056 }, { "epoch": 0.81, "learning_rate": 1.8866228880160897e-06, "loss": 2.306, "step": 8057 }, { "epoch": 0.81, "learning_rate": 1.8847262952189448e-06, "loss": 2.3069, "step": 8058 }, { "epoch": 0.81, "learning_rate": 1.8828305570209837e-06, "loss": 2.264, "step": 8059 }, { "epoch": 0.81, "learning_rate": 1.880935673621841e-06, "loss": 2.3195, "step": 8060 }, { "epoch": 0.81, "learning_rate": 1.8790416452210613e-06, "loss": 2.3454, "step": 8061 }, { "epoch": 0.81, "learning_rate": 1.8771484720180988e-06, "loss": 2.391, "step": 8062 }, { "epoch": 0.81, "learning_rate": 1.8752561542123226e-06, "loss": 2.3722, "step": 8063 }, { "epoch": 0.81, "learning_rate": 1.873364692003007e-06, "loss": 2.3025, "step": 8064 }, { "epoch": 0.81, "learning_rate": 1.8714740855893364e-06, "loss": 2.2585, "step": 8065 }, { "epoch": 0.81, "learning_rate": 1.8695843351704058e-06, "loss": 2.2749, "step": 8066 }, { "epoch": 0.81, "learning_rate": 1.8676954409452196e-06, "loss": 2.3103, "step": 8067 }, { "epoch": 0.81, "learning_rate": 1.8658074031126927e-06, "loss": 2.2494, "step": 8068 }, { "epoch": 0.81, "learning_rate": 1.86392022187165e-06, "loss": 2.302, "step": 8069 }, { "epoch": 0.81, "learning_rate": 1.8620338974208263e-06, "loss": 2.2978, "step": 8070 }, { "epoch": 0.81, "learning_rate": 1.8601484299588657e-06, "loss": 2.2783, "step": 8071 }, { "epoch": 0.81, "learning_rate": 1.8582638196843207e-06, "loss": 2.3612, "step": 8072 }, { "epoch": 0.81, "learning_rate": 1.8563800667956556e-06, "loss": 2.3019, "step": 8073 }, { "epoch": 0.81, "learning_rate": 1.8544971714912442e-06, "loss": 2.3494, "step": 8074 }, { "epoch": 0.81, "learning_rate": 1.8526151339693689e-06, "loss": 2.2849, "step": 8075 }, { "epoch": 0.81, "learning_rate": 1.8507339544282222e-06, "loss": 2.3526, "step": 8076 }, { "epoch": 0.81, "learning_rate": 1.8488536330659068e-06, "loss": 2.2767, "step": 8077 }, { "epoch": 0.81, "learning_rate": 1.8469741700804355e-06, "loss": 2.1673, "step": 8078 }, { "epoch": 0.81, "learning_rate": 1.8450955656697289e-06, "loss": 2.3544, "step": 8079 }, { "epoch": 0.81, "learning_rate": 1.8432178200316153e-06, "loss": 2.2661, "step": 8080 }, { "epoch": 0.81, "learning_rate": 1.841340933363841e-06, "loss": 2.3007, "step": 8081 }, { "epoch": 0.81, "learning_rate": 1.8394649058640534e-06, "loss": 2.2596, "step": 8082 }, { "epoch": 0.81, "learning_rate": 1.8375897377298124e-06, "loss": 2.2982, "step": 8083 }, { "epoch": 0.81, "learning_rate": 1.8357154291585877e-06, "loss": 2.2507, "step": 8084 }, { "epoch": 0.81, "learning_rate": 1.833841980347757e-06, "loss": 2.2332, "step": 8085 }, { "epoch": 0.81, "learning_rate": 1.83196939149461e-06, "loss": 2.3048, "step": 8086 }, { "epoch": 0.81, "learning_rate": 1.830097662796343e-06, "loss": 2.206, "step": 8087 }, { "epoch": 0.81, "learning_rate": 1.828226794450063e-06, "loss": 2.3345, "step": 8088 }, { "epoch": 0.81, "learning_rate": 1.8263567866527854e-06, "loss": 2.3238, "step": 8089 }, { "epoch": 0.81, "learning_rate": 1.82448763960144e-06, "loss": 2.3144, "step": 8090 }, { "epoch": 0.81, "learning_rate": 1.8226193534928604e-06, "loss": 2.3122, "step": 8091 }, { "epoch": 0.81, "learning_rate": 1.8207519285237896e-06, "loss": 2.3272, "step": 8092 }, { "epoch": 0.81, "learning_rate": 1.8188853648908823e-06, "loss": 2.178, "step": 8093 }, { "epoch": 0.81, "learning_rate": 1.8170196627907045e-06, "loss": 2.3176, "step": 8094 }, { "epoch": 0.81, "learning_rate": 1.8151548224197224e-06, "loss": 2.2716, "step": 8095 }, { "epoch": 0.81, "learning_rate": 1.8132908439743225e-06, "loss": 2.2076, "step": 8096 }, { "epoch": 0.81, "learning_rate": 1.811427727650793e-06, "loss": 2.4146, "step": 8097 }, { "epoch": 0.81, "learning_rate": 1.8095654736453328e-06, "loss": 2.3726, "step": 8098 }, { "epoch": 0.81, "learning_rate": 1.807704082154057e-06, "loss": 2.2102, "step": 8099 }, { "epoch": 0.81, "learning_rate": 1.8058435533729802e-06, "loss": 2.3513, "step": 8100 }, { "epoch": 0.81, "learning_rate": 1.803983887498031e-06, "loss": 2.2137, "step": 8101 }, { "epoch": 0.81, "learning_rate": 1.802125084725046e-06, "loss": 2.2897, "step": 8102 }, { "epoch": 0.81, "learning_rate": 1.80026714524977e-06, "loss": 2.2827, "step": 8103 }, { "epoch": 0.81, "learning_rate": 1.7984100692678596e-06, "loss": 2.2354, "step": 8104 }, { "epoch": 0.81, "learning_rate": 1.7965538569748775e-06, "loss": 2.267, "step": 8105 }, { "epoch": 0.81, "learning_rate": 1.794698508566297e-06, "loss": 2.3112, "step": 8106 }, { "epoch": 0.81, "learning_rate": 1.792844024237499e-06, "loss": 2.2855, "step": 8107 }, { "epoch": 0.81, "learning_rate": 1.7909904041837778e-06, "loss": 2.2792, "step": 8108 }, { "epoch": 0.81, "learning_rate": 1.789137648600332e-06, "loss": 2.2946, "step": 8109 }, { "epoch": 0.81, "learning_rate": 1.78728575768227e-06, "loss": 2.2036, "step": 8110 }, { "epoch": 0.81, "learning_rate": 1.7854347316246112e-06, "loss": 2.296, "step": 8111 }, { "epoch": 0.81, "learning_rate": 1.783584570622281e-06, "loss": 2.4085, "step": 8112 }, { "epoch": 0.81, "learning_rate": 1.7817352748701155e-06, "loss": 2.2467, "step": 8113 }, { "epoch": 0.81, "learning_rate": 1.7798868445628604e-06, "loss": 2.3038, "step": 8114 }, { "epoch": 0.81, "learning_rate": 1.7780392798951684e-06, "loss": 2.3398, "step": 8115 }, { "epoch": 0.81, "learning_rate": 1.776192581061602e-06, "loss": 2.305, "step": 8116 }, { "epoch": 0.81, "learning_rate": 1.7743467482566335e-06, "loss": 2.3505, "step": 8117 }, { "epoch": 0.81, "learning_rate": 1.7725017816746403e-06, "loss": 2.3189, "step": 8118 }, { "epoch": 0.81, "learning_rate": 1.7706576815099142e-06, "loss": 2.3199, "step": 8119 }, { "epoch": 0.81, "learning_rate": 1.7688144479566516e-06, "loss": 2.2476, "step": 8120 }, { "epoch": 0.81, "learning_rate": 1.7669720812089576e-06, "loss": 2.275, "step": 8121 }, { "epoch": 0.81, "learning_rate": 1.7651305814608487e-06, "loss": 2.3306, "step": 8122 }, { "epoch": 0.81, "learning_rate": 1.7632899489062493e-06, "loss": 2.2944, "step": 8123 }, { "epoch": 0.81, "learning_rate": 1.7614501837389897e-06, "loss": 2.2495, "step": 8124 }, { "epoch": 0.81, "learning_rate": 1.7596112861528104e-06, "loss": 2.2722, "step": 8125 }, { "epoch": 0.81, "learning_rate": 1.7577732563413641e-06, "loss": 2.3186, "step": 8126 }, { "epoch": 0.81, "learning_rate": 1.7559360944982085e-06, "loss": 2.2654, "step": 8127 }, { "epoch": 0.81, "learning_rate": 1.7540998008168097e-06, "loss": 2.4137, "step": 8128 }, { "epoch": 0.81, "learning_rate": 1.7522643754905432e-06, "loss": 2.4183, "step": 8129 }, { "epoch": 0.81, "learning_rate": 1.7504298187126933e-06, "loss": 2.2771, "step": 8130 }, { "epoch": 0.81, "learning_rate": 1.7485961306764532e-06, "loss": 2.23, "step": 8131 }, { "epoch": 0.81, "learning_rate": 1.7467633115749217e-06, "loss": 2.2675, "step": 8132 }, { "epoch": 0.81, "learning_rate": 1.744931361601111e-06, "loss": 2.3394, "step": 8133 }, { "epoch": 0.81, "learning_rate": 1.7431002809479381e-06, "loss": 2.2839, "step": 8134 }, { "epoch": 0.82, "learning_rate": 1.7412700698082296e-06, "loss": 2.3033, "step": 8135 }, { "epoch": 0.82, "learning_rate": 1.7394407283747195e-06, "loss": 2.266, "step": 8136 }, { "epoch": 0.82, "learning_rate": 1.7376122568400533e-06, "loss": 2.1441, "step": 8137 }, { "epoch": 0.82, "learning_rate": 1.7357846553967806e-06, "loss": 2.2868, "step": 8138 }, { "epoch": 0.82, "learning_rate": 1.7339579242373626e-06, "loss": 2.325, "step": 8139 }, { "epoch": 0.82, "learning_rate": 1.7321320635541684e-06, "loss": 2.2978, "step": 8140 }, { "epoch": 0.82, "learning_rate": 1.7303070735394733e-06, "loss": 2.3389, "step": 8141 }, { "epoch": 0.82, "learning_rate": 1.7284829543854631e-06, "loss": 2.2134, "step": 8142 }, { "epoch": 0.82, "learning_rate": 1.7266597062842294e-06, "loss": 2.1718, "step": 8143 }, { "epoch": 0.82, "learning_rate": 1.7248373294277787e-06, "loss": 2.3005, "step": 8144 }, { "epoch": 0.82, "learning_rate": 1.7230158240080175e-06, "loss": 2.2355, "step": 8145 }, { "epoch": 0.82, "learning_rate": 1.7211951902167645e-06, "loss": 2.4, "step": 8146 }, { "epoch": 0.82, "learning_rate": 1.7193754282457465e-06, "loss": 2.2798, "step": 8147 }, { "epoch": 0.82, "learning_rate": 1.7175565382865978e-06, "loss": 2.2931, "step": 8148 }, { "epoch": 0.82, "learning_rate": 1.7157385205308609e-06, "loss": 2.3413, "step": 8149 }, { "epoch": 0.82, "learning_rate": 1.7139213751699867e-06, "loss": 2.3338, "step": 8150 }, { "epoch": 0.82, "learning_rate": 1.712105102395335e-06, "loss": 2.3616, "step": 8151 }, { "epoch": 0.82, "learning_rate": 1.710289702398169e-06, "loss": 2.3249, "step": 8152 }, { "epoch": 0.82, "learning_rate": 1.7084751753696705e-06, "loss": 2.2638, "step": 8153 }, { "epoch": 0.82, "learning_rate": 1.7066615215009196e-06, "loss": 2.2506, "step": 8154 }, { "epoch": 0.82, "learning_rate": 1.7048487409829074e-06, "loss": 2.1996, "step": 8155 }, { "epoch": 0.82, "learning_rate": 1.703036834006534e-06, "loss": 2.3021, "step": 8156 }, { "epoch": 0.82, "learning_rate": 1.701225800762606e-06, "loss": 2.2324, "step": 8157 }, { "epoch": 0.82, "learning_rate": 1.6994156414418417e-06, "loss": 2.3655, "step": 8158 }, { "epoch": 0.82, "learning_rate": 1.6976063562348598e-06, "loss": 2.2547, "step": 8159 }, { "epoch": 0.82, "learning_rate": 1.6957979453321938e-06, "loss": 2.3672, "step": 8160 }, { "epoch": 0.82, "learning_rate": 1.6939904089242797e-06, "loss": 2.2901, "step": 8161 }, { "epoch": 0.82, "learning_rate": 1.6921837472014713e-06, "loss": 2.1819, "step": 8162 }, { "epoch": 0.82, "learning_rate": 1.6903779603540194e-06, "loss": 2.2287, "step": 8163 }, { "epoch": 0.82, "learning_rate": 1.6885730485720874e-06, "loss": 2.3461, "step": 8164 }, { "epoch": 0.82, "learning_rate": 1.6867690120457458e-06, "loss": 2.292, "step": 8165 }, { "epoch": 0.82, "learning_rate": 1.6849658509649746e-06, "loss": 2.2637, "step": 8166 }, { "epoch": 0.82, "learning_rate": 1.6831635655196588e-06, "loss": 2.2462, "step": 8167 }, { "epoch": 0.82, "learning_rate": 1.681362155899593e-06, "loss": 2.4388, "step": 8168 }, { "epoch": 0.82, "learning_rate": 1.679561622294479e-06, "loss": 2.3829, "step": 8169 }, { "epoch": 0.82, "learning_rate": 1.6777619648939248e-06, "loss": 2.4338, "step": 8170 }, { "epoch": 0.82, "learning_rate": 1.6759631838874513e-06, "loss": 2.2472, "step": 8171 }, { "epoch": 0.82, "learning_rate": 1.6741652794644825e-06, "loss": 2.2969, "step": 8172 }, { "epoch": 0.82, "learning_rate": 1.6723682518143502e-06, "loss": 2.2216, "step": 8173 }, { "epoch": 0.82, "learning_rate": 1.6705721011262954e-06, "loss": 2.3358, "step": 8174 }, { "epoch": 0.82, "learning_rate": 1.6687768275894667e-06, "loss": 2.4153, "step": 8175 }, { "epoch": 0.82, "learning_rate": 1.6669824313929195e-06, "loss": 2.2184, "step": 8176 }, { "epoch": 0.82, "learning_rate": 1.665188912725616e-06, "loss": 2.3036, "step": 8177 }, { "epoch": 0.82, "learning_rate": 1.6633962717764295e-06, "loss": 2.3147, "step": 8178 }, { "epoch": 0.82, "learning_rate": 1.6616045087341359e-06, "loss": 2.4021, "step": 8179 }, { "epoch": 0.82, "learning_rate": 1.659813623787424e-06, "loss": 2.3313, "step": 8180 }, { "epoch": 0.82, "learning_rate": 1.6580236171248853e-06, "loss": 2.3613, "step": 8181 }, { "epoch": 0.82, "learning_rate": 1.6562344889350224e-06, "loss": 2.3067, "step": 8182 }, { "epoch": 0.82, "learning_rate": 1.6544462394062422e-06, "loss": 2.22, "step": 8183 }, { "epoch": 0.82, "learning_rate": 1.6526588687268618e-06, "loss": 2.2018, "step": 8184 }, { "epoch": 0.82, "learning_rate": 1.6508723770851054e-06, "loss": 2.3079, "step": 8185 }, { "epoch": 0.82, "learning_rate": 1.6490867646691034e-06, "loss": 2.3688, "step": 8186 }, { "epoch": 0.82, "learning_rate": 1.6473020316668942e-06, "loss": 2.2471, "step": 8187 }, { "epoch": 0.82, "learning_rate": 1.6455181782664199e-06, "loss": 2.2718, "step": 8188 }, { "epoch": 0.82, "learning_rate": 1.643735204655541e-06, "loss": 2.2399, "step": 8189 }, { "epoch": 0.82, "learning_rate": 1.6419531110220133e-06, "loss": 2.2437, "step": 8190 }, { "epoch": 0.82, "learning_rate": 1.6401718975535053e-06, "loss": 2.285, "step": 8191 }, { "epoch": 0.82, "learning_rate": 1.6383915644375924e-06, "loss": 2.3227, "step": 8192 }, { "epoch": 0.82, "learning_rate": 1.6366121118617583e-06, "loss": 2.202, "step": 8193 }, { "epoch": 0.82, "learning_rate": 1.6348335400133896e-06, "loss": 2.3446, "step": 8194 }, { "epoch": 0.82, "learning_rate": 1.6330558490797866e-06, "loss": 2.3185, "step": 8195 }, { "epoch": 0.82, "learning_rate": 1.6312790392481504e-06, "loss": 2.2643, "step": 8196 }, { "epoch": 0.82, "learning_rate": 1.6295031107055925e-06, "loss": 2.4039, "step": 8197 }, { "epoch": 0.82, "learning_rate": 1.627728063639138e-06, "loss": 2.2641, "step": 8198 }, { "epoch": 0.82, "learning_rate": 1.6259538982357037e-06, "loss": 2.3031, "step": 8199 }, { "epoch": 0.82, "learning_rate": 1.6241806146821282e-06, "loss": 2.1904, "step": 8200 }, { "epoch": 0.82, "learning_rate": 1.6224082131651487e-06, "loss": 2.2777, "step": 8201 }, { "epoch": 0.82, "learning_rate": 1.6206366938714135e-06, "loss": 2.1993, "step": 8202 }, { "epoch": 0.82, "learning_rate": 1.618866056987477e-06, "loss": 2.1519, "step": 8203 }, { "epoch": 0.82, "learning_rate": 1.6170963026997999e-06, "loss": 2.3757, "step": 8204 }, { "epoch": 0.82, "learning_rate": 1.6153274311947486e-06, "loss": 2.2381, "step": 8205 }, { "epoch": 0.82, "learning_rate": 1.6135594426586043e-06, "loss": 2.3014, "step": 8206 }, { "epoch": 0.82, "learning_rate": 1.6117923372775456e-06, "loss": 2.3323, "step": 8207 }, { "epoch": 0.82, "learning_rate": 1.6100261152376618e-06, "loss": 2.3896, "step": 8208 }, { "epoch": 0.82, "learning_rate": 1.6082607767249515e-06, "loss": 2.2688, "step": 8209 }, { "epoch": 0.82, "learning_rate": 1.606496321925315e-06, "loss": 2.2372, "step": 8210 }, { "epoch": 0.82, "learning_rate": 1.6047327510245648e-06, "loss": 2.3984, "step": 8211 }, { "epoch": 0.82, "learning_rate": 1.6029700642084177e-06, "loss": 2.3464, "step": 8212 }, { "epoch": 0.82, "learning_rate": 1.601208261662498e-06, "loss": 2.2033, "step": 8213 }, { "epoch": 0.82, "learning_rate": 1.5994473435723334e-06, "loss": 2.3661, "step": 8214 }, { "epoch": 0.82, "learning_rate": 1.5976873101233681e-06, "loss": 2.2242, "step": 8215 }, { "epoch": 0.82, "learning_rate": 1.5959281615009425e-06, "loss": 2.3021, "step": 8216 }, { "epoch": 0.82, "learning_rate": 1.5941698978903096e-06, "loss": 2.3128, "step": 8217 }, { "epoch": 0.82, "learning_rate": 1.5924125194766271e-06, "loss": 2.2718, "step": 8218 }, { "epoch": 0.82, "learning_rate": 1.590656026444961e-06, "loss": 2.2458, "step": 8219 }, { "epoch": 0.82, "learning_rate": 1.5889004189802814e-06, "loss": 2.3139, "step": 8220 }, { "epoch": 0.82, "learning_rate": 1.5871456972674692e-06, "loss": 2.3377, "step": 8221 }, { "epoch": 0.82, "learning_rate": 1.58539186149131e-06, "loss": 2.2439, "step": 8222 }, { "epoch": 0.82, "learning_rate": 1.5836389118364903e-06, "loss": 2.1956, "step": 8223 }, { "epoch": 0.82, "learning_rate": 1.5818868484876159e-06, "loss": 2.261, "step": 8224 }, { "epoch": 0.82, "learning_rate": 1.5801356716291882e-06, "loss": 2.2496, "step": 8225 }, { "epoch": 0.82, "learning_rate": 1.5783853814456207e-06, "loss": 2.3937, "step": 8226 }, { "epoch": 0.82, "learning_rate": 1.5766359781212326e-06, "loss": 2.2856, "step": 8227 }, { "epoch": 0.82, "learning_rate": 1.5748874618402477e-06, "loss": 2.3156, "step": 8228 }, { "epoch": 0.82, "learning_rate": 1.5731398327867986e-06, "loss": 2.2554, "step": 8229 }, { "epoch": 0.82, "learning_rate": 1.5713930911449239e-06, "loss": 2.209, "step": 8230 }, { "epoch": 0.82, "learning_rate": 1.5696472370985672e-06, "loss": 2.2905, "step": 8231 }, { "epoch": 0.82, "learning_rate": 1.5679022708315806e-06, "loss": 2.3033, "step": 8232 }, { "epoch": 0.82, "learning_rate": 1.5661581925277237e-06, "loss": 2.3793, "step": 8233 }, { "epoch": 0.82, "learning_rate": 1.5644150023706606e-06, "loss": 2.2973, "step": 8234 }, { "epoch": 0.83, "learning_rate": 1.5626727005439624e-06, "loss": 2.2208, "step": 8235 }, { "epoch": 0.83, "learning_rate": 1.5609312872311045e-06, "loss": 2.2682, "step": 8236 }, { "epoch": 0.83, "learning_rate": 1.5591907626154734e-06, "loss": 2.3092, "step": 8237 }, { "epoch": 0.83, "learning_rate": 1.5574511268803572e-06, "loss": 2.4966, "step": 8238 }, { "epoch": 0.83, "learning_rate": 1.5557123802089546e-06, "loss": 2.3691, "step": 8239 }, { "epoch": 0.83, "learning_rate": 1.5539745227843673e-06, "loss": 2.2758, "step": 8240 }, { "epoch": 0.83, "learning_rate": 1.5522375547896041e-06, "loss": 2.2776, "step": 8241 }, { "epoch": 0.83, "learning_rate": 1.5505014764075832e-06, "loss": 2.3278, "step": 8242 }, { "epoch": 0.83, "learning_rate": 1.548766287821124e-06, "loss": 2.2917, "step": 8243 }, { "epoch": 0.83, "learning_rate": 1.547031989212957e-06, "loss": 2.2506, "step": 8244 }, { "epoch": 0.83, "learning_rate": 1.545298580765715e-06, "loss": 2.2844, "step": 8245 }, { "epoch": 0.83, "learning_rate": 1.5435660626619408e-06, "loss": 2.1539, "step": 8246 }, { "epoch": 0.83, "learning_rate": 1.5418344350840798e-06, "loss": 2.2891, "step": 8247 }, { "epoch": 0.83, "learning_rate": 1.5401036982144856e-06, "loss": 2.3413, "step": 8248 }, { "epoch": 0.83, "learning_rate": 1.5383738522354197e-06, "loss": 2.3117, "step": 8249 }, { "epoch": 0.83, "learning_rate": 1.5366448973290437e-06, "loss": 2.2446, "step": 8250 }, { "epoch": 0.83, "learning_rate": 1.5349168336774346e-06, "loss": 2.267, "step": 8251 }, { "epoch": 0.83, "learning_rate": 1.5331896614625675e-06, "loss": 2.3115, "step": 8252 }, { "epoch": 0.83, "learning_rate": 1.531463380866327e-06, "loss": 2.3048, "step": 8253 }, { "epoch": 0.83, "learning_rate": 1.5297379920705046e-06, "loss": 2.3441, "step": 8254 }, { "epoch": 0.83, "learning_rate": 1.528013495256796e-06, "loss": 2.2338, "step": 8255 }, { "epoch": 0.83, "learning_rate": 1.5262898906068024e-06, "loss": 2.2697, "step": 8256 }, { "epoch": 0.83, "learning_rate": 1.5245671783020332e-06, "loss": 2.3333, "step": 8257 }, { "epoch": 0.83, "learning_rate": 1.5228453585239033e-06, "loss": 2.3588, "step": 8258 }, { "epoch": 0.83, "learning_rate": 1.521124431453731e-06, "loss": 2.3269, "step": 8259 }, { "epoch": 0.83, "learning_rate": 1.5194043972727467e-06, "loss": 2.2783, "step": 8260 }, { "epoch": 0.83, "learning_rate": 1.5176852561620835e-06, "loss": 2.2104, "step": 8261 }, { "epoch": 0.83, "learning_rate": 1.5159670083027744e-06, "loss": 2.2848, "step": 8262 }, { "epoch": 0.83, "learning_rate": 1.5142496538757678e-06, "loss": 2.3154, "step": 8263 }, { "epoch": 0.83, "learning_rate": 1.5125331930619113e-06, "loss": 2.3102, "step": 8264 }, { "epoch": 0.83, "learning_rate": 1.510817626041964e-06, "loss": 2.2542, "step": 8265 }, { "epoch": 0.83, "learning_rate": 1.5091029529965861e-06, "loss": 2.3013, "step": 8266 }, { "epoch": 0.83, "learning_rate": 1.5073891741063461e-06, "loss": 2.2873, "step": 8267 }, { "epoch": 0.83, "learning_rate": 1.5056762895517152e-06, "loss": 2.3573, "step": 8268 }, { "epoch": 0.83, "learning_rate": 1.5039642995130787e-06, "loss": 2.2826, "step": 8269 }, { "epoch": 0.83, "learning_rate": 1.5022532041707183e-06, "loss": 2.3598, "step": 8270 }, { "epoch": 0.83, "learning_rate": 1.5005430037048251e-06, "loss": 2.2366, "step": 8271 }, { "epoch": 0.83, "learning_rate": 1.4988336982954976e-06, "loss": 2.3638, "step": 8272 }, { "epoch": 0.83, "learning_rate": 1.4971252881227373e-06, "loss": 2.3359, "step": 8273 }, { "epoch": 0.83, "learning_rate": 1.4954177733664522e-06, "loss": 2.4158, "step": 8274 }, { "epoch": 0.83, "learning_rate": 1.4937111542064575e-06, "loss": 2.2477, "step": 8275 }, { "epoch": 0.83, "learning_rate": 1.4920054308224718e-06, "loss": 2.3119, "step": 8276 }, { "epoch": 0.83, "learning_rate": 1.4903006033941203e-06, "loss": 2.2898, "step": 8277 }, { "epoch": 0.83, "learning_rate": 1.4885966721009359e-06, "loss": 2.2589, "step": 8278 }, { "epoch": 0.83, "learning_rate": 1.4868936371223552e-06, "loss": 2.3643, "step": 8279 }, { "epoch": 0.83, "learning_rate": 1.4851914986377204e-06, "loss": 2.236, "step": 8280 }, { "epoch": 0.83, "learning_rate": 1.4834902568262788e-06, "loss": 2.3419, "step": 8281 }, { "epoch": 0.83, "learning_rate": 1.4817899118671842e-06, "loss": 2.3232, "step": 8282 }, { "epoch": 0.83, "learning_rate": 1.4800904639394943e-06, "loss": 2.2169, "step": 8283 }, { "epoch": 0.83, "learning_rate": 1.4783919132221758e-06, "loss": 2.2469, "step": 8284 }, { "epoch": 0.83, "learning_rate": 1.4766942598940981e-06, "loss": 2.2294, "step": 8285 }, { "epoch": 0.83, "learning_rate": 1.474997504134037e-06, "loss": 2.2873, "step": 8286 }, { "epoch": 0.83, "learning_rate": 1.4733016461206727e-06, "loss": 2.2162, "step": 8287 }, { "epoch": 0.83, "learning_rate": 1.471606686032593e-06, "loss": 2.3421, "step": 8288 }, { "epoch": 0.83, "learning_rate": 1.4699126240482887e-06, "loss": 2.2714, "step": 8289 }, { "epoch": 0.83, "learning_rate": 1.4682194603461585e-06, "loss": 2.2687, "step": 8290 }, { "epoch": 0.83, "learning_rate": 1.4665271951045045e-06, "loss": 2.2586, "step": 8291 }, { "epoch": 0.83, "learning_rate": 1.464835828501534e-06, "loss": 2.2232, "step": 8292 }, { "epoch": 0.83, "learning_rate": 1.4631453607153623e-06, "loss": 2.293, "step": 8293 }, { "epoch": 0.83, "learning_rate": 1.461455791924008e-06, "loss": 2.2509, "step": 8294 }, { "epoch": 0.83, "learning_rate": 1.4597671223053922e-06, "loss": 2.3152, "step": 8295 }, { "epoch": 0.83, "learning_rate": 1.4580793520373492e-06, "loss": 2.1909, "step": 8296 }, { "epoch": 0.83, "learning_rate": 1.4563924812976127e-06, "loss": 2.3397, "step": 8297 }, { "epoch": 0.83, "learning_rate": 1.4547065102638215e-06, "loss": 2.2438, "step": 8298 }, { "epoch": 0.83, "learning_rate": 1.453021439113521e-06, "loss": 2.3056, "step": 8299 }, { "epoch": 0.83, "learning_rate": 1.4513372680241634e-06, "loss": 2.3027, "step": 8300 }, { "epoch": 0.83, "learning_rate": 1.4496539971731028e-06, "loss": 2.3055, "step": 8301 }, { "epoch": 0.83, "learning_rate": 1.4479716267376022e-06, "loss": 2.2283, "step": 8302 }, { "epoch": 0.83, "learning_rate": 1.4462901568948252e-06, "loss": 2.1713, "step": 8303 }, { "epoch": 0.83, "learning_rate": 1.4446095878218448e-06, "loss": 2.4129, "step": 8304 }, { "epoch": 0.83, "learning_rate": 1.442929919695638e-06, "loss": 2.2603, "step": 8305 }, { "epoch": 0.83, "learning_rate": 1.441251152693085e-06, "loss": 2.3733, "step": 8306 }, { "epoch": 0.83, "learning_rate": 1.439573286990974e-06, "loss": 2.2943, "step": 8307 }, { "epoch": 0.83, "learning_rate": 1.4378963227659959e-06, "loss": 2.4018, "step": 8308 }, { "epoch": 0.83, "learning_rate": 1.4362202601947472e-06, "loss": 2.2683, "step": 8309 }, { "epoch": 0.83, "learning_rate": 1.4345450994537314e-06, "loss": 2.2948, "step": 8310 }, { "epoch": 0.83, "learning_rate": 1.4328708407193548e-06, "loss": 2.3476, "step": 8311 }, { "epoch": 0.83, "learning_rate": 1.4311974841679289e-06, "loss": 2.3407, "step": 8312 }, { "epoch": 0.83, "learning_rate": 1.429525029975668e-06, "loss": 2.2676, "step": 8313 }, { "epoch": 0.83, "learning_rate": 1.4278534783187003e-06, "loss": 2.2416, "step": 8314 }, { "epoch": 0.83, "learning_rate": 1.4261828293730495e-06, "loss": 2.3505, "step": 8315 }, { "epoch": 0.83, "learning_rate": 1.424513083314647e-06, "loss": 2.3042, "step": 8316 }, { "epoch": 0.83, "learning_rate": 1.4228442403193299e-06, "loss": 2.2869, "step": 8317 }, { "epoch": 0.83, "learning_rate": 1.4211763005628399e-06, "loss": 2.2775, "step": 8318 }, { "epoch": 0.83, "learning_rate": 1.419509264220824e-06, "loss": 2.4084, "step": 8319 }, { "epoch": 0.83, "learning_rate": 1.4178431314688334e-06, "loss": 2.2967, "step": 8320 }, { "epoch": 0.83, "learning_rate": 1.416177902482324e-06, "loss": 2.1966, "step": 8321 }, { "epoch": 0.83, "learning_rate": 1.4145135774366558e-06, "loss": 2.3974, "step": 8322 }, { "epoch": 0.83, "learning_rate": 1.4128501565070973e-06, "loss": 2.3805, "step": 8323 }, { "epoch": 0.83, "learning_rate": 1.4111876398688196e-06, "loss": 2.276, "step": 8324 }, { "epoch": 0.83, "learning_rate": 1.4095260276968969e-06, "loss": 2.2365, "step": 8325 }, { "epoch": 0.83, "learning_rate": 1.4078653201663084e-06, "loss": 2.2687, "step": 8326 }, { "epoch": 0.83, "learning_rate": 1.4062055174519384e-06, "loss": 2.2473, "step": 8327 }, { "epoch": 0.83, "learning_rate": 1.4045466197285795e-06, "loss": 2.2726, "step": 8328 }, { "epoch": 0.83, "learning_rate": 1.402888627170923e-06, "loss": 2.3627, "step": 8329 }, { "epoch": 0.83, "learning_rate": 1.4012315399535704e-06, "loss": 2.1628, "step": 8330 }, { "epoch": 0.83, "learning_rate": 1.399575358251022e-06, "loss": 2.3538, "step": 8331 }, { "epoch": 0.83, "learning_rate": 1.3979200822376904e-06, "loss": 2.3123, "step": 8332 }, { "epoch": 0.83, "learning_rate": 1.3962657120878875e-06, "loss": 2.3013, "step": 8333 }, { "epoch": 0.83, "learning_rate": 1.3946122479758294e-06, "loss": 2.3263, "step": 8334 }, { "epoch": 0.84, "learning_rate": 1.3929596900756393e-06, "loss": 2.2554, "step": 8335 }, { "epoch": 0.84, "learning_rate": 1.3913080385613443e-06, "loss": 2.2533, "step": 8336 }, { "epoch": 0.84, "learning_rate": 1.3896572936068741e-06, "loss": 2.1919, "step": 8337 }, { "epoch": 0.84, "learning_rate": 1.3880074553860667e-06, "loss": 2.2865, "step": 8338 }, { "epoch": 0.84, "learning_rate": 1.3863585240726607e-06, "loss": 2.3949, "step": 8339 }, { "epoch": 0.84, "learning_rate": 1.3847104998402994e-06, "loss": 2.2573, "step": 8340 }, { "epoch": 0.84, "learning_rate": 1.383063382862536e-06, "loss": 2.2288, "step": 8341 }, { "epoch": 0.84, "learning_rate": 1.3814171733128224e-06, "loss": 2.3332, "step": 8342 }, { "epoch": 0.84, "learning_rate": 1.3797718713645169e-06, "loss": 2.253, "step": 8343 }, { "epoch": 0.84, "learning_rate": 1.3781274771908825e-06, "loss": 2.2651, "step": 8344 }, { "epoch": 0.84, "learning_rate": 1.3764839909650863e-06, "loss": 2.2587, "step": 8345 }, { "epoch": 0.84, "learning_rate": 1.3748414128601984e-06, "loss": 2.1853, "step": 8346 }, { "epoch": 0.84, "learning_rate": 1.373199743049195e-06, "loss": 2.2501, "step": 8347 }, { "epoch": 0.84, "learning_rate": 1.3715589817049579e-06, "loss": 2.246, "step": 8348 }, { "epoch": 0.84, "learning_rate": 1.36991912900027e-06, "loss": 2.349, "step": 8349 }, { "epoch": 0.84, "learning_rate": 1.3682801851078208e-06, "loss": 2.3203, "step": 8350 }, { "epoch": 0.84, "learning_rate": 1.3666421502002026e-06, "loss": 2.2871, "step": 8351 }, { "epoch": 0.84, "learning_rate": 1.3650050244499135e-06, "loss": 2.2987, "step": 8352 }, { "epoch": 0.84, "learning_rate": 1.3633688080293538e-06, "loss": 2.2066, "step": 8353 }, { "epoch": 0.84, "learning_rate": 1.3617335011108312e-06, "loss": 2.3461, "step": 8354 }, { "epoch": 0.84, "learning_rate": 1.3600991038665557e-06, "loss": 2.2472, "step": 8355 }, { "epoch": 0.84, "learning_rate": 1.3584656164686394e-06, "loss": 2.2732, "step": 8356 }, { "epoch": 0.84, "learning_rate": 1.3568330390891038e-06, "loss": 2.2162, "step": 8357 }, { "epoch": 0.84, "learning_rate": 1.3552013718998668e-06, "loss": 2.2865, "step": 8358 }, { "epoch": 0.84, "learning_rate": 1.3535706150727602e-06, "loss": 2.2719, "step": 8359 }, { "epoch": 0.84, "learning_rate": 1.3519407687795138e-06, "loss": 2.3205, "step": 8360 }, { "epoch": 0.84, "learning_rate": 1.350311833191762e-06, "loss": 2.4112, "step": 8361 }, { "epoch": 0.84, "learning_rate": 1.3486838084810438e-06, "loss": 2.2519, "step": 8362 }, { "epoch": 0.84, "learning_rate": 1.3470566948188024e-06, "loss": 2.4025, "step": 8363 }, { "epoch": 0.84, "learning_rate": 1.345430492376385e-06, "loss": 2.3325, "step": 8364 }, { "epoch": 0.84, "learning_rate": 1.3438052013250435e-06, "loss": 2.3376, "step": 8365 }, { "epoch": 0.84, "learning_rate": 1.3421808218359322e-06, "loss": 2.3053, "step": 8366 }, { "epoch": 0.84, "learning_rate": 1.340557354080111e-06, "loss": 2.2249, "step": 8367 }, { "epoch": 0.84, "learning_rate": 1.338934798228544e-06, "loss": 2.2367, "step": 8368 }, { "epoch": 0.84, "learning_rate": 1.3373131544520979e-06, "loss": 2.2662, "step": 8369 }, { "epoch": 0.84, "learning_rate": 1.3356924229215429e-06, "loss": 2.3501, "step": 8370 }, { "epoch": 0.84, "learning_rate": 1.3340726038075558e-06, "loss": 2.2274, "step": 8371 }, { "epoch": 0.84, "learning_rate": 1.3324536972807146e-06, "loss": 2.2361, "step": 8372 }, { "epoch": 0.84, "learning_rate": 1.3308357035115027e-06, "loss": 2.2813, "step": 8373 }, { "epoch": 0.84, "learning_rate": 1.3292186226703075e-06, "loss": 2.1646, "step": 8374 }, { "epoch": 0.84, "learning_rate": 1.3276024549274157e-06, "loss": 2.2948, "step": 8375 }, { "epoch": 0.84, "learning_rate": 1.3259872004530295e-06, "loss": 2.3685, "step": 8376 }, { "epoch": 0.84, "learning_rate": 1.3243728594172422e-06, "loss": 2.243, "step": 8377 }, { "epoch": 0.84, "learning_rate": 1.3227594319900572e-06, "loss": 2.3582, "step": 8378 }, { "epoch": 0.84, "learning_rate": 1.3211469183413794e-06, "loss": 2.2607, "step": 8379 }, { "epoch": 0.84, "learning_rate": 1.319535318641021e-06, "loss": 2.3644, "step": 8380 }, { "epoch": 0.84, "learning_rate": 1.3179246330586937e-06, "loss": 2.365, "step": 8381 }, { "epoch": 0.84, "learning_rate": 1.3163148617640142e-06, "loss": 2.2331, "step": 8382 }, { "epoch": 0.84, "learning_rate": 1.3147060049265059e-06, "loss": 2.3164, "step": 8383 }, { "epoch": 0.84, "learning_rate": 1.3130980627155886e-06, "loss": 2.2925, "step": 8384 }, { "epoch": 0.84, "learning_rate": 1.3114910353005972e-06, "loss": 2.3212, "step": 8385 }, { "epoch": 0.84, "learning_rate": 1.3098849228507594e-06, "loss": 2.3889, "step": 8386 }, { "epoch": 0.84, "learning_rate": 1.308279725535213e-06, "loss": 2.3845, "step": 8387 }, { "epoch": 0.84, "learning_rate": 1.3066754435229968e-06, "loss": 2.308, "step": 8388 }, { "epoch": 0.84, "learning_rate": 1.305072076983055e-06, "loss": 2.268, "step": 8389 }, { "epoch": 0.84, "learning_rate": 1.3034696260842305e-06, "loss": 2.2993, "step": 8390 }, { "epoch": 0.84, "learning_rate": 1.3018680909952752e-06, "loss": 2.3891, "step": 8391 }, { "epoch": 0.84, "learning_rate": 1.300267471884843e-06, "loss": 2.2765, "step": 8392 }, { "epoch": 0.84, "learning_rate": 1.2986677689214888e-06, "loss": 2.3414, "step": 8393 }, { "epoch": 0.84, "learning_rate": 1.2970689822736782e-06, "loss": 2.256, "step": 8394 }, { "epoch": 0.84, "learning_rate": 1.2954711121097718e-06, "loss": 2.345, "step": 8395 }, { "epoch": 0.84, "learning_rate": 1.2938741585980386e-06, "loss": 2.2716, "step": 8396 }, { "epoch": 0.84, "learning_rate": 1.2922781219066506e-06, "loss": 2.2746, "step": 8397 }, { "epoch": 0.84, "learning_rate": 1.2906830022036798e-06, "loss": 2.1342, "step": 8398 }, { "epoch": 0.84, "learning_rate": 1.2890887996571066e-06, "loss": 2.3268, "step": 8399 }, { "epoch": 0.84, "learning_rate": 1.2874955144348112e-06, "loss": 2.2227, "step": 8400 }, { "epoch": 0.84, "learning_rate": 1.285903146704579e-06, "loss": 2.2937, "step": 8401 }, { "epoch": 0.84, "learning_rate": 1.2843116966340963e-06, "loss": 2.1911, "step": 8402 }, { "epoch": 0.84, "learning_rate": 1.2827211643909588e-06, "loss": 2.2196, "step": 8403 }, { "epoch": 0.84, "learning_rate": 1.2811315501426592e-06, "loss": 2.3532, "step": 8404 }, { "epoch": 0.84, "learning_rate": 1.2795428540565958e-06, "loss": 2.33, "step": 8405 }, { "epoch": 0.84, "learning_rate": 1.2779550763000703e-06, "loss": 2.2752, "step": 8406 }, { "epoch": 0.84, "learning_rate": 1.276368217040288e-06, "loss": 2.2972, "step": 8407 }, { "epoch": 0.84, "learning_rate": 1.2747822764443562e-06, "loss": 2.2441, "step": 8408 }, { "epoch": 0.84, "learning_rate": 1.2731972546792871e-06, "loss": 2.3182, "step": 8409 }, { "epoch": 0.84, "learning_rate": 1.2716131519119957e-06, "loss": 2.3674, "step": 8410 }, { "epoch": 0.84, "learning_rate": 1.2700299683092987e-06, "loss": 2.3063, "step": 8411 }, { "epoch": 0.84, "learning_rate": 1.2684477040379173e-06, "loss": 2.2949, "step": 8412 }, { "epoch": 0.84, "learning_rate": 1.266866359264477e-06, "loss": 2.3161, "step": 8413 }, { "epoch": 0.84, "learning_rate": 1.2652859341555047e-06, "loss": 2.3753, "step": 8414 }, { "epoch": 0.84, "learning_rate": 1.2637064288774303e-06, "loss": 2.315, "step": 8415 }, { "epoch": 0.84, "learning_rate": 1.2621278435965889e-06, "loss": 2.3474, "step": 8416 }, { "epoch": 0.84, "learning_rate": 1.2605501784792163e-06, "loss": 2.2978, "step": 8417 }, { "epoch": 0.84, "learning_rate": 1.2589734336914527e-06, "loss": 2.2958, "step": 8418 }, { "epoch": 0.84, "learning_rate": 1.2573976093993412e-06, "loss": 2.3396, "step": 8419 }, { "epoch": 0.84, "learning_rate": 1.2558227057688255e-06, "loss": 2.3087, "step": 8420 }, { "epoch": 0.84, "learning_rate": 1.2542487229657596e-06, "loss": 2.2701, "step": 8421 }, { "epoch": 0.84, "learning_rate": 1.2526756611558932e-06, "loss": 2.1836, "step": 8422 }, { "epoch": 0.84, "learning_rate": 1.2511035205048827e-06, "loss": 2.2991, "step": 8423 }, { "epoch": 0.84, "learning_rate": 1.2495323011782846e-06, "loss": 2.2112, "step": 8424 }, { "epoch": 0.84, "learning_rate": 1.2479620033415596e-06, "loss": 2.327, "step": 8425 }, { "epoch": 0.84, "learning_rate": 1.2463926271600745e-06, "loss": 2.0861, "step": 8426 }, { "epoch": 0.84, "learning_rate": 1.244824172799094e-06, "loss": 2.2635, "step": 8427 }, { "epoch": 0.84, "learning_rate": 1.2432566404237889e-06, "loss": 2.2955, "step": 8428 }, { "epoch": 0.84, "learning_rate": 1.241690030199233e-06, "loss": 2.2086, "step": 8429 }, { "epoch": 0.84, "learning_rate": 1.2401243422904008e-06, "loss": 2.3395, "step": 8430 }, { "epoch": 0.84, "learning_rate": 1.2385595768621705e-06, "loss": 2.3107, "step": 8431 }, { "epoch": 0.84, "learning_rate": 1.2369957340793259e-06, "loss": 2.3157, "step": 8432 }, { "epoch": 0.84, "learning_rate": 1.2354328141065496e-06, "loss": 2.2879, "step": 8433 }, { "epoch": 0.85, "learning_rate": 1.233870817108429e-06, "loss": 2.2485, "step": 8434 }, { "epoch": 0.85, "learning_rate": 1.2323097432494534e-06, "loss": 2.2832, "step": 8435 }, { "epoch": 0.85, "learning_rate": 1.2307495926940184e-06, "loss": 2.2636, "step": 8436 }, { "epoch": 0.85, "learning_rate": 1.2291903656064164e-06, "loss": 2.3491, "step": 8437 }, { "epoch": 0.85, "learning_rate": 1.2276320621508453e-06, "loss": 2.3692, "step": 8438 }, { "epoch": 0.85, "learning_rate": 1.2260746824914105e-06, "loss": 2.2375, "step": 8439 }, { "epoch": 0.85, "learning_rate": 1.2245182267921119e-06, "loss": 2.2878, "step": 8440 }, { "epoch": 0.85, "learning_rate": 1.2229626952168583e-06, "loss": 2.3388, "step": 8441 }, { "epoch": 0.85, "learning_rate": 1.2214080879294565e-06, "loss": 2.3814, "step": 8442 }, { "epoch": 0.85, "learning_rate": 1.21985440509362e-06, "loss": 2.2916, "step": 8443 }, { "epoch": 0.85, "learning_rate": 1.2183016468729624e-06, "loss": 2.3726, "step": 8444 }, { "epoch": 0.85, "learning_rate": 1.2167498134310018e-06, "loss": 2.2039, "step": 8445 }, { "epoch": 0.85, "learning_rate": 1.2151989049311574e-06, "loss": 2.3381, "step": 8446 }, { "epoch": 0.85, "learning_rate": 1.2136489215367487e-06, "loss": 2.1857, "step": 8447 }, { "epoch": 0.85, "learning_rate": 1.2120998634110048e-06, "loss": 2.2776, "step": 8448 }, { "epoch": 0.85, "learning_rate": 1.2105517307170523e-06, "loss": 2.3002, "step": 8449 }, { "epoch": 0.85, "learning_rate": 1.2090045236179205e-06, "loss": 2.3012, "step": 8450 }, { "epoch": 0.85, "learning_rate": 1.2074582422765412e-06, "loss": 2.3641, "step": 8451 }, { "epoch": 0.85, "learning_rate": 1.20591288685575e-06, "loss": 2.2689, "step": 8452 }, { "epoch": 0.85, "learning_rate": 1.204368457518288e-06, "loss": 2.2692, "step": 8453 }, { "epoch": 0.85, "learning_rate": 1.2028249544267878e-06, "loss": 2.1454, "step": 8454 }, { "epoch": 0.85, "learning_rate": 1.2012823777437965e-06, "loss": 2.3217, "step": 8455 }, { "epoch": 0.85, "learning_rate": 1.1997407276317563e-06, "loss": 2.2961, "step": 8456 }, { "epoch": 0.85, "learning_rate": 1.1982000042530183e-06, "loss": 2.2922, "step": 8457 }, { "epoch": 0.85, "learning_rate": 1.1966602077698298e-06, "loss": 2.3096, "step": 8458 }, { "epoch": 0.85, "learning_rate": 1.1951213383443438e-06, "loss": 2.303, "step": 8459 }, { "epoch": 0.85, "learning_rate": 1.1935833961386144e-06, "loss": 2.2606, "step": 8460 }, { "epoch": 0.85, "learning_rate": 1.1920463813145988e-06, "loss": 2.195, "step": 8461 }, { "epoch": 0.85, "learning_rate": 1.1905102940341561e-06, "loss": 2.3461, "step": 8462 }, { "epoch": 0.85, "learning_rate": 1.1889751344590472e-06, "loss": 2.2266, "step": 8463 }, { "epoch": 0.85, "learning_rate": 1.187440902750936e-06, "loss": 2.3542, "step": 8464 }, { "epoch": 0.85, "learning_rate": 1.1859075990713876e-06, "loss": 2.2862, "step": 8465 }, { "epoch": 0.85, "learning_rate": 1.184375223581873e-06, "loss": 2.2365, "step": 8466 }, { "epoch": 0.85, "learning_rate": 1.1828437764437628e-06, "loss": 2.3274, "step": 8467 }, { "epoch": 0.85, "learning_rate": 1.1813132578183274e-06, "loss": 2.3397, "step": 8468 }, { "epoch": 0.85, "learning_rate": 1.1797836678667428e-06, "loss": 2.365, "step": 8469 }, { "epoch": 0.85, "learning_rate": 1.1782550067500875e-06, "loss": 2.2805, "step": 8470 }, { "epoch": 0.85, "learning_rate": 1.1767272746293401e-06, "loss": 2.2763, "step": 8471 }, { "epoch": 0.85, "learning_rate": 1.175200471665382e-06, "loss": 2.2772, "step": 8472 }, { "epoch": 0.85, "learning_rate": 1.1736745980189967e-06, "loss": 2.2075, "step": 8473 }, { "epoch": 0.85, "learning_rate": 1.1721496538508715e-06, "loss": 2.3324, "step": 8474 }, { "epoch": 0.85, "learning_rate": 1.1706256393215932e-06, "loss": 2.3359, "step": 8475 }, { "epoch": 0.85, "learning_rate": 1.1691025545916511e-06, "loss": 2.3134, "step": 8476 }, { "epoch": 0.85, "learning_rate": 1.1675803998214407e-06, "loss": 2.2588, "step": 8477 }, { "epoch": 0.85, "learning_rate": 1.1660591751712535e-06, "loss": 2.3565, "step": 8478 }, { "epoch": 0.85, "learning_rate": 1.164538880801287e-06, "loss": 2.2694, "step": 8479 }, { "epoch": 0.85, "learning_rate": 1.1630195168716384e-06, "loss": 2.3539, "step": 8480 }, { "epoch": 0.85, "learning_rate": 1.1615010835423101e-06, "loss": 2.3195, "step": 8481 }, { "epoch": 0.85, "learning_rate": 1.159983580973203e-06, "loss": 2.2828, "step": 8482 }, { "epoch": 0.85, "learning_rate": 1.1584670093241202e-06, "loss": 2.3806, "step": 8483 }, { "epoch": 0.85, "learning_rate": 1.1569513687547706e-06, "loss": 2.2833, "step": 8484 }, { "epoch": 0.85, "learning_rate": 1.1554366594247623e-06, "loss": 2.1701, "step": 8485 }, { "epoch": 0.85, "learning_rate": 1.1539228814936055e-06, "loss": 2.2484, "step": 8486 }, { "epoch": 0.85, "learning_rate": 1.1524100351207124e-06, "loss": 2.3241, "step": 8487 }, { "epoch": 0.85, "learning_rate": 1.1508981204653957e-06, "loss": 2.4555, "step": 8488 }, { "epoch": 0.85, "learning_rate": 1.1493871376868715e-06, "loss": 2.3496, "step": 8489 }, { "epoch": 0.85, "learning_rate": 1.147877086944259e-06, "loss": 2.3299, "step": 8490 }, { "epoch": 0.85, "learning_rate": 1.1463679683965768e-06, "loss": 2.1915, "step": 8491 }, { "epoch": 0.85, "learning_rate": 1.1448597822027452e-06, "loss": 2.2591, "step": 8492 }, { "epoch": 0.85, "learning_rate": 1.143352528521593e-06, "loss": 2.1743, "step": 8493 }, { "epoch": 0.85, "learning_rate": 1.1418462075118398e-06, "loss": 2.2304, "step": 8494 }, { "epoch": 0.85, "learning_rate": 1.140340819332113e-06, "loss": 2.2844, "step": 8495 }, { "epoch": 0.85, "learning_rate": 1.1388363641409429e-06, "loss": 2.2859, "step": 8496 }, { "epoch": 0.85, "learning_rate": 1.137332842096759e-06, "loss": 2.2417, "step": 8497 }, { "epoch": 0.85, "learning_rate": 1.1358302533578947e-06, "loss": 2.3018, "step": 8498 }, { "epoch": 0.85, "learning_rate": 1.1343285980825824e-06, "loss": 2.1733, "step": 8499 }, { "epoch": 0.85, "learning_rate": 1.132827876428958e-06, "loss": 2.247, "step": 8500 }, { "epoch": 0.85, "learning_rate": 1.131328088555057e-06, "loss": 2.1983, "step": 8501 }, { "epoch": 0.85, "learning_rate": 1.1298292346188223e-06, "loss": 2.3119, "step": 8502 }, { "epoch": 0.85, "learning_rate": 1.1283313147780927e-06, "loss": 2.291, "step": 8503 }, { "epoch": 0.85, "learning_rate": 1.1268343291906102e-06, "loss": 2.284, "step": 8504 }, { "epoch": 0.85, "learning_rate": 1.1253382780140188e-06, "loss": 2.336, "step": 8505 }, { "epoch": 0.85, "learning_rate": 1.1238431614058632e-06, "loss": 2.3069, "step": 8506 }, { "epoch": 0.85, "learning_rate": 1.1223489795235908e-06, "loss": 2.2353, "step": 8507 }, { "epoch": 0.85, "learning_rate": 1.1208557325245496e-06, "loss": 2.2973, "step": 8508 }, { "epoch": 0.85, "learning_rate": 1.119363420565991e-06, "loss": 2.4387, "step": 8509 }, { "epoch": 0.85, "learning_rate": 1.1178720438050638e-06, "loss": 2.3462, "step": 8510 }, { "epoch": 0.85, "learning_rate": 1.116381602398826e-06, "loss": 2.2518, "step": 8511 }, { "epoch": 0.85, "learning_rate": 1.1148920965042288e-06, "loss": 2.2969, "step": 8512 }, { "epoch": 0.85, "learning_rate": 1.1134035262781295e-06, "loss": 2.3376, "step": 8513 }, { "epoch": 0.85, "learning_rate": 1.1119158918772854e-06, "loss": 2.304, "step": 8514 }, { "epoch": 0.85, "learning_rate": 1.1104291934583555e-06, "loss": 2.3513, "step": 8515 }, { "epoch": 0.85, "learning_rate": 1.1089434311778991e-06, "loss": 2.2279, "step": 8516 }, { "epoch": 0.85, "learning_rate": 1.107458605192383e-06, "loss": 2.1522, "step": 8517 }, { "epoch": 0.85, "learning_rate": 1.1059747156581636e-06, "loss": 2.244, "step": 8518 }, { "epoch": 0.85, "learning_rate": 1.1044917627315078e-06, "loss": 2.2938, "step": 8519 }, { "epoch": 0.85, "learning_rate": 1.103009746568583e-06, "loss": 2.3391, "step": 8520 }, { "epoch": 0.85, "learning_rate": 1.1015286673254577e-06, "loss": 2.361, "step": 8521 }, { "epoch": 0.85, "learning_rate": 1.1000485251580995e-06, "loss": 2.2967, "step": 8522 }, { "epoch": 0.85, "learning_rate": 1.098569320222377e-06, "loss": 2.2448, "step": 8523 }, { "epoch": 0.85, "learning_rate": 1.097091052674063e-06, "loss": 2.2282, "step": 8524 }, { "epoch": 0.85, "learning_rate": 1.09561372266883e-06, "loss": 2.1615, "step": 8525 }, { "epoch": 0.85, "learning_rate": 1.0941373303622526e-06, "loss": 2.4171, "step": 8526 }, { "epoch": 0.85, "learning_rate": 1.092661875909805e-06, "loss": 2.2935, "step": 8527 }, { "epoch": 0.85, "learning_rate": 1.0911873594668609e-06, "loss": 2.2867, "step": 8528 }, { "epoch": 0.85, "learning_rate": 1.0897137811887037e-06, "loss": 2.215, "step": 8529 }, { "epoch": 0.85, "learning_rate": 1.0882411412305093e-06, "loss": 2.3158, "step": 8530 }, { "epoch": 0.85, "learning_rate": 1.0867694397473583e-06, "loss": 2.3573, "step": 8531 }, { "epoch": 0.85, "learning_rate": 1.0852986768942308e-06, "loss": 2.3039, "step": 8532 }, { "epoch": 0.85, "learning_rate": 1.08382885282601e-06, "loss": 2.3742, "step": 8533 }, { "epoch": 0.86, "learning_rate": 1.0823599676974795e-06, "loss": 2.3034, "step": 8534 }, { "epoch": 0.86, "learning_rate": 1.0808920216633234e-06, "loss": 2.2695, "step": 8535 }, { "epoch": 0.86, "learning_rate": 1.0794250148781283e-06, "loss": 2.2765, "step": 8536 }, { "epoch": 0.86, "learning_rate": 1.0779589474963792e-06, "loss": 2.3735, "step": 8537 }, { "epoch": 0.86, "learning_rate": 1.0764938196724661e-06, "loss": 2.304, "step": 8538 }, { "epoch": 0.86, "learning_rate": 1.0750296315606768e-06, "loss": 2.2983, "step": 8539 }, { "epoch": 0.86, "learning_rate": 1.073566383315202e-06, "loss": 2.2837, "step": 8540 }, { "epoch": 0.86, "learning_rate": 1.0721040750901312e-06, "loss": 2.263, "step": 8541 }, { "epoch": 0.86, "learning_rate": 1.0706427070394588e-06, "loss": 2.3154, "step": 8542 }, { "epoch": 0.86, "learning_rate": 1.0691822793170748e-06, "loss": 2.2521, "step": 8543 }, { "epoch": 0.86, "learning_rate": 1.0677227920767764e-06, "loss": 2.2244, "step": 8544 }, { "epoch": 0.86, "learning_rate": 1.0662642454722538e-06, "loss": 2.3367, "step": 8545 }, { "epoch": 0.86, "learning_rate": 1.0648066396571089e-06, "loss": 2.205, "step": 8546 }, { "epoch": 0.86, "learning_rate": 1.0633499747848352e-06, "loss": 2.2675, "step": 8547 }, { "epoch": 0.86, "learning_rate": 1.0618942510088315e-06, "loss": 2.2437, "step": 8548 }, { "epoch": 0.86, "learning_rate": 1.060439468482396e-06, "loss": 2.2073, "step": 8549 }, { "epoch": 0.86, "learning_rate": 1.0589856273587284e-06, "loss": 2.3129, "step": 8550 }, { "epoch": 0.86, "learning_rate": 1.0575327277909275e-06, "loss": 2.2085, "step": 8551 }, { "epoch": 0.86, "learning_rate": 1.0560807699319964e-06, "loss": 2.4012, "step": 8552 }, { "epoch": 0.86, "learning_rate": 1.054629753934837e-06, "loss": 2.3109, "step": 8553 }, { "epoch": 0.86, "learning_rate": 1.0531796799522497e-06, "loss": 2.3507, "step": 8554 }, { "epoch": 0.86, "learning_rate": 1.0517305481369422e-06, "loss": 2.2012, "step": 8555 }, { "epoch": 0.86, "learning_rate": 1.0502823586415168e-06, "loss": 2.3294, "step": 8556 }, { "epoch": 0.86, "learning_rate": 1.0488351116184802e-06, "loss": 2.2388, "step": 8557 }, { "epoch": 0.86, "learning_rate": 1.0473888072202354e-06, "loss": 2.2812, "step": 8558 }, { "epoch": 0.86, "learning_rate": 1.0459434455990913e-06, "loss": 2.2761, "step": 8559 }, { "epoch": 0.86, "learning_rate": 1.0444990269072542e-06, "loss": 2.2706, "step": 8560 }, { "epoch": 0.86, "learning_rate": 1.0430555512968332e-06, "loss": 2.3216, "step": 8561 }, { "epoch": 0.86, "learning_rate": 1.041613018919836e-06, "loss": 2.3543, "step": 8562 }, { "epoch": 0.86, "learning_rate": 1.0401714299281717e-06, "loss": 2.2816, "step": 8563 }, { "epoch": 0.86, "learning_rate": 1.0387307844736527e-06, "loss": 2.2141, "step": 8564 }, { "epoch": 0.86, "learning_rate": 1.0372910827079885e-06, "loss": 2.2906, "step": 8565 }, { "epoch": 0.86, "learning_rate": 1.0358523247827912e-06, "loss": 2.3107, "step": 8566 }, { "epoch": 0.86, "learning_rate": 1.0344145108495718e-06, "loss": 2.2402, "step": 8567 }, { "epoch": 0.86, "learning_rate": 1.0329776410597425e-06, "loss": 2.2974, "step": 8568 }, { "epoch": 0.86, "learning_rate": 1.031541715564618e-06, "loss": 2.3383, "step": 8569 }, { "epoch": 0.86, "learning_rate": 1.0301067345154115e-06, "loss": 2.3476, "step": 8570 }, { "epoch": 0.86, "learning_rate": 1.0286726980632366e-06, "loss": 2.2676, "step": 8571 }, { "epoch": 0.86, "learning_rate": 1.0272396063591062e-06, "loss": 2.2128, "step": 8572 }, { "epoch": 0.86, "learning_rate": 1.0258074595539403e-06, "loss": 2.3255, "step": 8573 }, { "epoch": 0.86, "learning_rate": 1.0243762577985516e-06, "loss": 2.2802, "step": 8574 }, { "epoch": 0.86, "learning_rate": 1.0229460012436576e-06, "loss": 2.257, "step": 8575 }, { "epoch": 0.86, "learning_rate": 1.0215166900398754e-06, "loss": 2.3059, "step": 8576 }, { "epoch": 0.86, "learning_rate": 1.0200883243377203e-06, "loss": 2.2467, "step": 8577 }, { "epoch": 0.86, "learning_rate": 1.0186609042876106e-06, "loss": 2.3723, "step": 8578 }, { "epoch": 0.86, "learning_rate": 1.0172344300398651e-06, "loss": 2.3186, "step": 8579 }, { "epoch": 0.86, "learning_rate": 1.0158089017447015e-06, "loss": 2.3059, "step": 8580 }, { "epoch": 0.86, "learning_rate": 1.0143843195522396e-06, "loss": 2.3995, "step": 8581 }, { "epoch": 0.86, "learning_rate": 1.0129606836124972e-06, "loss": 2.3314, "step": 8582 }, { "epoch": 0.86, "learning_rate": 1.0115379940753956e-06, "loss": 2.3928, "step": 8583 }, { "epoch": 0.86, "learning_rate": 1.0101162510907524e-06, "loss": 2.3872, "step": 8584 }, { "epoch": 0.86, "learning_rate": 1.0086954548082894e-06, "loss": 2.2962, "step": 8585 }, { "epoch": 0.86, "learning_rate": 1.0072756053776268e-06, "loss": 2.3394, "step": 8586 }, { "epoch": 0.86, "learning_rate": 1.0058567029482845e-06, "loss": 2.4099, "step": 8587 }, { "epoch": 0.86, "learning_rate": 1.004438747669686e-06, "loss": 2.3109, "step": 8588 }, { "epoch": 0.86, "learning_rate": 1.00302173969115e-06, "loss": 2.2668, "step": 8589 }, { "epoch": 0.86, "learning_rate": 1.0016056791618977e-06, "loss": 2.3528, "step": 8590 }, { "epoch": 0.86, "learning_rate": 1.0001905662310529e-06, "loss": 2.2537, "step": 8591 }, { "epoch": 0.86, "learning_rate": 9.987764010476385e-07, "loss": 2.2227, "step": 8592 }, { "epoch": 0.86, "learning_rate": 9.973631837605745e-07, "loss": 2.2677, "step": 8593 }, { "epoch": 0.86, "learning_rate": 9.959509145186841e-07, "loss": 2.352, "step": 8594 }, { "epoch": 0.86, "learning_rate": 9.945395934706891e-07, "loss": 2.2781, "step": 8595 }, { "epoch": 0.86, "learning_rate": 9.931292207652131e-07, "loss": 2.2899, "step": 8596 }, { "epoch": 0.86, "learning_rate": 9.917197965507796e-07, "loss": 2.3065, "step": 8597 }, { "epoch": 0.86, "learning_rate": 9.903113209758098e-07, "loss": 2.373, "step": 8598 }, { "epoch": 0.86, "learning_rate": 9.88903794188627e-07, "loss": 2.3567, "step": 8599 }, { "epoch": 0.86, "learning_rate": 9.874972163374553e-07, "loss": 2.1558, "step": 8600 }, { "epoch": 0.86, "learning_rate": 9.860915875704168e-07, "loss": 2.3002, "step": 8601 }, { "epoch": 0.86, "learning_rate": 9.846869080355358e-07, "loss": 2.2376, "step": 8602 }, { "epoch": 0.86, "learning_rate": 9.832831778807362e-07, "loss": 2.2644, "step": 8603 }, { "epoch": 0.86, "learning_rate": 9.818803972538382e-07, "loss": 2.3175, "step": 8604 }, { "epoch": 0.86, "learning_rate": 9.804785663025684e-07, "loss": 2.135, "step": 8605 }, { "epoch": 0.86, "learning_rate": 9.790776851745486e-07, "loss": 2.2165, "step": 8606 }, { "epoch": 0.86, "learning_rate": 9.776777540173031e-07, "loss": 2.3271, "step": 8607 }, { "epoch": 0.86, "learning_rate": 9.762787729782518e-07, "loss": 2.3577, "step": 8608 }, { "epoch": 0.86, "learning_rate": 9.748807422047224e-07, "loss": 2.1849, "step": 8609 }, { "epoch": 0.86, "learning_rate": 9.73483661843937e-07, "loss": 2.2867, "step": 8610 }, { "epoch": 0.86, "learning_rate": 9.720875320430168e-07, "loss": 2.2743, "step": 8611 }, { "epoch": 0.86, "learning_rate": 9.706923529489864e-07, "loss": 2.3287, "step": 8612 }, { "epoch": 0.86, "learning_rate": 9.692981247087675e-07, "loss": 2.3449, "step": 8613 }, { "epoch": 0.86, "learning_rate": 9.679048474691832e-07, "loss": 2.2892, "step": 8614 }, { "epoch": 0.86, "learning_rate": 9.665125213769565e-07, "loss": 2.3152, "step": 8615 }, { "epoch": 0.86, "learning_rate": 9.651211465787091e-07, "loss": 2.3429, "step": 8616 }, { "epoch": 0.86, "learning_rate": 9.637307232209625e-07, "loss": 2.2438, "step": 8617 }, { "epoch": 0.86, "learning_rate": 9.623412514501407e-07, "loss": 2.2362, "step": 8618 }, { "epoch": 0.86, "learning_rate": 9.609527314125645e-07, "loss": 2.3149, "step": 8619 }, { "epoch": 0.86, "learning_rate": 9.595651632544545e-07, "loss": 2.2704, "step": 8620 }, { "epoch": 0.86, "learning_rate": 9.581785471219363e-07, "loss": 2.3318, "step": 8621 }, { "epoch": 0.86, "learning_rate": 9.567928831610252e-07, "loss": 2.3022, "step": 8622 }, { "epoch": 0.86, "learning_rate": 9.554081715176444e-07, "loss": 2.3442, "step": 8623 }, { "epoch": 0.86, "learning_rate": 9.540244123376152e-07, "loss": 2.2771, "step": 8624 }, { "epoch": 0.86, "learning_rate": 9.526416057666565e-07, "loss": 2.3456, "step": 8625 }, { "epoch": 0.86, "learning_rate": 9.512597519503863e-07, "loss": 2.3719, "step": 8626 }, { "epoch": 0.86, "learning_rate": 9.498788510343293e-07, "loss": 2.2085, "step": 8627 }, { "epoch": 0.86, "learning_rate": 9.484989031639025e-07, "loss": 2.3644, "step": 8628 }, { "epoch": 0.86, "learning_rate": 9.471199084844241e-07, "loss": 2.2764, "step": 8629 }, { "epoch": 0.86, "learning_rate": 9.457418671411122e-07, "loss": 2.3672, "step": 8630 }, { "epoch": 0.86, "learning_rate": 9.443647792790855e-07, "loss": 2.228, "step": 8631 }, { "epoch": 0.86, "learning_rate": 9.429886450433623e-07, "loss": 2.3478, "step": 8632 }, { "epoch": 0.86, "learning_rate": 9.416134645788599e-07, "loss": 2.2427, "step": 8633 }, { "epoch": 0.87, "learning_rate": 9.402392380303937e-07, "loss": 2.174, "step": 8634 }, { "epoch": 0.87, "learning_rate": 9.388659655426791e-07, "loss": 2.2399, "step": 8635 }, { "epoch": 0.87, "learning_rate": 9.374936472603347e-07, "loss": 2.2848, "step": 8636 }, { "epoch": 0.87, "learning_rate": 9.36122283327876e-07, "loss": 2.2678, "step": 8637 }, { "epoch": 0.87, "learning_rate": 9.347518738897166e-07, "loss": 2.2986, "step": 8638 }, { "epoch": 0.87, "learning_rate": 9.33382419090172e-07, "loss": 2.2562, "step": 8639 }, { "epoch": 0.87, "learning_rate": 9.320139190734534e-07, "loss": 2.243, "step": 8640 }, { "epoch": 0.87, "learning_rate": 9.306463739836768e-07, "loss": 2.2613, "step": 8641 }, { "epoch": 0.87, "learning_rate": 9.292797839648549e-07, "loss": 2.3389, "step": 8642 }, { "epoch": 0.87, "learning_rate": 9.279141491608978e-07, "loss": 2.2636, "step": 8643 }, { "epoch": 0.87, "learning_rate": 9.265494697156186e-07, "loss": 2.2907, "step": 8644 }, { "epoch": 0.87, "learning_rate": 9.251857457727287e-07, "loss": 2.2791, "step": 8645 }, { "epoch": 0.87, "learning_rate": 9.238229774758367e-07, "loss": 2.2319, "step": 8646 }, { "epoch": 0.87, "learning_rate": 9.224611649684545e-07, "loss": 2.3583, "step": 8647 }, { "epoch": 0.87, "learning_rate": 9.211003083939896e-07, "loss": 2.2421, "step": 8648 }, { "epoch": 0.87, "learning_rate": 9.197404078957506e-07, "loss": 2.2503, "step": 8649 }, { "epoch": 0.87, "learning_rate": 9.183814636169464e-07, "loss": 2.2592, "step": 8650 }, { "epoch": 0.87, "learning_rate": 9.170234757006824e-07, "loss": 2.283, "step": 8651 }, { "epoch": 0.87, "learning_rate": 9.156664442899654e-07, "loss": 2.2532, "step": 8652 }, { "epoch": 0.87, "learning_rate": 9.143103695277e-07, "loss": 2.2788, "step": 8653 }, { "epoch": 0.87, "learning_rate": 9.129552515566931e-07, "loss": 2.3073, "step": 8654 }, { "epoch": 0.87, "learning_rate": 9.116010905196493e-07, "loss": 2.2381, "step": 8655 }, { "epoch": 0.87, "learning_rate": 9.102478865591691e-07, "loss": 2.2775, "step": 8656 }, { "epoch": 0.87, "learning_rate": 9.088956398177573e-07, "loss": 2.3173, "step": 8657 }, { "epoch": 0.87, "learning_rate": 9.075443504378156e-07, "loss": 2.307, "step": 8658 }, { "epoch": 0.87, "learning_rate": 9.061940185616425e-07, "loss": 2.3633, "step": 8659 }, { "epoch": 0.87, "learning_rate": 9.048446443314407e-07, "loss": 2.2904, "step": 8660 }, { "epoch": 0.87, "learning_rate": 9.034962278893078e-07, "loss": 2.2241, "step": 8661 }, { "epoch": 0.87, "learning_rate": 9.021487693772435e-07, "loss": 2.307, "step": 8662 }, { "epoch": 0.87, "learning_rate": 9.008022689371443e-07, "loss": 2.3589, "step": 8663 }, { "epoch": 0.87, "learning_rate": 8.994567267108067e-07, "loss": 2.3466, "step": 8664 }, { "epoch": 0.87, "learning_rate": 8.981121428399275e-07, "loss": 2.3249, "step": 8665 }, { "epoch": 0.87, "learning_rate": 8.967685174661001e-07, "loss": 2.2385, "step": 8666 }, { "epoch": 0.87, "learning_rate": 8.954258507308189e-07, "loss": 2.267, "step": 8667 }, { "epoch": 0.87, "learning_rate": 8.940841427754765e-07, "loss": 2.2809, "step": 8668 }, { "epoch": 0.87, "learning_rate": 8.927433937413654e-07, "loss": 2.299, "step": 8669 }, { "epoch": 0.87, "learning_rate": 8.914036037696771e-07, "loss": 2.3346, "step": 8670 }, { "epoch": 0.87, "learning_rate": 8.900647730014977e-07, "loss": 2.2781, "step": 8671 }, { "epoch": 0.87, "learning_rate": 8.88726901577821e-07, "loss": 2.3623, "step": 8672 }, { "epoch": 0.87, "learning_rate": 8.873899896395332e-07, "loss": 2.3282, "step": 8673 }, { "epoch": 0.87, "learning_rate": 8.860540373274218e-07, "loss": 2.3526, "step": 8674 }, { "epoch": 0.87, "learning_rate": 8.847190447821708e-07, "loss": 2.2319, "step": 8675 }, { "epoch": 0.87, "learning_rate": 8.833850121443665e-07, "loss": 2.2876, "step": 8676 }, { "epoch": 0.87, "learning_rate": 8.820519395544913e-07, "loss": 2.3422, "step": 8677 }, { "epoch": 0.87, "learning_rate": 8.807198271529282e-07, "loss": 2.2607, "step": 8678 }, { "epoch": 0.87, "learning_rate": 8.793886750799596e-07, "loss": 2.4491, "step": 8679 }, { "epoch": 0.87, "learning_rate": 8.780584834757632e-07, "loss": 2.3832, "step": 8680 }, { "epoch": 0.87, "learning_rate": 8.767292524804217e-07, "loss": 2.3025, "step": 8681 }, { "epoch": 0.87, "learning_rate": 8.754009822339105e-07, "loss": 2.3013, "step": 8682 }, { "epoch": 0.87, "learning_rate": 8.740736728761079e-07, "loss": 2.2174, "step": 8683 }, { "epoch": 0.87, "learning_rate": 8.727473245467887e-07, "loss": 2.1636, "step": 8684 }, { "epoch": 0.87, "learning_rate": 8.714219373856292e-07, "loss": 2.3095, "step": 8685 }, { "epoch": 0.87, "learning_rate": 8.700975115321985e-07, "loss": 2.3286, "step": 8686 }, { "epoch": 0.87, "learning_rate": 8.68774047125972e-07, "loss": 2.3148, "step": 8687 }, { "epoch": 0.87, "learning_rate": 8.674515443063191e-07, "loss": 2.305, "step": 8688 }, { "epoch": 0.87, "learning_rate": 8.661300032125075e-07, "loss": 2.3514, "step": 8689 }, { "epoch": 0.87, "learning_rate": 8.648094239837101e-07, "loss": 2.2767, "step": 8690 }, { "epoch": 0.87, "learning_rate": 8.634898067589903e-07, "loss": 2.2052, "step": 8691 }, { "epoch": 0.87, "learning_rate": 8.621711516773146e-07, "loss": 2.1877, "step": 8692 }, { "epoch": 0.87, "learning_rate": 8.608534588775474e-07, "loss": 2.2916, "step": 8693 }, { "epoch": 0.87, "learning_rate": 8.595367284984523e-07, "loss": 2.2383, "step": 8694 }, { "epoch": 0.87, "learning_rate": 8.582209606786884e-07, "loss": 2.2948, "step": 8695 }, { "epoch": 0.87, "learning_rate": 8.569061555568192e-07, "loss": 2.2638, "step": 8696 }, { "epoch": 0.87, "learning_rate": 8.555923132713007e-07, "loss": 2.2772, "step": 8697 }, { "epoch": 0.87, "learning_rate": 8.542794339604899e-07, "loss": 2.3706, "step": 8698 }, { "epoch": 0.87, "learning_rate": 8.529675177626473e-07, "loss": 2.2083, "step": 8699 }, { "epoch": 0.87, "learning_rate": 8.516565648159237e-07, "loss": 2.2913, "step": 8700 }, { "epoch": 0.87, "learning_rate": 8.50346575258374e-07, "loss": 2.3187, "step": 8701 }, { "epoch": 0.87, "learning_rate": 8.490375492279479e-07, "loss": 2.2635, "step": 8702 }, { "epoch": 0.87, "learning_rate": 8.477294868624986e-07, "loss": 2.3922, "step": 8703 }, { "epoch": 0.87, "learning_rate": 8.464223882997724e-07, "loss": 2.2474, "step": 8704 }, { "epoch": 0.87, "learning_rate": 8.451162536774171e-07, "loss": 2.2989, "step": 8705 }, { "epoch": 0.87, "learning_rate": 8.438110831329793e-07, "loss": 2.3501, "step": 8706 }, { "epoch": 0.87, "learning_rate": 8.425068768039024e-07, "loss": 2.281, "step": 8707 }, { "epoch": 0.87, "learning_rate": 8.412036348275298e-07, "loss": 2.3294, "step": 8708 }, { "epoch": 0.87, "learning_rate": 8.399013573411019e-07, "loss": 2.3497, "step": 8709 }, { "epoch": 0.87, "learning_rate": 8.386000444817588e-07, "loss": 2.3672, "step": 8710 }, { "epoch": 0.87, "learning_rate": 8.372996963865387e-07, "loss": 2.3437, "step": 8711 }, { "epoch": 0.87, "learning_rate": 8.360003131923766e-07, "loss": 2.2954, "step": 8712 }, { "epoch": 0.87, "learning_rate": 8.347018950361097e-07, "loss": 2.3015, "step": 8713 }, { "epoch": 0.87, "learning_rate": 8.334044420544696e-07, "loss": 2.2317, "step": 8714 }, { "epoch": 0.87, "learning_rate": 8.32107954384086e-07, "loss": 2.2643, "step": 8715 }, { "epoch": 0.87, "learning_rate": 8.30812432161493e-07, "loss": 2.2234, "step": 8716 }, { "epoch": 0.87, "learning_rate": 8.295178755231159e-07, "loss": 2.3443, "step": 8717 }, { "epoch": 0.87, "learning_rate": 8.282242846052824e-07, "loss": 2.2397, "step": 8718 }, { "epoch": 0.87, "learning_rate": 8.269316595442167e-07, "loss": 2.269, "step": 8719 }, { "epoch": 0.87, "learning_rate": 8.256400004760423e-07, "loss": 2.3258, "step": 8720 }, { "epoch": 0.87, "learning_rate": 8.243493075367814e-07, "loss": 2.3264, "step": 8721 }, { "epoch": 0.87, "learning_rate": 8.230595808623521e-07, "loss": 2.3078, "step": 8722 }, { "epoch": 0.87, "learning_rate": 8.217708205885721e-07, "loss": 2.2804, "step": 8723 }, { "epoch": 0.87, "learning_rate": 8.204830268511588e-07, "loss": 2.323, "step": 8724 }, { "epoch": 0.87, "learning_rate": 8.191961997857257e-07, "loss": 2.2685, "step": 8725 }, { "epoch": 0.87, "learning_rate": 8.179103395277854e-07, "loss": 2.2576, "step": 8726 }, { "epoch": 0.87, "learning_rate": 8.166254462127498e-07, "loss": 2.2567, "step": 8727 }, { "epoch": 0.87, "learning_rate": 8.153415199759263e-07, "loss": 2.2496, "step": 8728 }, { "epoch": 0.87, "learning_rate": 8.140585609525232e-07, "loss": 2.3664, "step": 8729 }, { "epoch": 0.87, "learning_rate": 8.127765692776446e-07, "loss": 2.2766, "step": 8730 }, { "epoch": 0.87, "learning_rate": 8.114955450862938e-07, "loss": 2.3171, "step": 8731 }, { "epoch": 0.87, "learning_rate": 8.102154885133729e-07, "loss": 2.2608, "step": 8732 }, { "epoch": 0.87, "learning_rate": 8.089363996936805e-07, "loss": 2.272, "step": 8733 }, { "epoch": 0.88, "learning_rate": 8.076582787619158e-07, "loss": 2.2687, "step": 8734 }, { "epoch": 0.88, "learning_rate": 8.063811258526743e-07, "loss": 2.3062, "step": 8735 }, { "epoch": 0.88, "learning_rate": 8.051049411004485e-07, "loss": 2.2388, "step": 8736 }, { "epoch": 0.88, "learning_rate": 8.03829724639632e-07, "loss": 2.3315, "step": 8737 }, { "epoch": 0.88, "learning_rate": 8.025554766045129e-07, "loss": 2.2671, "step": 8738 }, { "epoch": 0.88, "learning_rate": 8.012821971292806e-07, "loss": 2.2675, "step": 8739 }, { "epoch": 0.88, "learning_rate": 8.000098863480199e-07, "loss": 2.1837, "step": 8740 }, { "epoch": 0.88, "learning_rate": 7.987385443947138e-07, "loss": 2.3083, "step": 8741 }, { "epoch": 0.88, "learning_rate": 7.974681714032451e-07, "loss": 2.2987, "step": 8742 }, { "epoch": 0.88, "learning_rate": 7.961987675073945e-07, "loss": 2.2431, "step": 8743 }, { "epoch": 0.88, "learning_rate": 7.949303328408398e-07, "loss": 2.3432, "step": 8744 }, { "epoch": 0.88, "learning_rate": 7.936628675371549e-07, "loss": 2.3005, "step": 8745 }, { "epoch": 0.88, "learning_rate": 7.923963717298155e-07, "loss": 2.2077, "step": 8746 }, { "epoch": 0.88, "learning_rate": 7.911308455521916e-07, "loss": 2.2157, "step": 8747 }, { "epoch": 0.88, "learning_rate": 7.89866289137553e-07, "loss": 2.3354, "step": 8748 }, { "epoch": 0.88, "learning_rate": 7.88602702619069e-07, "loss": 2.3294, "step": 8749 }, { "epoch": 0.88, "learning_rate": 7.873400861298008e-07, "loss": 2.2927, "step": 8750 }, { "epoch": 0.88, "learning_rate": 7.860784398027122e-07, "loss": 2.3594, "step": 8751 }, { "epoch": 0.88, "learning_rate": 7.848177637706656e-07, "loss": 2.3092, "step": 8752 }, { "epoch": 0.88, "learning_rate": 7.835580581664204e-07, "loss": 2.1865, "step": 8753 }, { "epoch": 0.88, "learning_rate": 7.822993231226306e-07, "loss": 2.2918, "step": 8754 }, { "epoch": 0.88, "learning_rate": 7.810415587718523e-07, "loss": 2.3223, "step": 8755 }, { "epoch": 0.88, "learning_rate": 7.797847652465373e-07, "loss": 2.2673, "step": 8756 }, { "epoch": 0.88, "learning_rate": 7.785289426790343e-07, "loss": 2.3463, "step": 8757 }, { "epoch": 0.88, "learning_rate": 7.772740912015919e-07, "loss": 2.2878, "step": 8758 }, { "epoch": 0.88, "learning_rate": 7.760202109463555e-07, "loss": 2.287, "step": 8759 }, { "epoch": 0.88, "learning_rate": 7.74767302045365e-07, "loss": 2.2311, "step": 8760 }, { "epoch": 0.88, "learning_rate": 7.73515364630566e-07, "loss": 2.295, "step": 8761 }, { "epoch": 0.88, "learning_rate": 7.722643988337942e-07, "loss": 2.3244, "step": 8762 }, { "epoch": 0.88, "learning_rate": 7.710144047867862e-07, "loss": 2.2867, "step": 8763 }, { "epoch": 0.88, "learning_rate": 7.69765382621176e-07, "loss": 2.2818, "step": 8764 }, { "epoch": 0.88, "learning_rate": 7.685173324684947e-07, "loss": 2.2382, "step": 8765 }, { "epoch": 0.88, "learning_rate": 7.672702544601707e-07, "loss": 2.2554, "step": 8766 }, { "epoch": 0.88, "learning_rate": 7.660241487275311e-07, "loss": 2.3773, "step": 8767 }, { "epoch": 0.88, "learning_rate": 7.647790154018008e-07, "loss": 2.249, "step": 8768 }, { "epoch": 0.88, "learning_rate": 7.635348546141008e-07, "loss": 2.3264, "step": 8769 }, { "epoch": 0.88, "learning_rate": 7.622916664954505e-07, "loss": 2.2538, "step": 8770 }, { "epoch": 0.88, "learning_rate": 7.610494511767685e-07, "loss": 2.3399, "step": 8771 }, { "epoch": 0.88, "learning_rate": 7.598082087888669e-07, "loss": 2.2536, "step": 8772 }, { "epoch": 0.88, "learning_rate": 7.585679394624601e-07, "loss": 2.2579, "step": 8773 }, { "epoch": 0.88, "learning_rate": 7.573286433281568e-07, "loss": 2.28, "step": 8774 }, { "epoch": 0.88, "learning_rate": 7.560903205164649e-07, "loss": 2.2919, "step": 8775 }, { "epoch": 0.88, "learning_rate": 7.548529711577868e-07, "loss": 2.3243, "step": 8776 }, { "epoch": 0.88, "learning_rate": 7.536165953824281e-07, "loss": 2.347, "step": 8777 }, { "epoch": 0.88, "learning_rate": 7.523811933205838e-07, "loss": 2.2802, "step": 8778 }, { "epoch": 0.88, "learning_rate": 7.511467651023552e-07, "loss": 2.3327, "step": 8779 }, { "epoch": 0.88, "learning_rate": 7.499133108577361e-07, "loss": 2.3246, "step": 8780 }, { "epoch": 0.88, "learning_rate": 7.486808307166182e-07, "loss": 2.2543, "step": 8781 }, { "epoch": 0.88, "learning_rate": 7.4744932480879e-07, "loss": 2.3057, "step": 8782 }, { "epoch": 0.88, "learning_rate": 7.462187932639387e-07, "loss": 2.2916, "step": 8783 }, { "epoch": 0.88, "learning_rate": 7.449892362116484e-07, "loss": 2.3472, "step": 8784 }, { "epoch": 0.88, "learning_rate": 7.437606537814024e-07, "loss": 2.2582, "step": 8785 }, { "epoch": 0.88, "learning_rate": 7.425330461025771e-07, "loss": 2.3143, "step": 8786 }, { "epoch": 0.88, "learning_rate": 7.413064133044479e-07, "loss": 2.3068, "step": 8787 }, { "epoch": 0.88, "learning_rate": 7.400807555161949e-07, "loss": 2.2356, "step": 8788 }, { "epoch": 0.88, "learning_rate": 7.388560728668814e-07, "loss": 2.3592, "step": 8789 }, { "epoch": 0.88, "learning_rate": 7.3763236548548e-07, "loss": 2.1993, "step": 8790 }, { "epoch": 0.88, "learning_rate": 7.364096335008553e-07, "loss": 2.3762, "step": 8791 }, { "epoch": 0.88, "learning_rate": 7.351878770417686e-07, "loss": 2.2605, "step": 8792 }, { "epoch": 0.88, "learning_rate": 7.339670962368828e-07, "loss": 2.2228, "step": 8793 }, { "epoch": 0.88, "learning_rate": 7.327472912147526e-07, "loss": 2.2042, "step": 8794 }, { "epoch": 0.88, "learning_rate": 7.315284621038355e-07, "loss": 2.2673, "step": 8795 }, { "epoch": 0.88, "learning_rate": 7.303106090324785e-07, "loss": 2.3572, "step": 8796 }, { "epoch": 0.88, "learning_rate": 7.29093732128936e-07, "loss": 2.3762, "step": 8797 }, { "epoch": 0.88, "learning_rate": 7.27877831521352e-07, "loss": 2.3501, "step": 8798 }, { "epoch": 0.88, "learning_rate": 7.266629073377707e-07, "loss": 2.2711, "step": 8799 }, { "epoch": 0.88, "learning_rate": 7.254489597061321e-07, "loss": 2.2374, "step": 8800 }, { "epoch": 0.88, "learning_rate": 7.242359887542738e-07, "loss": 2.3357, "step": 8801 }, { "epoch": 0.88, "learning_rate": 7.230239946099304e-07, "loss": 2.3798, "step": 8802 }, { "epoch": 0.88, "learning_rate": 7.218129774007343e-07, "loss": 2.2839, "step": 8803 }, { "epoch": 0.88, "learning_rate": 7.206029372542155e-07, "loss": 2.2871, "step": 8804 }, { "epoch": 0.88, "learning_rate": 7.193938742977991e-07, "loss": 2.3277, "step": 8805 }, { "epoch": 0.88, "learning_rate": 7.181857886588095e-07, "loss": 2.2847, "step": 8806 }, { "epoch": 0.88, "learning_rate": 7.169786804644663e-07, "loss": 2.2891, "step": 8807 }, { "epoch": 0.88, "learning_rate": 7.157725498418889e-07, "loss": 2.2144, "step": 8808 }, { "epoch": 0.88, "learning_rate": 7.1456739691809e-07, "loss": 2.3355, "step": 8809 }, { "epoch": 0.88, "learning_rate": 7.133632218199815e-07, "loss": 2.273, "step": 8810 }, { "epoch": 0.88, "learning_rate": 7.12160024674372e-07, "loss": 2.1646, "step": 8811 }, { "epoch": 0.88, "learning_rate": 7.109578056079703e-07, "loss": 2.2996, "step": 8812 }, { "epoch": 0.88, "learning_rate": 7.097565647473736e-07, "loss": 2.2395, "step": 8813 }, { "epoch": 0.88, "learning_rate": 7.085563022190833e-07, "loss": 2.2706, "step": 8814 }, { "epoch": 0.88, "learning_rate": 7.073570181494982e-07, "loss": 2.2463, "step": 8815 }, { "epoch": 0.88, "learning_rate": 7.061587126649116e-07, "loss": 2.282, "step": 8816 }, { "epoch": 0.88, "learning_rate": 7.049613858915128e-07, "loss": 2.2725, "step": 8817 }, { "epoch": 0.88, "learning_rate": 7.037650379553895e-07, "loss": 2.2922, "step": 8818 }, { "epoch": 0.88, "learning_rate": 7.025696689825256e-07, "loss": 2.2865, "step": 8819 }, { "epoch": 0.88, "learning_rate": 7.013752790988037e-07, "loss": 2.2567, "step": 8820 }, { "epoch": 0.88, "learning_rate": 7.001818684300022e-07, "loss": 2.2199, "step": 8821 }, { "epoch": 0.88, "learning_rate": 6.989894371017946e-07, "loss": 2.3358, "step": 8822 }, { "epoch": 0.88, "learning_rate": 6.97797985239752e-07, "loss": 2.2716, "step": 8823 }, { "epoch": 0.88, "learning_rate": 6.966075129693462e-07, "loss": 2.383, "step": 8824 }, { "epoch": 0.88, "learning_rate": 6.954180204159422e-07, "loss": 2.1646, "step": 8825 }, { "epoch": 0.88, "learning_rate": 6.942295077048011e-07, "loss": 2.2804, "step": 8826 }, { "epoch": 0.88, "learning_rate": 6.930419749610839e-07, "loss": 2.4046, "step": 8827 }, { "epoch": 0.88, "learning_rate": 6.91855422309845e-07, "loss": 2.3406, "step": 8828 }, { "epoch": 0.88, "learning_rate": 6.906698498760389e-07, "loss": 2.2789, "step": 8829 }, { "epoch": 0.88, "learning_rate": 6.894852577845135e-07, "loss": 2.2734, "step": 8830 }, { "epoch": 0.88, "learning_rate": 6.883016461600167e-07, "loss": 2.2459, "step": 8831 }, { "epoch": 0.88, "learning_rate": 6.871190151271911e-07, "loss": 2.3435, "step": 8832 }, { "epoch": 0.88, "learning_rate": 6.85937364810576e-07, "loss": 2.286, "step": 8833 }, { "epoch": 0.89, "learning_rate": 6.847566953346096e-07, "loss": 2.2434, "step": 8834 }, { "epoch": 0.89, "learning_rate": 6.835770068236236e-07, "loss": 2.2416, "step": 8835 }, { "epoch": 0.89, "learning_rate": 6.823982994018485e-07, "loss": 2.3131, "step": 8836 }, { "epoch": 0.89, "learning_rate": 6.812205731934118e-07, "loss": 2.2558, "step": 8837 }, { "epoch": 0.89, "learning_rate": 6.800438283223365e-07, "loss": 2.3302, "step": 8838 }, { "epoch": 0.89, "learning_rate": 6.788680649125434e-07, "loss": 2.218, "step": 8839 }, { "epoch": 0.89, "learning_rate": 6.776932830878469e-07, "loss": 2.2883, "step": 8840 }, { "epoch": 0.89, "learning_rate": 6.765194829719613e-07, "loss": 2.1906, "step": 8841 }, { "epoch": 0.89, "learning_rate": 6.753466646884976e-07, "loss": 2.2361, "step": 8842 }, { "epoch": 0.89, "learning_rate": 6.741748283609628e-07, "loss": 2.2857, "step": 8843 }, { "epoch": 0.89, "learning_rate": 6.73003974112758e-07, "loss": 2.2308, "step": 8844 }, { "epoch": 0.89, "learning_rate": 6.718341020671848e-07, "loss": 2.1727, "step": 8845 }, { "epoch": 0.89, "learning_rate": 6.706652123474388e-07, "loss": 2.2967, "step": 8846 }, { "epoch": 0.89, "learning_rate": 6.694973050766118e-07, "loss": 2.3398, "step": 8847 }, { "epoch": 0.89, "learning_rate": 6.683303803776953e-07, "loss": 2.3768, "step": 8848 }, { "epoch": 0.89, "learning_rate": 6.671644383735732e-07, "loss": 2.2497, "step": 8849 }, { "epoch": 0.89, "learning_rate": 6.659994791870283e-07, "loss": 2.3638, "step": 8850 }, { "epoch": 0.89, "learning_rate": 6.648355029407405e-07, "loss": 2.2944, "step": 8851 }, { "epoch": 0.89, "learning_rate": 6.636725097572872e-07, "loss": 2.3659, "step": 8852 }, { "epoch": 0.89, "learning_rate": 6.625104997591358e-07, "loss": 2.3524, "step": 8853 }, { "epoch": 0.89, "learning_rate": 6.613494730686565e-07, "loss": 2.3657, "step": 8854 }, { "epoch": 0.89, "learning_rate": 6.601894298081157e-07, "loss": 2.2707, "step": 8855 }, { "epoch": 0.89, "learning_rate": 6.590303700996714e-07, "loss": 2.2878, "step": 8856 }, { "epoch": 0.89, "learning_rate": 6.578722940653848e-07, "loss": 2.3269, "step": 8857 }, { "epoch": 0.89, "learning_rate": 6.567152018272082e-07, "loss": 2.2883, "step": 8858 }, { "epoch": 0.89, "learning_rate": 6.5555909350699e-07, "loss": 2.2456, "step": 8859 }, { "epoch": 0.89, "learning_rate": 6.544039692264814e-07, "loss": 2.3624, "step": 8860 }, { "epoch": 0.89, "learning_rate": 6.532498291073231e-07, "loss": 2.2755, "step": 8861 }, { "epoch": 0.89, "learning_rate": 6.520966732710554e-07, "loss": 2.2557, "step": 8862 }, { "epoch": 0.89, "learning_rate": 6.509445018391147e-07, "loss": 2.2436, "step": 8863 }, { "epoch": 0.89, "learning_rate": 6.497933149328328e-07, "loss": 2.3622, "step": 8864 }, { "epoch": 0.89, "learning_rate": 6.486431126734372e-07, "loss": 2.28, "step": 8865 }, { "epoch": 0.89, "learning_rate": 6.474938951820542e-07, "loss": 2.3298, "step": 8866 }, { "epoch": 0.89, "learning_rate": 6.463456625797049e-07, "loss": 2.3068, "step": 8867 }, { "epoch": 0.89, "learning_rate": 6.451984149873047e-07, "loss": 2.3066, "step": 8868 }, { "epoch": 0.89, "learning_rate": 6.440521525256704e-07, "loss": 2.196, "step": 8869 }, { "epoch": 0.89, "learning_rate": 6.429068753155121e-07, "loss": 2.3192, "step": 8870 }, { "epoch": 0.89, "learning_rate": 6.417625834774344e-07, "loss": 2.3639, "step": 8871 }, { "epoch": 0.89, "learning_rate": 6.406192771319397e-07, "loss": 2.328, "step": 8872 }, { "epoch": 0.89, "learning_rate": 6.394769563994274e-07, "loss": 2.274, "step": 8873 }, { "epoch": 0.89, "learning_rate": 6.383356214001923e-07, "loss": 2.2958, "step": 8874 }, { "epoch": 0.89, "learning_rate": 6.37195272254425e-07, "loss": 2.3421, "step": 8875 }, { "epoch": 0.89, "learning_rate": 6.360559090822161e-07, "loss": 2.2236, "step": 8876 }, { "epoch": 0.89, "learning_rate": 6.349175320035427e-07, "loss": 2.3262, "step": 8877 }, { "epoch": 0.89, "learning_rate": 6.337801411382894e-07, "loss": 2.2455, "step": 8878 }, { "epoch": 0.89, "learning_rate": 6.32643736606231e-07, "loss": 2.2931, "step": 8879 }, { "epoch": 0.89, "learning_rate": 6.315083185270387e-07, "loss": 2.1962, "step": 8880 }, { "epoch": 0.89, "learning_rate": 6.303738870202813e-07, "loss": 2.3608, "step": 8881 }, { "epoch": 0.89, "learning_rate": 6.292404422054233e-07, "loss": 2.3183, "step": 8882 }, { "epoch": 0.89, "learning_rate": 6.281079842018234e-07, "loss": 2.265, "step": 8883 }, { "epoch": 0.89, "learning_rate": 6.269765131287387e-07, "loss": 2.3002, "step": 8884 }, { "epoch": 0.89, "learning_rate": 6.258460291053203e-07, "loss": 2.3157, "step": 8885 }, { "epoch": 0.89, "learning_rate": 6.247165322506199e-07, "loss": 2.1794, "step": 8886 }, { "epoch": 0.89, "learning_rate": 6.2358802268358e-07, "loss": 2.3059, "step": 8887 }, { "epoch": 0.89, "learning_rate": 6.224605005230399e-07, "loss": 2.3196, "step": 8888 }, { "epoch": 0.89, "learning_rate": 6.213339658877393e-07, "loss": 2.2918, "step": 8889 }, { "epoch": 0.89, "learning_rate": 6.202084188963076e-07, "loss": 2.3215, "step": 8890 }, { "epoch": 0.89, "learning_rate": 6.190838596672754e-07, "loss": 2.2347, "step": 8891 }, { "epoch": 0.89, "learning_rate": 6.179602883190661e-07, "loss": 2.2968, "step": 8892 }, { "epoch": 0.89, "learning_rate": 6.168377049700003e-07, "loss": 2.3218, "step": 8893 }, { "epoch": 0.89, "learning_rate": 6.157161097382946e-07, "loss": 2.2747, "step": 8894 }, { "epoch": 0.89, "learning_rate": 6.145955027420613e-07, "loss": 2.2607, "step": 8895 }, { "epoch": 0.89, "learning_rate": 6.134758840993093e-07, "loss": 2.3285, "step": 8896 }, { "epoch": 0.89, "learning_rate": 6.123572539279432e-07, "loss": 2.2732, "step": 8897 }, { "epoch": 0.89, "learning_rate": 6.11239612345761e-07, "loss": 2.2996, "step": 8898 }, { "epoch": 0.89, "learning_rate": 6.101229594704605e-07, "loss": 2.2929, "step": 8899 }, { "epoch": 0.89, "learning_rate": 6.090072954196336e-07, "loss": 2.3621, "step": 8900 }, { "epoch": 0.89, "learning_rate": 6.078926203107682e-07, "loss": 2.1659, "step": 8901 }, { "epoch": 0.89, "learning_rate": 6.067789342612462e-07, "loss": 2.3246, "step": 8902 }, { "epoch": 0.89, "learning_rate": 6.056662373883482e-07, "loss": 2.3024, "step": 8903 }, { "epoch": 0.89, "learning_rate": 6.045545298092503e-07, "loss": 2.3575, "step": 8904 }, { "epoch": 0.89, "learning_rate": 6.034438116410235e-07, "loss": 2.3498, "step": 8905 }, { "epoch": 0.89, "learning_rate": 6.023340830006341e-07, "loss": 2.3497, "step": 8906 }, { "epoch": 0.89, "learning_rate": 6.012253440049454e-07, "loss": 2.2488, "step": 8907 }, { "epoch": 0.89, "learning_rate": 6.001175947707149e-07, "loss": 2.3882, "step": 8908 }, { "epoch": 0.89, "learning_rate": 5.990108354145973e-07, "loss": 2.2254, "step": 8909 }, { "epoch": 0.89, "learning_rate": 5.979050660531438e-07, "loss": 2.351, "step": 8910 }, { "epoch": 0.89, "learning_rate": 5.968002868027989e-07, "loss": 2.3851, "step": 8911 }, { "epoch": 0.89, "learning_rate": 5.956964977799029e-07, "loss": 2.338, "step": 8912 }, { "epoch": 0.89, "learning_rate": 5.945936991006973e-07, "loss": 2.2715, "step": 8913 }, { "epoch": 0.89, "learning_rate": 5.934918908813114e-07, "loss": 2.2922, "step": 8914 }, { "epoch": 0.89, "learning_rate": 5.923910732377758e-07, "loss": 2.2456, "step": 8915 }, { "epoch": 0.89, "learning_rate": 5.912912462860155e-07, "loss": 2.3119, "step": 8916 }, { "epoch": 0.89, "learning_rate": 5.901924101418465e-07, "loss": 2.3383, "step": 8917 }, { "epoch": 0.89, "learning_rate": 5.890945649209878e-07, "loss": 2.358, "step": 8918 }, { "epoch": 0.89, "learning_rate": 5.8799771073905e-07, "loss": 2.1149, "step": 8919 }, { "epoch": 0.89, "learning_rate": 5.869018477115396e-07, "loss": 2.2961, "step": 8920 }, { "epoch": 0.89, "learning_rate": 5.858069759538587e-07, "loss": 2.2072, "step": 8921 }, { "epoch": 0.89, "learning_rate": 5.847130955813085e-07, "loss": 2.3145, "step": 8922 }, { "epoch": 0.89, "learning_rate": 5.836202067090801e-07, "loss": 2.3739, "step": 8923 }, { "epoch": 0.89, "learning_rate": 5.825283094522627e-07, "loss": 2.1986, "step": 8924 }, { "epoch": 0.89, "learning_rate": 5.81437403925843e-07, "loss": 2.3035, "step": 8925 }, { "epoch": 0.89, "learning_rate": 5.803474902447014e-07, "loss": 2.278, "step": 8926 }, { "epoch": 0.89, "learning_rate": 5.792585685236118e-07, "loss": 2.2657, "step": 8927 }, { "epoch": 0.89, "learning_rate": 5.781706388772479e-07, "loss": 2.3633, "step": 8928 }, { "epoch": 0.89, "learning_rate": 5.770837014201768e-07, "loss": 2.3154, "step": 8929 }, { "epoch": 0.89, "learning_rate": 5.759977562668583e-07, "loss": 2.3247, "step": 8930 }, { "epoch": 0.89, "learning_rate": 5.749128035316553e-07, "loss": 2.2256, "step": 8931 }, { "epoch": 0.89, "learning_rate": 5.738288433288175e-07, "loss": 2.3692, "step": 8932 }, { "epoch": 0.9, "learning_rate": 5.727458757724968e-07, "loss": 2.292, "step": 8933 }, { "epoch": 0.9, "learning_rate": 5.716639009767367e-07, "loss": 2.2384, "step": 8934 }, { "epoch": 0.9, "learning_rate": 5.705829190554756e-07, "loss": 2.2083, "step": 8935 }, { "epoch": 0.9, "learning_rate": 5.695029301225518e-07, "loss": 2.2695, "step": 8936 }, { "epoch": 0.9, "learning_rate": 5.684239342916953e-07, "loss": 2.2426, "step": 8937 }, { "epoch": 0.9, "learning_rate": 5.673459316765317e-07, "loss": 2.2856, "step": 8938 }, { "epoch": 0.9, "learning_rate": 5.662689223905826e-07, "loss": 2.3694, "step": 8939 }, { "epoch": 0.9, "learning_rate": 5.651929065472661e-07, "loss": 2.2727, "step": 8940 }, { "epoch": 0.9, "learning_rate": 5.641178842598949e-07, "loss": 2.2756, "step": 8941 }, { "epoch": 0.9, "learning_rate": 5.630438556416751e-07, "loss": 2.2569, "step": 8942 }, { "epoch": 0.9, "learning_rate": 5.619708208057129e-07, "loss": 2.2289, "step": 8943 }, { "epoch": 0.9, "learning_rate": 5.608987798650034e-07, "loss": 2.2419, "step": 8944 }, { "epoch": 0.9, "learning_rate": 5.598277329324442e-07, "loss": 2.2502, "step": 8945 }, { "epoch": 0.9, "learning_rate": 5.587576801208217e-07, "loss": 2.2338, "step": 8946 }, { "epoch": 0.9, "learning_rate": 5.576886215428223e-07, "loss": 2.2524, "step": 8947 }, { "epoch": 0.9, "learning_rate": 5.566205573110228e-07, "loss": 2.2325, "step": 8948 }, { "epoch": 0.9, "learning_rate": 5.555534875379032e-07, "loss": 2.3763, "step": 8949 }, { "epoch": 0.9, "learning_rate": 5.544874123358302e-07, "loss": 2.2851, "step": 8950 }, { "epoch": 0.9, "learning_rate": 5.534223318170717e-07, "loss": 2.3151, "step": 8951 }, { "epoch": 0.9, "learning_rate": 5.52358246093787e-07, "loss": 2.2494, "step": 8952 }, { "epoch": 0.9, "learning_rate": 5.512951552780344e-07, "loss": 2.2948, "step": 8953 }, { "epoch": 0.9, "learning_rate": 5.502330594817629e-07, "loss": 2.2896, "step": 8954 }, { "epoch": 0.9, "learning_rate": 5.49171958816821e-07, "loss": 2.3468, "step": 8955 }, { "epoch": 0.9, "learning_rate": 5.481118533949492e-07, "loss": 2.3092, "step": 8956 }, { "epoch": 0.9, "learning_rate": 5.470527433277861e-07, "loss": 2.3856, "step": 8957 }, { "epoch": 0.9, "learning_rate": 5.459946287268614e-07, "loss": 2.2912, "step": 8958 }, { "epoch": 0.9, "learning_rate": 5.449375097036058e-07, "loss": 2.2598, "step": 8959 }, { "epoch": 0.9, "learning_rate": 5.438813863693393e-07, "loss": 2.2505, "step": 8960 }, { "epoch": 0.9, "learning_rate": 5.428262588352807e-07, "loss": 2.3159, "step": 8961 }, { "epoch": 0.9, "learning_rate": 5.41772127212542e-07, "loss": 2.3584, "step": 8962 }, { "epoch": 0.9, "learning_rate": 5.407189916121325e-07, "loss": 2.2416, "step": 8963 }, { "epoch": 0.9, "learning_rate": 5.396668521449544e-07, "loss": 2.3649, "step": 8964 }, { "epoch": 0.9, "learning_rate": 5.386157089218058e-07, "loss": 2.3537, "step": 8965 }, { "epoch": 0.9, "learning_rate": 5.375655620533793e-07, "loss": 2.2533, "step": 8966 }, { "epoch": 0.9, "learning_rate": 5.365164116502653e-07, "loss": 2.2763, "step": 8967 }, { "epoch": 0.9, "learning_rate": 5.354682578229453e-07, "loss": 2.1358, "step": 8968 }, { "epoch": 0.9, "learning_rate": 5.34421100681799e-07, "loss": 2.2743, "step": 8969 }, { "epoch": 0.9, "learning_rate": 5.333749403371003e-07, "loss": 2.2248, "step": 8970 }, { "epoch": 0.9, "learning_rate": 5.323297768990154e-07, "loss": 2.2675, "step": 8971 }, { "epoch": 0.9, "learning_rate": 5.312856104776098e-07, "loss": 2.2676, "step": 8972 }, { "epoch": 0.9, "learning_rate": 5.302424411828421e-07, "loss": 2.2091, "step": 8973 }, { "epoch": 0.9, "learning_rate": 5.292002691245645e-07, "loss": 2.3255, "step": 8974 }, { "epoch": 0.9, "learning_rate": 5.281590944125259e-07, "loss": 2.2441, "step": 8975 }, { "epoch": 0.9, "learning_rate": 5.271189171563707e-07, "loss": 2.2654, "step": 8976 }, { "epoch": 0.9, "learning_rate": 5.26079737465638e-07, "loss": 2.4061, "step": 8977 }, { "epoch": 0.9, "learning_rate": 5.25041555449759e-07, "loss": 2.3747, "step": 8978 }, { "epoch": 0.9, "learning_rate": 5.240043712180632e-07, "loss": 2.2971, "step": 8979 }, { "epoch": 0.9, "learning_rate": 5.229681848797752e-07, "loss": 2.3438, "step": 8980 }, { "epoch": 0.9, "learning_rate": 5.219329965440112e-07, "loss": 2.2839, "step": 8981 }, { "epoch": 0.9, "learning_rate": 5.208988063197851e-07, "loss": 2.1798, "step": 8982 }, { "epoch": 0.9, "learning_rate": 5.198656143160042e-07, "loss": 2.3112, "step": 8983 }, { "epoch": 0.9, "learning_rate": 5.188334206414702e-07, "loss": 2.3125, "step": 8984 }, { "epoch": 0.9, "learning_rate": 5.178022254048843e-07, "loss": 2.1461, "step": 8985 }, { "epoch": 0.9, "learning_rate": 5.16772028714837e-07, "loss": 2.3312, "step": 8986 }, { "epoch": 0.9, "learning_rate": 5.157428306798162e-07, "loss": 2.3813, "step": 8987 }, { "epoch": 0.9, "learning_rate": 5.147146314082041e-07, "loss": 2.2331, "step": 8988 }, { "epoch": 0.9, "learning_rate": 5.136874310082773e-07, "loss": 2.3625, "step": 8989 }, { "epoch": 0.9, "learning_rate": 5.126612295882083e-07, "loss": 2.3852, "step": 8990 }, { "epoch": 0.9, "learning_rate": 5.116360272560639e-07, "loss": 2.319, "step": 8991 }, { "epoch": 0.9, "learning_rate": 5.106118241198044e-07, "loss": 2.3604, "step": 8992 }, { "epoch": 0.9, "learning_rate": 5.095886202872869e-07, "loss": 2.3092, "step": 8993 }, { "epoch": 0.9, "learning_rate": 5.085664158662628e-07, "loss": 2.3786, "step": 8994 }, { "epoch": 0.9, "learning_rate": 5.075452109643786e-07, "loss": 2.2384, "step": 8995 }, { "epoch": 0.9, "learning_rate": 5.065250056891735e-07, "loss": 2.2421, "step": 8996 }, { "epoch": 0.9, "learning_rate": 5.055058001480828e-07, "loss": 2.3104, "step": 8997 }, { "epoch": 0.9, "learning_rate": 5.044875944484373e-07, "loss": 2.2754, "step": 8998 }, { "epoch": 0.9, "learning_rate": 5.034703886974612e-07, "loss": 2.3843, "step": 8999 }, { "epoch": 0.9, "learning_rate": 5.024541830022733e-07, "loss": 2.2052, "step": 9000 }, { "epoch": 0.9, "learning_rate": 5.014389774698891e-07, "loss": 2.2707, "step": 9001 }, { "epoch": 0.9, "learning_rate": 5.004247722072164e-07, "loss": 2.2783, "step": 9002 }, { "epoch": 0.9, "learning_rate": 4.994115673210575e-07, "loss": 2.2318, "step": 9003 }, { "epoch": 0.9, "learning_rate": 4.983993629181128e-07, "loss": 2.2175, "step": 9004 }, { "epoch": 0.9, "learning_rate": 4.973881591049745e-07, "loss": 2.3298, "step": 9005 }, { "epoch": 0.9, "learning_rate": 4.963779559881287e-07, "loss": 2.2959, "step": 9006 }, { "epoch": 0.9, "learning_rate": 4.953687536739571e-07, "loss": 2.3885, "step": 9007 }, { "epoch": 0.9, "learning_rate": 4.943605522687389e-07, "loss": 2.2742, "step": 9008 }, { "epoch": 0.9, "learning_rate": 4.933533518786426e-07, "loss": 2.2048, "step": 9009 }, { "epoch": 0.9, "learning_rate": 4.923471526097357e-07, "loss": 2.3477, "step": 9010 }, { "epoch": 0.9, "learning_rate": 4.913419545679754e-07, "loss": 2.2259, "step": 9011 }, { "epoch": 0.9, "learning_rate": 4.903377578592205e-07, "loss": 2.3876, "step": 9012 }, { "epoch": 0.9, "learning_rate": 4.893345625892199e-07, "loss": 2.2538, "step": 9013 }, { "epoch": 0.9, "learning_rate": 4.883323688636155e-07, "loss": 2.33, "step": 9014 }, { "epoch": 0.9, "learning_rate": 4.873311767879474e-07, "loss": 2.273, "step": 9015 }, { "epoch": 0.9, "learning_rate": 4.86330986467648e-07, "loss": 2.2993, "step": 9016 }, { "epoch": 0.9, "learning_rate": 4.853317980080452e-07, "loss": 2.3077, "step": 9017 }, { "epoch": 0.9, "learning_rate": 4.843336115143615e-07, "loss": 2.2509, "step": 9018 }, { "epoch": 0.9, "learning_rate": 4.833364270917119e-07, "loss": 2.2544, "step": 9019 }, { "epoch": 0.9, "learning_rate": 4.823402448451075e-07, "loss": 2.2472, "step": 9020 }, { "epoch": 0.9, "learning_rate": 4.813450648794559e-07, "loss": 2.3575, "step": 9021 }, { "epoch": 0.9, "learning_rate": 4.803508872995554e-07, "loss": 2.2503, "step": 9022 }, { "epoch": 0.9, "learning_rate": 4.793577122101001e-07, "loss": 2.2092, "step": 9023 }, { "epoch": 0.9, "learning_rate": 4.783655397156794e-07, "loss": 2.2748, "step": 9024 }, { "epoch": 0.9, "learning_rate": 4.773743699207767e-07, "loss": 2.3574, "step": 9025 }, { "epoch": 0.9, "learning_rate": 4.763842029297683e-07, "loss": 2.3482, "step": 9026 }, { "epoch": 0.9, "learning_rate": 4.7539503884692864e-07, "loss": 2.2832, "step": 9027 }, { "epoch": 0.9, "learning_rate": 4.74406877776421e-07, "loss": 2.3658, "step": 9028 }, { "epoch": 0.9, "learning_rate": 4.7341971982230784e-07, "loss": 2.383, "step": 9029 }, { "epoch": 0.9, "learning_rate": 4.724335650885459e-07, "loss": 2.3102, "step": 9030 }, { "epoch": 0.9, "learning_rate": 4.714484136789821e-07, "loss": 2.3239, "step": 9031 }, { "epoch": 0.9, "learning_rate": 4.704642656973613e-07, "loss": 2.2767, "step": 9032 }, { "epoch": 0.91, "learning_rate": 4.694811212473216e-07, "loss": 2.3744, "step": 9033 }, { "epoch": 0.91, "learning_rate": 4.684989804323958e-07, "loss": 2.2866, "step": 9034 }, { "epoch": 0.91, "learning_rate": 4.675178433560101e-07, "loss": 2.2551, "step": 9035 }, { "epoch": 0.91, "learning_rate": 4.665377101214863e-07, "loss": 2.2367, "step": 9036 }, { "epoch": 0.91, "learning_rate": 4.6555858083203843e-07, "loss": 2.2788, "step": 9037 }, { "epoch": 0.91, "learning_rate": 4.6458045559077626e-07, "loss": 2.3525, "step": 9038 }, { "epoch": 0.91, "learning_rate": 4.636033345007063e-07, "loss": 2.3043, "step": 9039 }, { "epoch": 0.91, "learning_rate": 4.6262721766472395e-07, "loss": 2.1956, "step": 9040 }, { "epoch": 0.91, "learning_rate": 4.6165210518562263e-07, "loss": 2.2607, "step": 9041 }, { "epoch": 0.91, "learning_rate": 4.606779971660902e-07, "loss": 2.365, "step": 9042 }, { "epoch": 0.91, "learning_rate": 4.597048937087056e-07, "loss": 2.2627, "step": 9043 }, { "epoch": 0.91, "learning_rate": 4.587327949159459e-07, "loss": 2.2508, "step": 9044 }, { "epoch": 0.91, "learning_rate": 4.57761700890178e-07, "loss": 2.408, "step": 9045 }, { "epoch": 0.91, "learning_rate": 4.567916117336657e-07, "loss": 2.2392, "step": 9046 }, { "epoch": 0.91, "learning_rate": 4.5582252754856725e-07, "loss": 2.2319, "step": 9047 }, { "epoch": 0.91, "learning_rate": 4.548544484369355e-07, "loss": 2.3601, "step": 9048 }, { "epoch": 0.91, "learning_rate": 4.5388737450071664e-07, "loss": 2.3476, "step": 9049 }, { "epoch": 0.91, "learning_rate": 4.529213058417481e-07, "loss": 2.3191, "step": 9050 }, { "epoch": 0.91, "learning_rate": 4.519562425617674e-07, "loss": 2.2415, "step": 9051 }, { "epoch": 0.91, "learning_rate": 4.5099218476240104e-07, "loss": 2.2683, "step": 9052 }, { "epoch": 0.91, "learning_rate": 4.500291325451711e-07, "loss": 2.3211, "step": 9053 }, { "epoch": 0.91, "learning_rate": 4.490670860114954e-07, "loss": 2.2714, "step": 9054 }, { "epoch": 0.91, "learning_rate": 4.48106045262684e-07, "loss": 2.295, "step": 9055 }, { "epoch": 0.91, "learning_rate": 4.4714601039994144e-07, "loss": 2.2974, "step": 9056 }, { "epoch": 0.91, "learning_rate": 4.4618698152436915e-07, "loss": 2.2884, "step": 9057 }, { "epoch": 0.91, "learning_rate": 4.4522895873695625e-07, "loss": 2.2861, "step": 9058 }, { "epoch": 0.91, "learning_rate": 4.4427194213859216e-07, "loss": 2.2653, "step": 9059 }, { "epoch": 0.91, "learning_rate": 4.433159318300584e-07, "loss": 2.3281, "step": 9060 }, { "epoch": 0.91, "learning_rate": 4.4236092791202777e-07, "loss": 2.3226, "step": 9061 }, { "epoch": 0.91, "learning_rate": 4.414069304850699e-07, "loss": 2.3037, "step": 9062 }, { "epoch": 0.91, "learning_rate": 4.4045393964964875e-07, "loss": 2.3638, "step": 9063 }, { "epoch": 0.91, "learning_rate": 4.3950195550612197e-07, "loss": 2.245, "step": 9064 }, { "epoch": 0.91, "learning_rate": 4.3855097815473923e-07, "loss": 2.3018, "step": 9065 }, { "epoch": 0.91, "learning_rate": 4.376010076956461e-07, "loss": 2.1746, "step": 9066 }, { "epoch": 0.91, "learning_rate": 4.366520442288813e-07, "loss": 2.3289, "step": 9067 }, { "epoch": 0.91, "learning_rate": 4.3570408785437833e-07, "loss": 2.3594, "step": 9068 }, { "epoch": 0.91, "learning_rate": 4.34757138671964e-07, "loss": 2.2304, "step": 9069 }, { "epoch": 0.91, "learning_rate": 4.338111967813585e-07, "loss": 2.3623, "step": 9070 }, { "epoch": 0.91, "learning_rate": 4.328662622821778e-07, "loss": 2.2587, "step": 9071 }, { "epoch": 0.91, "learning_rate": 4.319223352739299e-07, "loss": 2.4377, "step": 9072 }, { "epoch": 0.91, "learning_rate": 4.309794158560154e-07, "loss": 2.3152, "step": 9073 }, { "epoch": 0.91, "learning_rate": 4.3003750412773495e-07, "loss": 2.3518, "step": 9074 }, { "epoch": 0.91, "learning_rate": 4.290966001882757e-07, "loss": 2.2843, "step": 9075 }, { "epoch": 0.91, "learning_rate": 4.2815670413672403e-07, "loss": 2.2972, "step": 9076 }, { "epoch": 0.91, "learning_rate": 4.2721781607205635e-07, "loss": 2.2279, "step": 9077 }, { "epoch": 0.91, "learning_rate": 4.262799360931458e-07, "loss": 2.3864, "step": 9078 }, { "epoch": 0.91, "learning_rate": 4.253430642987566e-07, "loss": 2.3167, "step": 9079 }, { "epoch": 0.91, "learning_rate": 4.2440720078754993e-07, "loss": 2.3461, "step": 9080 }, { "epoch": 0.91, "learning_rate": 4.2347234565807917e-07, "loss": 2.31, "step": 9081 }, { "epoch": 0.91, "learning_rate": 4.2253849900878996e-07, "loss": 2.3133, "step": 9082 }, { "epoch": 0.91, "learning_rate": 4.216056609380259e-07, "loss": 2.295, "step": 9083 }, { "epoch": 0.91, "learning_rate": 4.206738315440195e-07, "loss": 2.2707, "step": 9084 }, { "epoch": 0.91, "learning_rate": 4.197430109249012e-07, "loss": 2.3138, "step": 9085 }, { "epoch": 0.91, "learning_rate": 4.1881319917869143e-07, "loss": 2.2636, "step": 9086 }, { "epoch": 0.91, "learning_rate": 4.178843964033086e-07, "loss": 2.3638, "step": 9087 }, { "epoch": 0.91, "learning_rate": 4.1695660269655993e-07, "loss": 2.2876, "step": 9088 }, { "epoch": 0.91, "learning_rate": 4.160298181561517e-07, "loss": 2.3048, "step": 9089 }, { "epoch": 0.91, "learning_rate": 4.151040428796793e-07, "loss": 2.2593, "step": 9090 }, { "epoch": 0.91, "learning_rate": 4.1417927696463356e-07, "loss": 2.3282, "step": 9091 }, { "epoch": 0.91, "learning_rate": 4.1325552050840213e-07, "loss": 2.2864, "step": 9092 }, { "epoch": 0.91, "learning_rate": 4.1233277360826165e-07, "loss": 2.2298, "step": 9093 }, { "epoch": 0.91, "learning_rate": 4.1141103636138433e-07, "loss": 2.3562, "step": 9094 }, { "epoch": 0.91, "learning_rate": 4.1049030886483485e-07, "loss": 2.3265, "step": 9095 }, { "epoch": 0.91, "learning_rate": 4.095705912155756e-07, "loss": 2.2646, "step": 9096 }, { "epoch": 0.91, "learning_rate": 4.0865188351045694e-07, "loss": 2.3202, "step": 9097 }, { "epoch": 0.91, "learning_rate": 4.0773418584622694e-07, "loss": 2.2465, "step": 9098 }, { "epoch": 0.91, "learning_rate": 4.068174983195261e-07, "loss": 2.291, "step": 9099 }, { "epoch": 0.91, "learning_rate": 4.0590182102688725e-07, "loss": 2.1637, "step": 9100 }, { "epoch": 0.91, "learning_rate": 4.0498715406473987e-07, "loss": 2.2751, "step": 9101 }, { "epoch": 0.91, "learning_rate": 4.040734975294047e-07, "loss": 2.2215, "step": 9102 }, { "epoch": 0.91, "learning_rate": 4.0316085151709597e-07, "loss": 2.2631, "step": 9103 }, { "epoch": 0.91, "learning_rate": 4.022492161239233e-07, "loss": 2.3371, "step": 9104 }, { "epoch": 0.91, "learning_rate": 4.013385914458878e-07, "loss": 2.3216, "step": 9105 }, { "epoch": 0.91, "learning_rate": 4.00428977578885e-07, "loss": 2.3216, "step": 9106 }, { "epoch": 0.91, "learning_rate": 3.9952037461870484e-07, "loss": 2.244, "step": 9107 }, { "epoch": 0.91, "learning_rate": 3.986127826610298e-07, "loss": 2.2855, "step": 9108 }, { "epoch": 0.91, "learning_rate": 3.977062018014344e-07, "loss": 2.3403, "step": 9109 }, { "epoch": 0.91, "learning_rate": 3.968006321353912e-07, "loss": 2.21, "step": 9110 }, { "epoch": 0.91, "learning_rate": 3.9589607375826176e-07, "loss": 2.3094, "step": 9111 }, { "epoch": 0.91, "learning_rate": 3.949925267653032e-07, "loss": 2.329, "step": 9112 }, { "epoch": 0.91, "learning_rate": 3.94089991251666e-07, "loss": 2.2043, "step": 9113 }, { "epoch": 0.91, "learning_rate": 3.9318846731239315e-07, "loss": 2.2867, "step": 9114 }, { "epoch": 0.91, "learning_rate": 3.9228795504242303e-07, "loss": 2.1965, "step": 9115 }, { "epoch": 0.91, "learning_rate": 3.913884545365865e-07, "loss": 2.3412, "step": 9116 }, { "epoch": 0.91, "learning_rate": 3.9048996588960554e-07, "loss": 2.334, "step": 9117 }, { "epoch": 0.91, "learning_rate": 3.8959248919609894e-07, "loss": 2.374, "step": 9118 }, { "epoch": 0.91, "learning_rate": 3.886960245505789e-07, "loss": 2.3164, "step": 9119 }, { "epoch": 0.91, "learning_rate": 3.878005720474498e-07, "loss": 2.3035, "step": 9120 }, { "epoch": 0.91, "learning_rate": 3.869061317810074e-07, "loss": 2.3412, "step": 9121 }, { "epoch": 0.91, "learning_rate": 3.860127038454453e-07, "loss": 2.2509, "step": 9122 }, { "epoch": 0.91, "learning_rate": 3.851202883348459e-07, "loss": 2.2534, "step": 9123 }, { "epoch": 0.91, "learning_rate": 3.842288853431897e-07, "loss": 2.2591, "step": 9124 }, { "epoch": 0.91, "learning_rate": 3.8333849496434593e-07, "loss": 2.2332, "step": 9125 }, { "epoch": 0.91, "learning_rate": 3.824491172920808e-07, "loss": 2.4013, "step": 9126 }, { "epoch": 0.91, "learning_rate": 3.8156075242005265e-07, "loss": 2.2085, "step": 9127 }, { "epoch": 0.91, "learning_rate": 3.806734004418111e-07, "loss": 2.2876, "step": 9128 }, { "epoch": 0.91, "learning_rate": 3.7978706145080255e-07, "loss": 2.3161, "step": 9129 }, { "epoch": 0.91, "learning_rate": 3.789017355403646e-07, "loss": 2.2848, "step": 9130 }, { "epoch": 0.91, "learning_rate": 3.780174228037292e-07, "loss": 2.3453, "step": 9131 }, { "epoch": 0.91, "learning_rate": 3.771341233340209e-07, "loss": 2.3981, "step": 9132 }, { "epoch": 0.92, "learning_rate": 3.762518372242563e-07, "loss": 2.1937, "step": 9133 }, { "epoch": 0.92, "learning_rate": 3.7537056456735e-07, "loss": 2.2778, "step": 9134 }, { "epoch": 0.92, "learning_rate": 3.744903054561033e-07, "loss": 2.2985, "step": 9135 }, { "epoch": 0.92, "learning_rate": 3.7361105998321435e-07, "loss": 2.2448, "step": 9136 }, { "epoch": 0.92, "learning_rate": 3.7273282824127677e-07, "loss": 2.1872, "step": 9137 }, { "epoch": 0.92, "learning_rate": 3.718556103227744e-07, "loss": 2.2983, "step": 9138 }, { "epoch": 0.92, "learning_rate": 3.7097940632008334e-07, "loss": 2.3916, "step": 9139 }, { "epoch": 0.92, "learning_rate": 3.7010421632547533e-07, "loss": 2.3328, "step": 9140 }, { "epoch": 0.92, "learning_rate": 3.6923004043111443e-07, "loss": 2.3151, "step": 9141 }, { "epoch": 0.92, "learning_rate": 3.6835687872905704e-07, "loss": 2.2394, "step": 9142 }, { "epoch": 0.92, "learning_rate": 3.674847313112551e-07, "loss": 2.2535, "step": 9143 }, { "epoch": 0.92, "learning_rate": 3.6661359826955066e-07, "loss": 2.1673, "step": 9144 }, { "epoch": 0.92, "learning_rate": 3.6574347969568157e-07, "loss": 2.2822, "step": 9145 }, { "epoch": 0.92, "learning_rate": 3.648743756812778e-07, "loss": 2.3626, "step": 9146 }, { "epoch": 0.92, "learning_rate": 3.6400628631786395e-07, "loss": 2.2721, "step": 9147 }, { "epoch": 0.92, "learning_rate": 3.6313921169685353e-07, "loss": 2.2826, "step": 9148 }, { "epoch": 0.92, "learning_rate": 3.622731519095579e-07, "loss": 2.3215, "step": 9149 }, { "epoch": 0.92, "learning_rate": 3.6140810704717753e-07, "loss": 2.2424, "step": 9150 }, { "epoch": 0.92, "learning_rate": 3.6054407720081064e-07, "loss": 2.3118, "step": 9151 }, { "epoch": 0.92, "learning_rate": 3.5968106246144554e-07, "loss": 2.2479, "step": 9152 }, { "epoch": 0.92, "learning_rate": 3.588190629199628e-07, "loss": 2.3081, "step": 9153 }, { "epoch": 0.92, "learning_rate": 3.5795807866713773e-07, "loss": 2.3584, "step": 9154 }, { "epoch": 0.92, "learning_rate": 3.570981097936399e-07, "loss": 2.3326, "step": 9155 }, { "epoch": 0.92, "learning_rate": 3.5623915639002916e-07, "loss": 2.3063, "step": 9156 }, { "epoch": 0.92, "learning_rate": 3.553812185467609e-07, "loss": 2.2757, "step": 9157 }, { "epoch": 0.92, "learning_rate": 3.5452429635418174e-07, "loss": 2.2854, "step": 9158 }, { "epoch": 0.92, "learning_rate": 3.536683899025317e-07, "loss": 2.3194, "step": 9159 }, { "epoch": 0.92, "learning_rate": 3.528134992819443e-07, "loss": 2.2495, "step": 9160 }, { "epoch": 0.92, "learning_rate": 3.5195962458244526e-07, "loss": 2.1983, "step": 9161 }, { "epoch": 0.92, "learning_rate": 3.5110676589395597e-07, "loss": 2.2205, "step": 9162 }, { "epoch": 0.92, "learning_rate": 3.5025492330628576e-07, "loss": 2.2582, "step": 9163 }, { "epoch": 0.92, "learning_rate": 3.494040969091428e-07, "loss": 2.2782, "step": 9164 }, { "epoch": 0.92, "learning_rate": 3.4855428679212543e-07, "loss": 2.25, "step": 9165 }, { "epoch": 0.92, "learning_rate": 3.4770549304472434e-07, "loss": 2.2932, "step": 9166 }, { "epoch": 0.92, "learning_rate": 3.4685771575632244e-07, "loss": 2.2269, "step": 9167 }, { "epoch": 0.92, "learning_rate": 3.4601095501619944e-07, "loss": 2.4117, "step": 9168 }, { "epoch": 0.92, "learning_rate": 3.45165210913524e-07, "loss": 2.31, "step": 9169 }, { "epoch": 0.92, "learning_rate": 3.4432048353736036e-07, "loss": 2.3194, "step": 9170 }, { "epoch": 0.92, "learning_rate": 3.4347677297666413e-07, "loss": 2.2148, "step": 9171 }, { "epoch": 0.92, "learning_rate": 3.4263407932028313e-07, "loss": 2.4192, "step": 9172 }, { "epoch": 0.92, "learning_rate": 3.417924026569619e-07, "loss": 2.2966, "step": 9173 }, { "epoch": 0.92, "learning_rate": 3.4095174307533285e-07, "loss": 2.2823, "step": 9174 }, { "epoch": 0.92, "learning_rate": 3.4011210066392633e-07, "loss": 2.2884, "step": 9175 }, { "epoch": 0.92, "learning_rate": 3.392734755111604e-07, "loss": 2.3218, "step": 9176 }, { "epoch": 0.92, "learning_rate": 3.38435867705349e-07, "loss": 2.25, "step": 9177 }, { "epoch": 0.92, "learning_rate": 3.3759927733470033e-07, "loss": 2.2844, "step": 9178 }, { "epoch": 0.92, "learning_rate": 3.3676370448731176e-07, "loss": 2.3319, "step": 9179 }, { "epoch": 0.92, "learning_rate": 3.3592914925117624e-07, "loss": 2.409, "step": 9180 }, { "epoch": 0.92, "learning_rate": 3.3509561171417794e-07, "loss": 2.3622, "step": 9181 }, { "epoch": 0.92, "learning_rate": 3.3426309196409546e-07, "loss": 2.3094, "step": 9182 }, { "epoch": 0.92, "learning_rate": 3.3343159008859984e-07, "loss": 2.2649, "step": 9183 }, { "epoch": 0.92, "learning_rate": 3.326011061752532e-07, "loss": 2.3404, "step": 9184 }, { "epoch": 0.92, "learning_rate": 3.3177164031151344e-07, "loss": 2.2782, "step": 9185 }, { "epoch": 0.92, "learning_rate": 3.309431925847273e-07, "loss": 2.3645, "step": 9186 }, { "epoch": 0.92, "learning_rate": 3.3011576308213724e-07, "loss": 2.2482, "step": 9187 }, { "epoch": 0.92, "learning_rate": 3.2928935189087906e-07, "loss": 2.2156, "step": 9188 }, { "epoch": 0.92, "learning_rate": 3.2846395909797877e-07, "loss": 2.3495, "step": 9189 }, { "epoch": 0.92, "learning_rate": 3.276395847903568e-07, "loss": 2.3182, "step": 9190 }, { "epoch": 0.92, "learning_rate": 3.26816229054826e-07, "loss": 2.2474, "step": 9191 }, { "epoch": 0.92, "learning_rate": 3.259938919780914e-07, "loss": 2.3269, "step": 9192 }, { "epoch": 0.92, "learning_rate": 3.251725736467526e-07, "loss": 2.2525, "step": 9193 }, { "epoch": 0.92, "learning_rate": 3.243522741472993e-07, "loss": 2.1799, "step": 9194 }, { "epoch": 0.92, "learning_rate": 3.2353299356611467e-07, "loss": 2.2965, "step": 9195 }, { "epoch": 0.92, "learning_rate": 3.2271473198947744e-07, "loss": 2.3897, "step": 9196 }, { "epoch": 0.92, "learning_rate": 3.2189748950355425e-07, "loss": 2.2829, "step": 9197 }, { "epoch": 0.92, "learning_rate": 3.210812661944085e-07, "loss": 2.2862, "step": 9198 }, { "epoch": 0.92, "learning_rate": 3.202660621479925e-07, "loss": 2.238, "step": 9199 }, { "epoch": 0.92, "learning_rate": 3.194518774501565e-07, "loss": 2.3511, "step": 9200 }, { "epoch": 0.92, "learning_rate": 3.1863871218663856e-07, "loss": 2.3605, "step": 9201 }, { "epoch": 0.92, "learning_rate": 3.178265664430702e-07, "loss": 2.2728, "step": 9202 }, { "epoch": 0.92, "learning_rate": 3.1701544030497855e-07, "loss": 2.3204, "step": 9203 }, { "epoch": 0.92, "learning_rate": 3.1620533385777863e-07, "loss": 2.3362, "step": 9204 }, { "epoch": 0.92, "learning_rate": 3.153962471867833e-07, "loss": 2.2928, "step": 9205 }, { "epoch": 0.92, "learning_rate": 3.145881803771944e-07, "loss": 2.2569, "step": 9206 }, { "epoch": 0.92, "learning_rate": 3.137811335141072e-07, "loss": 2.2879, "step": 9207 }, { "epoch": 0.92, "learning_rate": 3.129751066825093e-07, "loss": 2.2837, "step": 9208 }, { "epoch": 0.92, "learning_rate": 3.121700999672828e-07, "loss": 2.2164, "step": 9209 }, { "epoch": 0.92, "learning_rate": 3.113661134531998e-07, "loss": 2.2781, "step": 9210 }, { "epoch": 0.92, "learning_rate": 3.105631472249282e-07, "loss": 2.3405, "step": 9211 }, { "epoch": 0.92, "learning_rate": 3.097612013670226e-07, "loss": 2.3202, "step": 9212 }, { "epoch": 0.92, "learning_rate": 3.0896027596393654e-07, "loss": 2.3168, "step": 9213 }, { "epoch": 0.92, "learning_rate": 3.081603711000136e-07, "loss": 2.2708, "step": 9214 }, { "epoch": 0.92, "learning_rate": 3.073614868594876e-07, "loss": 2.2654, "step": 9215 }, { "epoch": 0.92, "learning_rate": 3.0656362332649015e-07, "loss": 2.2858, "step": 9216 }, { "epoch": 0.92, "learning_rate": 3.057667805850384e-07, "loss": 2.3393, "step": 9217 }, { "epoch": 0.92, "learning_rate": 3.049709587190497e-07, "loss": 2.3144, "step": 9218 }, { "epoch": 0.92, "learning_rate": 3.041761578123281e-07, "loss": 2.3175, "step": 9219 }, { "epoch": 0.92, "learning_rate": 3.033823779485723e-07, "loss": 2.2929, "step": 9220 }, { "epoch": 0.92, "learning_rate": 3.025896192113742e-07, "loss": 2.28, "step": 9221 }, { "epoch": 0.92, "learning_rate": 3.0179788168421596e-07, "loss": 2.2455, "step": 9222 }, { "epoch": 0.92, "learning_rate": 3.0100716545047426e-07, "loss": 2.2553, "step": 9223 }, { "epoch": 0.92, "learning_rate": 3.002174705934169e-07, "loss": 2.3082, "step": 9224 }, { "epoch": 0.92, "learning_rate": 2.9942879719620396e-07, "loss": 2.2753, "step": 9225 }, { "epoch": 0.92, "learning_rate": 2.9864114534189024e-07, "loss": 2.3399, "step": 9226 }, { "epoch": 0.92, "learning_rate": 2.978545151134216e-07, "loss": 2.2792, "step": 9227 }, { "epoch": 0.92, "learning_rate": 2.9706890659363494e-07, "loss": 2.3357, "step": 9228 }, { "epoch": 0.92, "learning_rate": 2.9628431986526094e-07, "loss": 2.2151, "step": 9229 }, { "epoch": 0.92, "learning_rate": 2.9550075501092234e-07, "loss": 2.3221, "step": 9230 }, { "epoch": 0.92, "learning_rate": 2.9471821211313534e-07, "loss": 2.2904, "step": 9231 }, { "epoch": 0.92, "learning_rate": 2.9393669125430625e-07, "loss": 2.1971, "step": 9232 }, { "epoch": 0.93, "learning_rate": 2.931561925167359e-07, "loss": 2.2426, "step": 9233 }, { "epoch": 0.93, "learning_rate": 2.9237671598261743e-07, "loss": 2.2673, "step": 9234 }, { "epoch": 0.93, "learning_rate": 2.915982617340341e-07, "loss": 2.3188, "step": 9235 }, { "epoch": 0.93, "learning_rate": 2.9082082985296244e-07, "loss": 2.3391, "step": 9236 }, { "epoch": 0.93, "learning_rate": 2.900444204212738e-07, "loss": 2.233, "step": 9237 }, { "epoch": 0.93, "learning_rate": 2.892690335207293e-07, "loss": 2.3147, "step": 9238 }, { "epoch": 0.93, "learning_rate": 2.884946692329826e-07, "loss": 2.3538, "step": 9239 }, { "epoch": 0.93, "learning_rate": 2.8772132763957963e-07, "loss": 2.2042, "step": 9240 }, { "epoch": 0.93, "learning_rate": 2.869490088219606e-07, "loss": 2.2752, "step": 9241 }, { "epoch": 0.93, "learning_rate": 2.86177712861454e-07, "loss": 2.1183, "step": 9242 }, { "epoch": 0.93, "learning_rate": 2.8540743983928475e-07, "loss": 2.2367, "step": 9243 }, { "epoch": 0.93, "learning_rate": 2.846381898365691e-07, "loss": 2.2255, "step": 9244 }, { "epoch": 0.93, "learning_rate": 2.838699629343134e-07, "loss": 2.318, "step": 9245 }, { "epoch": 0.93, "learning_rate": 2.8310275921341947e-07, "loss": 2.3766, "step": 9246 }, { "epoch": 0.93, "learning_rate": 2.8233657875467724e-07, "loss": 2.4037, "step": 9247 }, { "epoch": 0.93, "learning_rate": 2.815714216387733e-07, "loss": 2.3218, "step": 9248 }, { "epoch": 0.93, "learning_rate": 2.8080728794628307e-07, "loss": 2.3214, "step": 9249 }, { "epoch": 0.93, "learning_rate": 2.8004417775767565e-07, "loss": 2.2906, "step": 9250 }, { "epoch": 0.93, "learning_rate": 2.792820911533134e-07, "loss": 2.2416, "step": 9251 }, { "epoch": 0.93, "learning_rate": 2.785210282134487e-07, "loss": 2.295, "step": 9252 }, { "epoch": 0.93, "learning_rate": 2.7776098901822646e-07, "loss": 2.2357, "step": 9253 }, { "epoch": 0.93, "learning_rate": 2.77001973647687e-07, "loss": 2.3647, "step": 9254 }, { "epoch": 0.93, "learning_rate": 2.7624398218175864e-07, "loss": 2.3358, "step": 9255 }, { "epoch": 0.93, "learning_rate": 2.7548701470026306e-07, "loss": 2.3112, "step": 9256 }, { "epoch": 0.93, "learning_rate": 2.747310712829165e-07, "loss": 2.405, "step": 9257 }, { "epoch": 0.93, "learning_rate": 2.7397615200932317e-07, "loss": 2.2512, "step": 9258 }, { "epoch": 0.93, "learning_rate": 2.7322225695898374e-07, "loss": 2.2813, "step": 9259 }, { "epoch": 0.93, "learning_rate": 2.7246938621128813e-07, "loss": 2.3219, "step": 9260 }, { "epoch": 0.93, "learning_rate": 2.717175398455174e-07, "loss": 2.2593, "step": 9261 }, { "epoch": 0.93, "learning_rate": 2.7096671794085037e-07, "loss": 2.3924, "step": 9262 }, { "epoch": 0.93, "learning_rate": 2.7021692057635165e-07, "loss": 2.2749, "step": 9263 }, { "epoch": 0.93, "learning_rate": 2.694681478309824e-07, "loss": 2.2468, "step": 9264 }, { "epoch": 0.93, "learning_rate": 2.687203997835919e-07, "loss": 2.1582, "step": 9265 }, { "epoch": 0.93, "learning_rate": 2.6797367651292485e-07, "loss": 2.3059, "step": 9266 }, { "epoch": 0.93, "learning_rate": 2.672279780976161e-07, "loss": 2.2074, "step": 9267 }, { "epoch": 0.93, "learning_rate": 2.664833046161941e-07, "loss": 2.2669, "step": 9268 }, { "epoch": 0.93, "learning_rate": 2.657396561470782e-07, "loss": 2.1645, "step": 9269 }, { "epoch": 0.93, "learning_rate": 2.6499703276857915e-07, "loss": 2.3004, "step": 9270 }, { "epoch": 0.93, "learning_rate": 2.642554345589032e-07, "loss": 2.2934, "step": 9271 }, { "epoch": 0.93, "learning_rate": 2.635148615961447e-07, "loss": 2.273, "step": 9272 }, { "epoch": 0.93, "learning_rate": 2.6277531395829117e-07, "loss": 2.3227, "step": 9273 }, { "epoch": 0.93, "learning_rate": 2.620367917232225e-07, "loss": 2.272, "step": 9274 }, { "epoch": 0.93, "learning_rate": 2.612992949687121e-07, "loss": 2.3417, "step": 9275 }, { "epoch": 0.93, "learning_rate": 2.605628237724223e-07, "loss": 2.2555, "step": 9276 }, { "epoch": 0.93, "learning_rate": 2.5982737821190984e-07, "loss": 2.3155, "step": 9277 }, { "epoch": 0.93, "learning_rate": 2.590929583646218e-07, "loss": 2.384, "step": 9278 }, { "epoch": 0.93, "learning_rate": 2.5835956430789843e-07, "loss": 2.2841, "step": 9279 }, { "epoch": 0.93, "learning_rate": 2.5762719611897245e-07, "loss": 2.3098, "step": 9280 }, { "epoch": 0.93, "learning_rate": 2.5689585387496775e-07, "loss": 2.356, "step": 9281 }, { "epoch": 0.93, "learning_rate": 2.561655376528993e-07, "loss": 2.2755, "step": 9282 }, { "epoch": 0.93, "learning_rate": 2.5543624752967454e-07, "loss": 2.2992, "step": 9283 }, { "epoch": 0.93, "learning_rate": 2.5470798358209425e-07, "loss": 2.2832, "step": 9284 }, { "epoch": 0.93, "learning_rate": 2.5398074588684927e-07, "loss": 2.2283, "step": 9285 }, { "epoch": 0.93, "learning_rate": 2.5325453452052393e-07, "loss": 2.2094, "step": 9286 }, { "epoch": 0.93, "learning_rate": 2.5252934955959377e-07, "loss": 2.2873, "step": 9287 }, { "epoch": 0.93, "learning_rate": 2.5180519108042424e-07, "loss": 2.3457, "step": 9288 }, { "epoch": 0.93, "learning_rate": 2.5108205915927777e-07, "loss": 2.3188, "step": 9289 }, { "epoch": 0.93, "learning_rate": 2.503599538723034e-07, "loss": 2.3533, "step": 9290 }, { "epoch": 0.93, "learning_rate": 2.496388752955448e-07, "loss": 2.2434, "step": 9291 }, { "epoch": 0.93, "learning_rate": 2.489188235049378e-07, "loss": 2.3039, "step": 9292 }, { "epoch": 0.93, "learning_rate": 2.4819979857630737e-07, "loss": 2.2763, "step": 9293 }, { "epoch": 0.93, "learning_rate": 2.474818005853741e-07, "loss": 2.3008, "step": 9294 }, { "epoch": 0.93, "learning_rate": 2.4676482960774737e-07, "loss": 2.2428, "step": 9295 }, { "epoch": 0.93, "learning_rate": 2.4604888571893027e-07, "loss": 2.271, "step": 9296 }, { "epoch": 0.93, "learning_rate": 2.453339689943168e-07, "loss": 2.3109, "step": 9297 }, { "epoch": 0.93, "learning_rate": 2.4462007950919354e-07, "loss": 2.2748, "step": 9298 }, { "epoch": 0.93, "learning_rate": 2.4390721733873693e-07, "loss": 2.2828, "step": 9299 }, { "epoch": 0.93, "learning_rate": 2.431953825580191e-07, "loss": 2.2762, "step": 9300 }, { "epoch": 0.93, "learning_rate": 2.4248457524199907e-07, "loss": 2.3534, "step": 9301 }, { "epoch": 0.93, "learning_rate": 2.417747954655314e-07, "loss": 2.2561, "step": 9302 }, { "epoch": 0.93, "learning_rate": 2.410660433033607e-07, "loss": 2.3147, "step": 9303 }, { "epoch": 0.93, "learning_rate": 2.4035831883012506e-07, "loss": 2.3017, "step": 9304 }, { "epoch": 0.93, "learning_rate": 2.3965162212035265e-07, "loss": 2.3273, "step": 9305 }, { "epoch": 0.93, "learning_rate": 2.389459532484617e-07, "loss": 2.3345, "step": 9306 }, { "epoch": 0.93, "learning_rate": 2.3824131228876834e-07, "loss": 2.361, "step": 9307 }, { "epoch": 0.93, "learning_rate": 2.3753769931547434e-07, "loss": 2.3624, "step": 9308 }, { "epoch": 0.93, "learning_rate": 2.3683511440267592e-07, "loss": 2.2334, "step": 9309 }, { "epoch": 0.93, "learning_rate": 2.3613355762435952e-07, "loss": 2.3158, "step": 9310 }, { "epoch": 0.93, "learning_rate": 2.3543302905440603e-07, "loss": 2.362, "step": 9311 }, { "epoch": 0.93, "learning_rate": 2.3473352876658528e-07, "loss": 2.2015, "step": 9312 }, { "epoch": 0.93, "learning_rate": 2.3403505683455952e-07, "loss": 2.2997, "step": 9313 }, { "epoch": 0.93, "learning_rate": 2.333376133318843e-07, "loss": 2.3145, "step": 9314 }, { "epoch": 0.93, "learning_rate": 2.326411983320054e-07, "loss": 2.2441, "step": 9315 }, { "epoch": 0.93, "learning_rate": 2.319458119082596e-07, "loss": 2.418, "step": 9316 }, { "epoch": 0.93, "learning_rate": 2.3125145413387728e-07, "loss": 2.2028, "step": 9317 }, { "epoch": 0.93, "learning_rate": 2.3055812508197884e-07, "loss": 2.31, "step": 9318 }, { "epoch": 0.93, "learning_rate": 2.2986582482557697e-07, "loss": 2.1507, "step": 9319 }, { "epoch": 0.93, "learning_rate": 2.2917455343757667e-07, "loss": 2.1963, "step": 9320 }, { "epoch": 0.93, "learning_rate": 2.2848431099077418e-07, "loss": 2.2912, "step": 9321 }, { "epoch": 0.93, "learning_rate": 2.2779509755785578e-07, "loss": 2.2899, "step": 9322 }, { "epoch": 0.93, "learning_rate": 2.2710691321140343e-07, "loss": 2.3099, "step": 9323 }, { "epoch": 0.93, "learning_rate": 2.264197580238836e-07, "loss": 2.1419, "step": 9324 }, { "epoch": 0.93, "learning_rate": 2.2573363206766397e-07, "loss": 2.4012, "step": 9325 }, { "epoch": 0.93, "learning_rate": 2.2504853541499672e-07, "loss": 2.3241, "step": 9326 }, { "epoch": 0.93, "learning_rate": 2.2436446813802636e-07, "loss": 2.3099, "step": 9327 }, { "epoch": 0.93, "learning_rate": 2.2368143030879198e-07, "loss": 2.3173, "step": 9328 }, { "epoch": 0.93, "learning_rate": 2.2299942199922265e-07, "loss": 2.2953, "step": 9329 }, { "epoch": 0.93, "learning_rate": 2.223184432811376e-07, "loss": 2.3493, "step": 9330 }, { "epoch": 0.93, "learning_rate": 2.216384942262495e-07, "loss": 2.2089, "step": 9331 }, { "epoch": 0.93, "learning_rate": 2.2095957490616326e-07, "loss": 2.2349, "step": 9332 }, { "epoch": 0.94, "learning_rate": 2.2028168539237172e-07, "loss": 2.3637, "step": 9333 }, { "epoch": 0.94, "learning_rate": 2.196048257562644e-07, "loss": 2.2723, "step": 9334 }, { "epoch": 0.94, "learning_rate": 2.1892899606911876e-07, "loss": 2.2545, "step": 9335 }, { "epoch": 0.94, "learning_rate": 2.1825419640210344e-07, "loss": 2.2738, "step": 9336 }, { "epoch": 0.94, "learning_rate": 2.1758042682628154e-07, "loss": 2.3022, "step": 9337 }, { "epoch": 0.94, "learning_rate": 2.1690768741260637e-07, "loss": 2.3395, "step": 9338 }, { "epoch": 0.94, "learning_rate": 2.1623597823192123e-07, "loss": 2.3328, "step": 9339 }, { "epoch": 0.94, "learning_rate": 2.1556529935496285e-07, "loss": 2.2818, "step": 9340 }, { "epoch": 0.94, "learning_rate": 2.1489565085235697e-07, "loss": 2.2575, "step": 9341 }, { "epoch": 0.94, "learning_rate": 2.1422703279462386e-07, "loss": 2.2938, "step": 9342 }, { "epoch": 0.94, "learning_rate": 2.1355944525217498e-07, "loss": 2.3394, "step": 9343 }, { "epoch": 0.94, "learning_rate": 2.1289288829531186e-07, "loss": 2.3672, "step": 9344 }, { "epoch": 0.94, "learning_rate": 2.1222736199422723e-07, "loss": 2.1483, "step": 9345 }, { "epoch": 0.94, "learning_rate": 2.1156286641900615e-07, "loss": 2.3035, "step": 9346 }, { "epoch": 0.94, "learning_rate": 2.1089940163962485e-07, "loss": 2.2777, "step": 9347 }, { "epoch": 0.94, "learning_rate": 2.1023696772595193e-07, "loss": 2.2969, "step": 9348 }, { "epoch": 0.94, "learning_rate": 2.09575564747746e-07, "loss": 2.3507, "step": 9349 }, { "epoch": 0.94, "learning_rate": 2.08915192774658e-07, "loss": 2.2981, "step": 9350 }, { "epoch": 0.94, "learning_rate": 2.082558518762301e-07, "loss": 2.2924, "step": 9351 }, { "epoch": 0.94, "learning_rate": 2.0759754212189565e-07, "loss": 2.2882, "step": 9352 }, { "epoch": 0.94, "learning_rate": 2.0694026358097918e-07, "loss": 2.2806, "step": 9353 }, { "epoch": 0.94, "learning_rate": 2.0628401632269867e-07, "loss": 2.2858, "step": 9354 }, { "epoch": 0.94, "learning_rate": 2.0562880041615995e-07, "loss": 2.2755, "step": 9355 }, { "epoch": 0.94, "learning_rate": 2.049746159303634e-07, "loss": 2.3355, "step": 9356 }, { "epoch": 0.94, "learning_rate": 2.043214629341983e-07, "loss": 2.3177, "step": 9357 }, { "epoch": 0.94, "learning_rate": 2.0366934149644857e-07, "loss": 2.3241, "step": 9358 }, { "epoch": 0.94, "learning_rate": 2.0301825168578591e-07, "loss": 2.3763, "step": 9359 }, { "epoch": 0.94, "learning_rate": 2.0236819357077552e-07, "loss": 2.1685, "step": 9360 }, { "epoch": 0.94, "learning_rate": 2.017191672198726e-07, "loss": 2.3071, "step": 9361 }, { "epoch": 0.94, "learning_rate": 2.0107117270142584e-07, "loss": 2.2693, "step": 9362 }, { "epoch": 0.94, "learning_rate": 2.0042421008367284e-07, "loss": 2.3298, "step": 9363 }, { "epoch": 0.94, "learning_rate": 1.997782794347436e-07, "loss": 2.2663, "step": 9364 }, { "epoch": 0.94, "learning_rate": 1.991333808226603e-07, "loss": 2.3303, "step": 9365 }, { "epoch": 0.94, "learning_rate": 1.9848951431533537e-07, "loss": 2.2597, "step": 9366 }, { "epoch": 0.94, "learning_rate": 1.9784667998057228e-07, "loss": 2.2658, "step": 9367 }, { "epoch": 0.94, "learning_rate": 1.972048778860669e-07, "loss": 2.2517, "step": 9368 }, { "epoch": 0.94, "learning_rate": 1.9656410809940406e-07, "loss": 2.2398, "step": 9369 }, { "epoch": 0.94, "learning_rate": 1.9592437068806426e-07, "loss": 2.2958, "step": 9370 }, { "epoch": 0.94, "learning_rate": 1.9528566571941576e-07, "loss": 2.2593, "step": 9371 }, { "epoch": 0.94, "learning_rate": 1.9464799326071816e-07, "loss": 2.1936, "step": 9372 }, { "epoch": 0.94, "learning_rate": 1.9401135337912325e-07, "loss": 2.2466, "step": 9373 }, { "epoch": 0.94, "learning_rate": 1.933757461416752e-07, "loss": 2.327, "step": 9374 }, { "epoch": 0.94, "learning_rate": 1.9274117161530716e-07, "loss": 2.3031, "step": 9375 }, { "epoch": 0.94, "learning_rate": 1.921076298668445e-07, "loss": 2.3038, "step": 9376 }, { "epoch": 0.94, "learning_rate": 1.9147512096300502e-07, "loss": 2.4003, "step": 9377 }, { "epoch": 0.94, "learning_rate": 1.9084364497039431e-07, "loss": 2.3588, "step": 9378 }, { "epoch": 0.94, "learning_rate": 1.9021320195551584e-07, "loss": 2.2605, "step": 9379 }, { "epoch": 0.94, "learning_rate": 1.8958379198475542e-07, "loss": 2.4395, "step": 9380 }, { "epoch": 0.94, "learning_rate": 1.8895541512439665e-07, "loss": 2.2755, "step": 9381 }, { "epoch": 0.94, "learning_rate": 1.8832807144061215e-07, "loss": 2.2929, "step": 9382 }, { "epoch": 0.94, "learning_rate": 1.877017609994658e-07, "loss": 2.2428, "step": 9383 }, { "epoch": 0.94, "learning_rate": 1.870764838669137e-07, "loss": 2.2185, "step": 9384 }, { "epoch": 0.94, "learning_rate": 1.864522401088009e-07, "loss": 2.2601, "step": 9385 }, { "epoch": 0.94, "learning_rate": 1.858290297908649e-07, "loss": 2.282, "step": 9386 }, { "epoch": 0.94, "learning_rate": 1.852068529787343e-07, "loss": 2.3956, "step": 9387 }, { "epoch": 0.94, "learning_rate": 1.8458570973793112e-07, "loss": 2.2953, "step": 9388 }, { "epoch": 0.94, "learning_rate": 1.8396560013386522e-07, "loss": 2.2704, "step": 9389 }, { "epoch": 0.94, "learning_rate": 1.8334652423183774e-07, "loss": 2.3523, "step": 9390 }, { "epoch": 0.94, "learning_rate": 1.8272848209704318e-07, "loss": 2.2934, "step": 9391 }, { "epoch": 0.94, "learning_rate": 1.8211147379456506e-07, "loss": 2.2614, "step": 9392 }, { "epoch": 0.94, "learning_rate": 1.8149549938938026e-07, "loss": 2.1906, "step": 9393 }, { "epoch": 0.94, "learning_rate": 1.808805589463547e-07, "loss": 2.2373, "step": 9394 }, { "epoch": 0.94, "learning_rate": 1.8026665253024545e-07, "loss": 2.3369, "step": 9395 }, { "epoch": 0.94, "learning_rate": 1.79653780205703e-07, "loss": 2.2555, "step": 9396 }, { "epoch": 0.94, "learning_rate": 1.7904194203726688e-07, "loss": 2.4047, "step": 9397 }, { "epoch": 0.94, "learning_rate": 1.7843113808936774e-07, "loss": 2.2645, "step": 9398 }, { "epoch": 0.94, "learning_rate": 1.7782136842632857e-07, "loss": 2.2867, "step": 9399 }, { "epoch": 0.94, "learning_rate": 1.7721263311236247e-07, "loss": 2.3123, "step": 9400 }, { "epoch": 0.94, "learning_rate": 1.766049322115726e-07, "loss": 2.3298, "step": 9401 }, { "epoch": 0.94, "learning_rate": 1.7599826578795665e-07, "loss": 2.2091, "step": 9402 }, { "epoch": 0.94, "learning_rate": 1.7539263390540017e-07, "loss": 2.177, "step": 9403 }, { "epoch": 0.94, "learning_rate": 1.7478803662767885e-07, "loss": 2.207, "step": 9404 }, { "epoch": 0.94, "learning_rate": 1.7418447401846393e-07, "loss": 2.265, "step": 9405 }, { "epoch": 0.94, "learning_rate": 1.7358194614131462e-07, "loss": 2.2244, "step": 9406 }, { "epoch": 0.94, "learning_rate": 1.7298045305968126e-07, "loss": 2.3073, "step": 9407 }, { "epoch": 0.94, "learning_rate": 1.7237999483690425e-07, "loss": 2.3165, "step": 9408 }, { "epoch": 0.94, "learning_rate": 1.7178057153621863e-07, "loss": 2.3072, "step": 9409 }, { "epoch": 0.94, "learning_rate": 1.711821832207472e-07, "loss": 2.2906, "step": 9410 }, { "epoch": 0.94, "learning_rate": 1.70584829953504e-07, "loss": 2.2548, "step": 9411 }, { "epoch": 0.94, "learning_rate": 1.699885117973954e-07, "loss": 2.3364, "step": 9412 }, { "epoch": 0.94, "learning_rate": 1.693932288152178e-07, "loss": 2.3108, "step": 9413 }, { "epoch": 0.94, "learning_rate": 1.687989810696611e-07, "loss": 2.2062, "step": 9414 }, { "epoch": 0.94, "learning_rate": 1.6820576862330073e-07, "loss": 2.2498, "step": 9415 }, { "epoch": 0.94, "learning_rate": 1.6761359153860901e-07, "loss": 2.3324, "step": 9416 }, { "epoch": 0.94, "learning_rate": 1.6702244987794492e-07, "loss": 2.2101, "step": 9417 }, { "epoch": 0.94, "learning_rate": 1.66432343703562e-07, "loss": 2.2951, "step": 9418 }, { "epoch": 0.94, "learning_rate": 1.658432730776005e-07, "loss": 2.329, "step": 9419 }, { "epoch": 0.94, "learning_rate": 1.6525523806209532e-07, "loss": 2.2379, "step": 9420 }, { "epoch": 0.94, "learning_rate": 1.646682387189713e-07, "loss": 2.3328, "step": 9421 }, { "epoch": 0.94, "learning_rate": 1.640822751100435e-07, "loss": 2.2177, "step": 9422 }, { "epoch": 0.94, "learning_rate": 1.6349734729701693e-07, "loss": 2.1965, "step": 9423 }, { "epoch": 0.94, "learning_rate": 1.6291345534149127e-07, "loss": 2.1308, "step": 9424 }, { "epoch": 0.94, "learning_rate": 1.62330599304954e-07, "loss": 2.3517, "step": 9425 }, { "epoch": 0.94, "learning_rate": 1.6174877924878262e-07, "loss": 2.1715, "step": 9426 }, { "epoch": 0.94, "learning_rate": 1.611679952342482e-07, "loss": 2.2807, "step": 9427 }, { "epoch": 0.94, "learning_rate": 1.6058824732251288e-07, "loss": 2.2631, "step": 9428 }, { "epoch": 0.94, "learning_rate": 1.6000953557462672e-07, "loss": 2.3309, "step": 9429 }, { "epoch": 0.94, "learning_rate": 1.594318600515332e-07, "loss": 2.2502, "step": 9430 }, { "epoch": 0.94, "learning_rate": 1.588552208140648e-07, "loss": 2.2903, "step": 9431 }, { "epoch": 0.94, "learning_rate": 1.5827961792294732e-07, "loss": 2.1886, "step": 9432 }, { "epoch": 0.95, "learning_rate": 1.5770505143879567e-07, "loss": 2.3079, "step": 9433 }, { "epoch": 0.95, "learning_rate": 1.5713152142211695e-07, "loss": 2.2665, "step": 9434 }, { "epoch": 0.95, "learning_rate": 1.5655902793330623e-07, "loss": 2.38, "step": 9435 }, { "epoch": 0.95, "learning_rate": 1.5598757103265194e-07, "loss": 2.3237, "step": 9436 }, { "epoch": 0.95, "learning_rate": 1.554171507803337e-07, "loss": 2.3684, "step": 9437 }, { "epoch": 0.95, "learning_rate": 1.5484776723642126e-07, "loss": 2.306, "step": 9438 }, { "epoch": 0.95, "learning_rate": 1.542794204608733e-07, "loss": 2.379, "step": 9439 }, { "epoch": 0.95, "learning_rate": 1.5371211051354085e-07, "loss": 2.2555, "step": 9440 }, { "epoch": 0.95, "learning_rate": 1.5314583745416832e-07, "loss": 2.2196, "step": 9441 }, { "epoch": 0.95, "learning_rate": 1.5258060134238696e-07, "loss": 2.2887, "step": 9442 }, { "epoch": 0.95, "learning_rate": 1.5201640223772128e-07, "loss": 2.2778, "step": 9443 }, { "epoch": 0.95, "learning_rate": 1.5145324019958386e-07, "loss": 2.3008, "step": 9444 }, { "epoch": 0.95, "learning_rate": 1.5089111528728162e-07, "loss": 2.2692, "step": 9445 }, { "epoch": 0.95, "learning_rate": 1.5033002756000947e-07, "loss": 2.3051, "step": 9446 }, { "epoch": 0.95, "learning_rate": 1.4976997707685569e-07, "loss": 2.3429, "step": 9447 }, { "epoch": 0.95, "learning_rate": 1.4921096389679534e-07, "loss": 2.2831, "step": 9448 }, { "epoch": 0.95, "learning_rate": 1.48652988078698e-07, "loss": 2.2885, "step": 9449 }, { "epoch": 0.95, "learning_rate": 1.4809604968132328e-07, "loss": 2.3126, "step": 9450 }, { "epoch": 0.95, "learning_rate": 1.475401487633199e-07, "loss": 2.1354, "step": 9451 }, { "epoch": 0.95, "learning_rate": 1.4698528538322986e-07, "loss": 2.1886, "step": 9452 }, { "epoch": 0.95, "learning_rate": 1.4643145959948312e-07, "loss": 2.3753, "step": 9453 }, { "epoch": 0.95, "learning_rate": 1.4587867147040192e-07, "loss": 2.3331, "step": 9454 }, { "epoch": 0.95, "learning_rate": 1.4532692105419853e-07, "loss": 2.2739, "step": 9455 }, { "epoch": 0.95, "learning_rate": 1.4477620840897767e-07, "loss": 2.2013, "step": 9456 }, { "epoch": 0.95, "learning_rate": 1.4422653359273397e-07, "loss": 2.3424, "step": 9457 }, { "epoch": 0.95, "learning_rate": 1.4367789666334897e-07, "loss": 2.3148, "step": 9458 }, { "epoch": 0.95, "learning_rate": 1.4313029767860198e-07, "loss": 2.3072, "step": 9459 }, { "epoch": 0.95, "learning_rate": 1.425837366961569e-07, "loss": 2.338, "step": 9460 }, { "epoch": 0.95, "learning_rate": 1.420382137735732e-07, "loss": 2.2301, "step": 9461 }, { "epoch": 0.95, "learning_rate": 1.4149372896829495e-07, "loss": 2.3377, "step": 9462 }, { "epoch": 0.95, "learning_rate": 1.4095028233766406e-07, "loss": 2.3022, "step": 9463 }, { "epoch": 0.95, "learning_rate": 1.4040787393890697e-07, "loss": 2.3313, "step": 9464 }, { "epoch": 0.95, "learning_rate": 1.3986650382914468e-07, "loss": 2.3686, "step": 9465 }, { "epoch": 0.95, "learning_rate": 1.3932617206538825e-07, "loss": 2.2817, "step": 9466 }, { "epoch": 0.95, "learning_rate": 1.3878687870453656e-07, "loss": 2.2724, "step": 9467 }, { "epoch": 0.95, "learning_rate": 1.38248623803382e-07, "loss": 2.1473, "step": 9468 }, { "epoch": 0.95, "learning_rate": 1.37711407418607e-07, "loss": 2.2979, "step": 9469 }, { "epoch": 0.95, "learning_rate": 1.371752296067852e-07, "loss": 2.2904, "step": 9470 }, { "epoch": 0.95, "learning_rate": 1.366400904243792e-07, "loss": 2.3229, "step": 9471 }, { "epoch": 0.95, "learning_rate": 1.3610598992774394e-07, "loss": 2.3142, "step": 9472 }, { "epoch": 0.95, "learning_rate": 1.3557292817312329e-07, "loss": 2.2576, "step": 9473 }, { "epoch": 0.95, "learning_rate": 1.3504090521665348e-07, "loss": 2.3586, "step": 9474 }, { "epoch": 0.95, "learning_rate": 1.3450992111435967e-07, "loss": 2.3853, "step": 9475 }, { "epoch": 0.95, "learning_rate": 1.3397997592215829e-07, "loss": 2.1789, "step": 9476 }, { "epoch": 0.95, "learning_rate": 1.334510696958591e-07, "loss": 2.3183, "step": 9477 }, { "epoch": 0.95, "learning_rate": 1.3292320249115642e-07, "loss": 2.2941, "step": 9478 }, { "epoch": 0.95, "learning_rate": 1.3239637436364138e-07, "loss": 2.3317, "step": 9479 }, { "epoch": 0.95, "learning_rate": 1.3187058536879183e-07, "loss": 2.3274, "step": 9480 }, { "epoch": 0.95, "learning_rate": 1.3134583556197677e-07, "loss": 2.2802, "step": 9481 }, { "epoch": 0.95, "learning_rate": 1.3082212499845648e-07, "loss": 2.3789, "step": 9482 }, { "epoch": 0.95, "learning_rate": 1.3029945373338238e-07, "loss": 2.3604, "step": 9483 }, { "epoch": 0.95, "learning_rate": 1.2977782182179488e-07, "loss": 2.3457, "step": 9484 }, { "epoch": 0.95, "learning_rate": 1.2925722931862562e-07, "loss": 2.3139, "step": 9485 }, { "epoch": 0.95, "learning_rate": 1.287376762786985e-07, "loss": 2.3869, "step": 9486 }, { "epoch": 0.95, "learning_rate": 1.282191627567242e-07, "loss": 2.2795, "step": 9487 }, { "epoch": 0.95, "learning_rate": 1.2770168880730683e-07, "loss": 2.3411, "step": 9488 }, { "epoch": 0.95, "learning_rate": 1.2718525448494167e-07, "loss": 2.3056, "step": 9489 }, { "epoch": 0.95, "learning_rate": 1.266698598440108e-07, "loss": 2.284, "step": 9490 }, { "epoch": 0.95, "learning_rate": 1.2615550493879082e-07, "loss": 2.2178, "step": 9491 }, { "epoch": 0.95, "learning_rate": 1.256421898234461e-07, "loss": 2.2904, "step": 9492 }, { "epoch": 0.95, "learning_rate": 1.251299145520335e-07, "loss": 2.2998, "step": 9493 }, { "epoch": 0.95, "learning_rate": 1.2461867917849868e-07, "loss": 2.3115, "step": 9494 }, { "epoch": 0.95, "learning_rate": 1.2410848375667972e-07, "loss": 2.2444, "step": 9495 }, { "epoch": 0.95, "learning_rate": 1.2359932834030252e-07, "loss": 2.3749, "step": 9496 }, { "epoch": 0.95, "learning_rate": 1.2309121298298642e-07, "loss": 2.2693, "step": 9497 }, { "epoch": 0.95, "learning_rate": 1.2258413773823863e-07, "loss": 2.3128, "step": 9498 }, { "epoch": 0.95, "learning_rate": 1.2207810265945863e-07, "loss": 2.2037, "step": 9499 }, { "epoch": 0.95, "learning_rate": 1.2157310779993491e-07, "loss": 2.2497, "step": 9500 }, { "epoch": 0.95, "learning_rate": 1.210691532128483e-07, "loss": 2.4481, "step": 9501 }, { "epoch": 0.95, "learning_rate": 1.205662389512674e-07, "loss": 2.2756, "step": 9502 }, { "epoch": 0.95, "learning_rate": 1.2006436506815432e-07, "loss": 2.2807, "step": 9503 }, { "epoch": 0.95, "learning_rate": 1.1956353161636014e-07, "loss": 2.2722, "step": 9504 }, { "epoch": 0.95, "learning_rate": 1.1906373864862598e-07, "loss": 2.3216, "step": 9505 }, { "epoch": 0.95, "learning_rate": 1.1856498621758416e-07, "loss": 2.2778, "step": 9506 }, { "epoch": 0.95, "learning_rate": 1.1806727437575715e-07, "loss": 2.2534, "step": 9507 }, { "epoch": 0.95, "learning_rate": 1.1757060317555636e-07, "loss": 2.2657, "step": 9508 }, { "epoch": 0.95, "learning_rate": 1.1707497266928546e-07, "loss": 2.3162, "step": 9509 }, { "epoch": 0.95, "learning_rate": 1.1658038290913943e-07, "loss": 2.255, "step": 9510 }, { "epoch": 0.95, "learning_rate": 1.1608683394720099e-07, "loss": 2.2629, "step": 9511 }, { "epoch": 0.95, "learning_rate": 1.1559432583544417e-07, "loss": 2.208, "step": 9512 }, { "epoch": 0.95, "learning_rate": 1.1510285862573522e-07, "loss": 2.2855, "step": 9513 }, { "epoch": 0.95, "learning_rate": 1.1461243236982834e-07, "loss": 2.2748, "step": 9514 }, { "epoch": 0.95, "learning_rate": 1.1412304711936995e-07, "loss": 2.2178, "step": 9515 }, { "epoch": 0.95, "learning_rate": 1.136347029258944e-07, "loss": 2.2858, "step": 9516 }, { "epoch": 0.95, "learning_rate": 1.1314739984082946e-07, "loss": 2.2998, "step": 9517 }, { "epoch": 0.95, "learning_rate": 1.1266113791549183e-07, "loss": 2.217, "step": 9518 }, { "epoch": 0.95, "learning_rate": 1.1217591720108834e-07, "loss": 2.3118, "step": 9519 }, { "epoch": 0.95, "learning_rate": 1.1169173774871478e-07, "loss": 2.3071, "step": 9520 }, { "epoch": 0.95, "learning_rate": 1.1120859960936037e-07, "loss": 2.1738, "step": 9521 }, { "epoch": 0.95, "learning_rate": 1.1072650283390329e-07, "loss": 2.2746, "step": 9522 }, { "epoch": 0.95, "learning_rate": 1.1024544747311183e-07, "loss": 2.2793, "step": 9523 }, { "epoch": 0.95, "learning_rate": 1.0976543357764435e-07, "loss": 2.2453, "step": 9524 }, { "epoch": 0.95, "learning_rate": 1.0928646119805042e-07, "loss": 2.2883, "step": 9525 }, { "epoch": 0.95, "learning_rate": 1.0880853038476858e-07, "loss": 2.2606, "step": 9526 }, { "epoch": 0.95, "learning_rate": 1.0833164118812967e-07, "loss": 2.2734, "step": 9527 }, { "epoch": 0.95, "learning_rate": 1.0785579365835241e-07, "loss": 2.2106, "step": 9528 }, { "epoch": 0.95, "learning_rate": 1.0738098784554895e-07, "loss": 2.2956, "step": 9529 }, { "epoch": 0.95, "learning_rate": 1.0690722379971707e-07, "loss": 2.2196, "step": 9530 }, { "epoch": 0.95, "learning_rate": 1.0643450157075019e-07, "loss": 2.2695, "step": 9531 }, { "epoch": 0.96, "learning_rate": 1.059628212084296e-07, "loss": 2.3028, "step": 9532 }, { "epoch": 0.96, "learning_rate": 1.0549218276242446e-07, "loss": 2.2528, "step": 9533 }, { "epoch": 0.96, "learning_rate": 1.0502258628229845e-07, "loss": 2.247, "step": 9534 }, { "epoch": 0.96, "learning_rate": 1.0455403181750312e-07, "loss": 2.4068, "step": 9535 }, { "epoch": 0.96, "learning_rate": 1.0408651941738013e-07, "loss": 2.2293, "step": 9536 }, { "epoch": 0.96, "learning_rate": 1.0362004913116341e-07, "loss": 2.3425, "step": 9537 }, { "epoch": 0.96, "learning_rate": 1.0315462100797369e-07, "loss": 2.219, "step": 9538 }, { "epoch": 0.96, "learning_rate": 1.0269023509682618e-07, "loss": 2.2433, "step": 9539 }, { "epoch": 0.96, "learning_rate": 1.022268914466229e-07, "loss": 2.2696, "step": 9540 }, { "epoch": 0.96, "learning_rate": 1.0176459010615924e-07, "loss": 2.1777, "step": 9541 }, { "epoch": 0.96, "learning_rate": 1.0130333112411628e-07, "loss": 2.3013, "step": 9542 }, { "epoch": 0.96, "learning_rate": 1.0084311454906959e-07, "loss": 2.4128, "step": 9543 }, { "epoch": 0.96, "learning_rate": 1.0038394042948374e-07, "loss": 2.3616, "step": 9544 }, { "epoch": 0.96, "learning_rate": 9.992580881371228e-08, "loss": 2.3471, "step": 9545 }, { "epoch": 0.96, "learning_rate": 9.946871975000105e-08, "loss": 2.3448, "step": 9546 }, { "epoch": 0.96, "learning_rate": 9.901267328648378e-08, "loss": 2.291, "step": 9547 }, { "epoch": 0.96, "learning_rate": 9.855766947118539e-08, "loss": 2.2342, "step": 9548 }, { "epoch": 0.96, "learning_rate": 9.810370835202199e-08, "loss": 2.3104, "step": 9549 }, { "epoch": 0.96, "learning_rate": 9.765078997679978e-08, "loss": 2.3156, "step": 9550 }, { "epoch": 0.96, "learning_rate": 9.719891439321283e-08, "loss": 2.2293, "step": 9551 }, { "epoch": 0.96, "learning_rate": 9.674808164884864e-08, "loss": 2.3383, "step": 9552 }, { "epoch": 0.96, "learning_rate": 9.629829179118144e-08, "loss": 2.292, "step": 9553 }, { "epoch": 0.96, "learning_rate": 9.584954486758002e-08, "loss": 2.333, "step": 9554 }, { "epoch": 0.96, "learning_rate": 9.540184092529769e-08, "loss": 2.2834, "step": 9555 }, { "epoch": 0.96, "learning_rate": 9.495518001148341e-08, "loss": 2.2026, "step": 9556 }, { "epoch": 0.96, "learning_rate": 9.450956217317176e-08, "loss": 2.3424, "step": 9557 }, { "epoch": 0.96, "learning_rate": 9.406498745729298e-08, "loss": 2.2839, "step": 9558 }, { "epoch": 0.96, "learning_rate": 9.362145591066074e-08, "loss": 2.2911, "step": 9559 }, { "epoch": 0.96, "learning_rate": 9.317896757998435e-08, "loss": 2.3043, "step": 9560 }, { "epoch": 0.96, "learning_rate": 9.273752251186097e-08, "loss": 2.1747, "step": 9561 }, { "epoch": 0.96, "learning_rate": 9.229712075277674e-08, "loss": 2.2866, "step": 9562 }, { "epoch": 0.96, "learning_rate": 9.185776234911015e-08, "loss": 2.2615, "step": 9563 }, { "epoch": 0.96, "learning_rate": 9.14194473471286e-08, "loss": 2.2724, "step": 9564 }, { "epoch": 0.96, "learning_rate": 9.098217579298962e-08, "loss": 2.3876, "step": 9565 }, { "epoch": 0.96, "learning_rate": 9.054594773274306e-08, "loss": 2.342, "step": 9566 }, { "epoch": 0.96, "learning_rate": 9.011076321232548e-08, "loss": 2.2289, "step": 9567 }, { "epoch": 0.96, "learning_rate": 8.96766222775658e-08, "loss": 2.2948, "step": 9568 }, { "epoch": 0.96, "learning_rate": 8.924352497418077e-08, "loss": 2.2096, "step": 9569 }, { "epoch": 0.96, "learning_rate": 8.881147134778056e-08, "loss": 2.3293, "step": 9570 }, { "epoch": 0.96, "learning_rate": 8.838046144386326e-08, "loss": 2.3303, "step": 9571 }, { "epoch": 0.96, "learning_rate": 8.795049530781696e-08, "loss": 2.4159, "step": 9572 }, { "epoch": 0.96, "learning_rate": 8.752157298491992e-08, "loss": 2.315, "step": 9573 }, { "epoch": 0.96, "learning_rate": 8.709369452034044e-08, "loss": 2.3009, "step": 9574 }, { "epoch": 0.96, "learning_rate": 8.666685995914026e-08, "loss": 2.3642, "step": 9575 }, { "epoch": 0.96, "learning_rate": 8.624106934626564e-08, "loss": 2.2917, "step": 9576 }, { "epoch": 0.96, "learning_rate": 8.581632272655627e-08, "loss": 2.2879, "step": 9577 }, { "epoch": 0.96, "learning_rate": 8.539262014474082e-08, "loss": 2.3169, "step": 9578 }, { "epoch": 0.96, "learning_rate": 8.496996164543914e-08, "loss": 2.1934, "step": 9579 }, { "epoch": 0.96, "learning_rate": 8.454834727315897e-08, "loss": 2.3862, "step": 9580 }, { "epoch": 0.96, "learning_rate": 8.412777707230146e-08, "loss": 2.2965, "step": 9581 }, { "epoch": 0.96, "learning_rate": 8.370825108715341e-08, "loss": 2.4146, "step": 9582 }, { "epoch": 0.96, "learning_rate": 8.328976936189615e-08, "loss": 2.3409, "step": 9583 }, { "epoch": 0.96, "learning_rate": 8.287233194059774e-08, "loss": 2.3732, "step": 9584 }, { "epoch": 0.96, "learning_rate": 8.245593886721858e-08, "loss": 2.273, "step": 9585 }, { "epoch": 0.96, "learning_rate": 8.204059018560584e-08, "loss": 2.235, "step": 9586 }, { "epoch": 0.96, "learning_rate": 8.162628593950228e-08, "loss": 2.296, "step": 9587 }, { "epoch": 0.96, "learning_rate": 8.121302617253413e-08, "loss": 2.2916, "step": 9588 }, { "epoch": 0.96, "learning_rate": 8.080081092822101e-08, "loss": 2.221, "step": 9589 }, { "epoch": 0.96, "learning_rate": 8.038964024997375e-08, "loss": 2.2833, "step": 9590 }, { "epoch": 0.96, "learning_rate": 7.997951418109218e-08, "loss": 2.3498, "step": 9591 }, { "epoch": 0.96, "learning_rate": 7.957043276476284e-08, "loss": 2.3384, "step": 9592 }, { "epoch": 0.96, "learning_rate": 7.916239604406795e-08, "loss": 2.2546, "step": 9593 }, { "epoch": 0.96, "learning_rate": 7.875540406197535e-08, "loss": 2.2111, "step": 9594 }, { "epoch": 0.96, "learning_rate": 7.83494568613441e-08, "loss": 2.2207, "step": 9595 }, { "epoch": 0.96, "learning_rate": 7.794455448492444e-08, "loss": 2.3437, "step": 9596 }, { "epoch": 0.96, "learning_rate": 7.75406969753556e-08, "loss": 2.331, "step": 9597 }, { "epoch": 0.96, "learning_rate": 7.713788437516578e-08, "loss": 2.3642, "step": 9598 }, { "epoch": 0.96, "learning_rate": 7.67361167267755e-08, "loss": 2.331, "step": 9599 }, { "epoch": 0.96, "learning_rate": 7.633539407249202e-08, "loss": 2.2848, "step": 9600 }, { "epoch": 0.96, "learning_rate": 7.593571645451603e-08, "loss": 2.3601, "step": 9601 }, { "epoch": 0.96, "learning_rate": 7.553708391493719e-08, "loss": 2.3055, "step": 9602 }, { "epoch": 0.96, "learning_rate": 7.513949649573304e-08, "loss": 2.3363, "step": 9603 }, { "epoch": 0.96, "learning_rate": 7.474295423877232e-08, "loss": 2.3106, "step": 9604 }, { "epoch": 0.96, "learning_rate": 7.434745718581493e-08, "loss": 2.1902, "step": 9605 }, { "epoch": 0.96, "learning_rate": 7.395300537850981e-08, "loss": 2.292, "step": 9606 }, { "epoch": 0.96, "learning_rate": 7.355959885839481e-08, "loss": 2.251, "step": 9607 }, { "epoch": 0.96, "learning_rate": 7.316723766689904e-08, "loss": 2.2855, "step": 9608 }, { "epoch": 0.96, "learning_rate": 7.277592184534054e-08, "loss": 2.3564, "step": 9609 }, { "epoch": 0.96, "learning_rate": 7.238565143492859e-08, "loss": 2.2844, "step": 9610 }, { "epoch": 0.96, "learning_rate": 7.199642647676142e-08, "loss": 2.1861, "step": 9611 }, { "epoch": 0.96, "learning_rate": 7.160824701182733e-08, "loss": 2.267, "step": 9612 }, { "epoch": 0.96, "learning_rate": 7.122111308100365e-08, "loss": 2.2748, "step": 9613 }, { "epoch": 0.96, "learning_rate": 7.083502472505998e-08, "loss": 2.2741, "step": 9614 }, { "epoch": 0.96, "learning_rate": 7.044998198465269e-08, "loss": 2.198, "step": 9615 }, { "epoch": 0.96, "learning_rate": 7.006598490033156e-08, "loss": 2.3715, "step": 9616 }, { "epoch": 0.96, "learning_rate": 6.968303351253203e-08, "loss": 2.3912, "step": 9617 }, { "epoch": 0.96, "learning_rate": 6.930112786158405e-08, "loss": 2.2664, "step": 9618 }, { "epoch": 0.96, "learning_rate": 6.892026798770324e-08, "loss": 2.2278, "step": 9619 }, { "epoch": 0.96, "learning_rate": 6.854045393099861e-08, "loss": 2.1881, "step": 9620 }, { "epoch": 0.96, "learning_rate": 6.816168573146709e-08, "loss": 2.3431, "step": 9621 }, { "epoch": 0.96, "learning_rate": 6.778396342899563e-08, "loss": 2.2314, "step": 9622 }, { "epoch": 0.96, "learning_rate": 6.74072870633602e-08, "loss": 2.2892, "step": 9623 }, { "epoch": 0.96, "learning_rate": 6.703165667422906e-08, "loss": 2.333, "step": 9624 }, { "epoch": 0.96, "learning_rate": 6.665707230115836e-08, "loss": 2.3283, "step": 9625 }, { "epoch": 0.96, "learning_rate": 6.628353398359433e-08, "loss": 2.2957, "step": 9626 }, { "epoch": 0.96, "learning_rate": 6.591104176087326e-08, "loss": 2.1723, "step": 9627 }, { "epoch": 0.96, "learning_rate": 6.553959567222156e-08, "loss": 2.2204, "step": 9628 }, { "epoch": 0.96, "learning_rate": 6.516919575675574e-08, "loss": 2.3142, "step": 9629 }, { "epoch": 0.96, "learning_rate": 6.479984205348233e-08, "loss": 2.2771, "step": 9630 }, { "epoch": 0.96, "learning_rate": 6.44315346012958e-08, "loss": 2.2965, "step": 9631 }, { "epoch": 0.97, "learning_rate": 6.406427343898181e-08, "loss": 2.3314, "step": 9632 }, { "epoch": 0.97, "learning_rate": 6.369805860521606e-08, "loss": 2.3027, "step": 9633 }, { "epoch": 0.97, "learning_rate": 6.333289013856436e-08, "loss": 2.279, "step": 9634 }, { "epoch": 0.97, "learning_rate": 6.296876807747931e-08, "loss": 2.3913, "step": 9635 }, { "epoch": 0.97, "learning_rate": 6.260569246030912e-08, "loss": 2.1947, "step": 9636 }, { "epoch": 0.97, "learning_rate": 6.224366332528431e-08, "loss": 2.3016, "step": 9637 }, { "epoch": 0.97, "learning_rate": 6.188268071053327e-08, "loss": 2.22, "step": 9638 }, { "epoch": 0.97, "learning_rate": 6.152274465406783e-08, "loss": 2.3206, "step": 9639 }, { "epoch": 0.97, "learning_rate": 6.116385519379319e-08, "loss": 2.2999, "step": 9640 }, { "epoch": 0.97, "learning_rate": 6.080601236750139e-08, "loss": 2.3424, "step": 9641 }, { "epoch": 0.97, "learning_rate": 6.04492162128778e-08, "loss": 2.2494, "step": 9642 }, { "epoch": 0.97, "learning_rate": 6.009346676749461e-08, "loss": 2.3286, "step": 9643 }, { "epoch": 0.97, "learning_rate": 5.973876406881629e-08, "loss": 2.295, "step": 9644 }, { "epoch": 0.97, "learning_rate": 5.938510815419296e-08, "loss": 2.2682, "step": 9645 }, { "epoch": 0.97, "learning_rate": 5.903249906087039e-08, "loss": 2.3066, "step": 9646 }, { "epoch": 0.97, "learning_rate": 5.8680936825978865e-08, "loss": 2.3013, "step": 9647 }, { "epoch": 0.97, "learning_rate": 5.8330421486541e-08, "loss": 2.1979, "step": 9648 }, { "epoch": 0.97, "learning_rate": 5.7980953079469494e-08, "loss": 2.2094, "step": 9649 }, { "epoch": 0.97, "learning_rate": 5.7632531641564906e-08, "loss": 2.2466, "step": 9650 }, { "epoch": 0.97, "learning_rate": 5.728515720951899e-08, "loss": 2.2656, "step": 9651 }, { "epoch": 0.97, "learning_rate": 5.693882981991361e-08, "loss": 2.2618, "step": 9652 }, { "epoch": 0.97, "learning_rate": 5.659354950921847e-08, "loss": 2.3963, "step": 9653 }, { "epoch": 0.97, "learning_rate": 5.62493163137956e-08, "loss": 2.255, "step": 9654 }, { "epoch": 0.97, "learning_rate": 5.5906130269893774e-08, "loss": 2.212, "step": 9655 }, { "epoch": 0.97, "learning_rate": 5.556399141365299e-08, "loss": 2.3302, "step": 9656 }, { "epoch": 0.97, "learning_rate": 5.52228997811044e-08, "loss": 2.2538, "step": 9657 }, { "epoch": 0.97, "learning_rate": 5.488285540816707e-08, "loss": 2.2734, "step": 9658 }, { "epoch": 0.97, "learning_rate": 5.454385833065012e-08, "loss": 2.3611, "step": 9659 }, { "epoch": 0.97, "learning_rate": 5.420590858425279e-08, "loss": 2.294, "step": 9660 }, { "epoch": 0.97, "learning_rate": 5.3869006204563254e-08, "loss": 2.3249, "step": 9661 }, { "epoch": 0.97, "learning_rate": 5.353315122705871e-08, "loss": 2.3149, "step": 9662 }, { "epoch": 0.97, "learning_rate": 5.319834368710974e-08, "loss": 2.2369, "step": 9663 }, { "epoch": 0.97, "learning_rate": 5.2864583619971485e-08, "loss": 2.3036, "step": 9664 }, { "epoch": 0.97, "learning_rate": 5.2531871060793605e-08, "loss": 2.332, "step": 9665 }, { "epoch": 0.97, "learning_rate": 5.2200206044612514e-08, "loss": 2.2284, "step": 9666 }, { "epoch": 0.97, "learning_rate": 5.186958860635472e-08, "loss": 2.2557, "step": 9667 }, { "epoch": 0.97, "learning_rate": 5.154001878083681e-08, "loss": 2.2499, "step": 9668 }, { "epoch": 0.97, "learning_rate": 5.121149660276437e-08, "loss": 2.2397, "step": 9669 }, { "epoch": 0.97, "learning_rate": 5.088402210673415e-08, "loss": 2.332, "step": 9670 }, { "epoch": 0.97, "learning_rate": 5.0557595327231924e-08, "loss": 2.1773, "step": 9671 }, { "epoch": 0.97, "learning_rate": 5.0232216298631285e-08, "loss": 2.2803, "step": 9672 }, { "epoch": 0.97, "learning_rate": 4.990788505519928e-08, "loss": 2.3296, "step": 9673 }, { "epoch": 0.97, "learning_rate": 4.958460163108858e-08, "loss": 2.2859, "step": 9674 }, { "epoch": 0.97, "learning_rate": 4.926236606034418e-08, "loss": 2.2279, "step": 9675 }, { "epoch": 0.97, "learning_rate": 4.894117837690005e-08, "loss": 2.2067, "step": 9676 }, { "epoch": 0.97, "learning_rate": 4.8621038614579116e-08, "loss": 2.2737, "step": 9677 }, { "epoch": 0.97, "learning_rate": 4.830194680709444e-08, "loss": 2.1988, "step": 9678 }, { "epoch": 0.97, "learning_rate": 4.7983902988050225e-08, "loss": 2.2353, "step": 9679 }, { "epoch": 0.97, "learning_rate": 4.766690719093636e-08, "loss": 2.3025, "step": 9680 }, { "epoch": 0.97, "learning_rate": 4.7350959449137257e-08, "loss": 2.3612, "step": 9681 }, { "epoch": 0.97, "learning_rate": 4.703605979592296e-08, "loss": 2.3049, "step": 9682 }, { "epoch": 0.97, "learning_rate": 4.6722208264455836e-08, "loss": 2.2906, "step": 9683 }, { "epoch": 0.97, "learning_rate": 4.6409404887786116e-08, "loss": 2.3537, "step": 9684 }, { "epoch": 0.97, "learning_rate": 4.6097649698854106e-08, "loss": 2.3132, "step": 9685 }, { "epoch": 0.97, "learning_rate": 4.578694273049134e-08, "loss": 2.2988, "step": 9686 }, { "epoch": 0.97, "learning_rate": 4.547728401541607e-08, "loss": 2.2902, "step": 9687 }, { "epoch": 0.97, "learning_rate": 4.5168673586238885e-08, "loss": 2.3234, "step": 9688 }, { "epoch": 0.97, "learning_rate": 4.486111147545713e-08, "loss": 2.2831, "step": 9689 }, { "epoch": 0.97, "learning_rate": 4.455459771546156e-08, "loss": 2.355, "step": 9690 }, { "epoch": 0.97, "learning_rate": 4.4249132338528566e-08, "loss": 2.364, "step": 9691 }, { "epoch": 0.97, "learning_rate": 4.394471537682687e-08, "loss": 2.3528, "step": 9692 }, { "epoch": 0.97, "learning_rate": 4.364134686241417e-08, "loss": 2.2371, "step": 9693 }, { "epoch": 0.97, "learning_rate": 4.3339026827237116e-08, "loss": 2.3323, "step": 9694 }, { "epoch": 0.97, "learning_rate": 4.303775530313137e-08, "loss": 2.2854, "step": 9695 }, { "epoch": 0.97, "learning_rate": 4.273753232182376e-08, "loss": 2.3009, "step": 9696 }, { "epoch": 0.97, "learning_rate": 4.243835791493012e-08, "loss": 2.3528, "step": 9697 }, { "epoch": 0.97, "learning_rate": 4.2140232113956345e-08, "loss": 2.2472, "step": 9698 }, { "epoch": 0.97, "learning_rate": 4.1843154950296225e-08, "loss": 2.2299, "step": 9699 }, { "epoch": 0.97, "learning_rate": 4.154712645523473e-08, "loss": 2.3764, "step": 9700 }, { "epoch": 0.97, "learning_rate": 4.1252146659945814e-08, "loss": 2.3956, "step": 9701 }, { "epoch": 0.97, "learning_rate": 4.09582155954924e-08, "loss": 2.2127, "step": 9702 }, { "epoch": 0.97, "learning_rate": 4.0665333292829736e-08, "loss": 2.3948, "step": 9703 }, { "epoch": 0.97, "learning_rate": 4.0373499782797585e-08, "loss": 2.3018, "step": 9704 }, { "epoch": 0.97, "learning_rate": 4.0082715096130266e-08, "loss": 2.3689, "step": 9705 }, { "epoch": 0.97, "learning_rate": 3.979297926344994e-08, "loss": 2.2687, "step": 9706 }, { "epoch": 0.97, "learning_rate": 3.950429231526554e-08, "loss": 2.2341, "step": 9707 }, { "epoch": 0.97, "learning_rate": 3.921665428198051e-08, "loss": 2.334, "step": 9708 }, { "epoch": 0.97, "learning_rate": 3.893006519388287e-08, "loss": 2.2466, "step": 9709 }, { "epoch": 0.97, "learning_rate": 3.8644525081155124e-08, "loss": 2.2552, "step": 9710 }, { "epoch": 0.97, "learning_rate": 3.836003397386545e-08, "loss": 2.2885, "step": 9711 }, { "epoch": 0.97, "learning_rate": 3.8076591901973214e-08, "loss": 2.3502, "step": 9712 }, { "epoch": 0.97, "learning_rate": 3.779419889532676e-08, "loss": 2.3133, "step": 9713 }, { "epoch": 0.97, "learning_rate": 3.751285498366453e-08, "loss": 2.3211, "step": 9714 }, { "epoch": 0.97, "learning_rate": 3.723256019661392e-08, "loss": 2.3327, "step": 9715 }, { "epoch": 0.97, "learning_rate": 3.6953314563692447e-08, "loss": 2.2636, "step": 9716 }, { "epoch": 0.97, "learning_rate": 3.667511811430546e-08, "loss": 2.2503, "step": 9717 }, { "epoch": 0.97, "learning_rate": 3.639797087775065e-08, "loss": 2.316, "step": 9718 }, { "epoch": 0.97, "learning_rate": 3.612187288321245e-08, "loss": 2.3243, "step": 9719 }, { "epoch": 0.97, "learning_rate": 3.584682415976759e-08, "loss": 2.2283, "step": 9720 }, { "epoch": 0.97, "learning_rate": 3.5572824736379574e-08, "loss": 2.257, "step": 9721 }, { "epoch": 0.97, "learning_rate": 3.52998746419031e-08, "loss": 2.2681, "step": 9722 }, { "epoch": 0.97, "learning_rate": 3.502797390508184e-08, "loss": 2.4015, "step": 9723 }, { "epoch": 0.97, "learning_rate": 3.4757122554547326e-08, "loss": 2.2732, "step": 9724 }, { "epoch": 0.97, "learning_rate": 3.448732061882565e-08, "loss": 2.2441, "step": 9725 }, { "epoch": 0.97, "learning_rate": 3.4218568126326293e-08, "loss": 2.2995, "step": 9726 }, { "epoch": 0.97, "learning_rate": 3.3950865105351064e-08, "loss": 2.2784, "step": 9727 }, { "epoch": 0.97, "learning_rate": 3.3684211584091855e-08, "loss": 2.357, "step": 9728 }, { "epoch": 0.97, "learning_rate": 3.3418607590629536e-08, "loss": 2.3412, "step": 9729 }, { "epoch": 0.97, "learning_rate": 3.315405315293396e-08, "loss": 2.2924, "step": 9730 }, { "epoch": 0.97, "learning_rate": 3.2890548298863957e-08, "loss": 2.3422, "step": 9731 }, { "epoch": 0.98, "learning_rate": 3.262809305616954e-08, "loss": 2.2969, "step": 9732 }, { "epoch": 0.98, "learning_rate": 3.236668745248861e-08, "loss": 2.393, "step": 9733 }, { "epoch": 0.98, "learning_rate": 3.210633151535025e-08, "loss": 2.2681, "step": 9734 }, { "epoch": 0.98, "learning_rate": 3.184702527216921e-08, "loss": 2.2963, "step": 9735 }, { "epoch": 0.98, "learning_rate": 3.158876875025474e-08, "loss": 2.3967, "step": 9736 }, { "epoch": 0.98, "learning_rate": 3.133156197680398e-08, "loss": 2.28, "step": 9737 }, { "epoch": 0.98, "learning_rate": 3.107540497889971e-08, "loss": 2.3976, "step": 9738 }, { "epoch": 0.98, "learning_rate": 3.082029778352036e-08, "loss": 2.2299, "step": 9739 }, { "epoch": 0.98, "learning_rate": 3.056624041752776e-08, "loss": 2.1941, "step": 9740 }, { "epoch": 0.98, "learning_rate": 3.031323290767829e-08, "loss": 2.2592, "step": 9741 }, { "epoch": 0.98, "learning_rate": 3.006127528061398e-08, "loss": 2.3244, "step": 9742 }, { "epoch": 0.98, "learning_rate": 2.9810367562869144e-08, "loss": 2.3287, "step": 9743 }, { "epoch": 0.98, "learning_rate": 2.9560509780863777e-08, "loss": 2.2789, "step": 9744 }, { "epoch": 0.98, "learning_rate": 2.9311701960913485e-08, "loss": 2.2847, "step": 9745 }, { "epoch": 0.98, "learning_rate": 2.9063944129217315e-08, "loss": 2.244, "step": 9746 }, { "epoch": 0.98, "learning_rate": 2.8817236311866614e-08, "loss": 2.2368, "step": 9747 }, { "epoch": 0.98, "learning_rate": 2.8571578534840605e-08, "loss": 2.2635, "step": 9748 }, { "epoch": 0.98, "learning_rate": 2.8326970824010813e-08, "loss": 2.3472, "step": 9749 }, { "epoch": 0.98, "learning_rate": 2.8083413205134413e-08, "loss": 2.3455, "step": 9750 }, { "epoch": 0.98, "learning_rate": 2.7840905703860888e-08, "loss": 2.2391, "step": 9751 }, { "epoch": 0.98, "learning_rate": 2.7599448345727587e-08, "loss": 2.2084, "step": 9752 }, { "epoch": 0.98, "learning_rate": 2.7359041156161946e-08, "loss": 2.2849, "step": 9753 }, { "epoch": 0.98, "learning_rate": 2.7119684160480387e-08, "loss": 2.235, "step": 9754 }, { "epoch": 0.98, "learning_rate": 2.6881377383889406e-08, "loss": 2.347, "step": 9755 }, { "epoch": 0.98, "learning_rate": 2.6644120851484488e-08, "loss": 2.2774, "step": 9756 }, { "epoch": 0.98, "learning_rate": 2.6407914588251203e-08, "loss": 2.2585, "step": 9757 }, { "epoch": 0.98, "learning_rate": 2.617275861906188e-08, "loss": 2.209, "step": 9758 }, { "epoch": 0.98, "learning_rate": 2.5938652968682254e-08, "loss": 2.4164, "step": 9759 }, { "epoch": 0.98, "learning_rate": 2.5705597661763726e-08, "loss": 2.2886, "step": 9760 }, { "epoch": 0.98, "learning_rate": 2.5473592722849992e-08, "loss": 2.3167, "step": 9761 }, { "epoch": 0.98, "learning_rate": 2.5242638176372625e-08, "loss": 2.2892, "step": 9762 }, { "epoch": 0.98, "learning_rate": 2.5012734046652164e-08, "loss": 2.3435, "step": 9763 }, { "epoch": 0.98, "learning_rate": 2.478388035790036e-08, "loss": 2.2778, "step": 9764 }, { "epoch": 0.98, "learning_rate": 2.4556077134216817e-08, "loss": 2.3327, "step": 9765 }, { "epoch": 0.98, "learning_rate": 2.4329324399590125e-08, "loss": 2.3118, "step": 9766 }, { "epoch": 0.98, "learning_rate": 2.4103622177900077e-08, "loss": 2.2291, "step": 9767 }, { "epoch": 0.98, "learning_rate": 2.3878970492914322e-08, "loss": 2.3488, "step": 9768 }, { "epoch": 0.98, "learning_rate": 2.3655369368290605e-08, "loss": 2.2341, "step": 9769 }, { "epoch": 0.98, "learning_rate": 2.3432818827575645e-08, "loss": 2.3172, "step": 9770 }, { "epoch": 0.98, "learning_rate": 2.3211318894205136e-08, "loss": 2.2286, "step": 9771 }, { "epoch": 0.98, "learning_rate": 2.2990869591505982e-08, "loss": 2.2872, "step": 9772 }, { "epoch": 0.98, "learning_rate": 2.2771470942691832e-08, "loss": 2.3169, "step": 9773 }, { "epoch": 0.98, "learning_rate": 2.2553122970868647e-08, "loss": 2.2552, "step": 9774 }, { "epoch": 0.98, "learning_rate": 2.2335825699028034e-08, "loss": 2.2203, "step": 9775 }, { "epoch": 0.98, "learning_rate": 2.2119579150055027e-08, "loss": 2.3571, "step": 9776 }, { "epoch": 0.98, "learning_rate": 2.1904383346720293e-08, "loss": 2.317, "step": 9777 }, { "epoch": 0.98, "learning_rate": 2.169023831168571e-08, "loss": 2.316, "step": 9778 }, { "epoch": 0.98, "learning_rate": 2.147714406750434e-08, "loss": 2.3316, "step": 9779 }, { "epoch": 0.98, "learning_rate": 2.12651006366138e-08, "loss": 2.2832, "step": 9780 }, { "epoch": 0.98, "learning_rate": 2.1054108041346222e-08, "loss": 2.276, "step": 9781 }, { "epoch": 0.98, "learning_rate": 2.084416630391939e-08, "loss": 2.2448, "step": 9782 }, { "epoch": 0.98, "learning_rate": 2.063527544644228e-08, "loss": 2.3095, "step": 9783 }, { "epoch": 0.98, "learning_rate": 2.042743549091286e-08, "loss": 2.2503, "step": 9784 }, { "epoch": 0.98, "learning_rate": 2.0220646459216953e-08, "loss": 2.3624, "step": 9785 }, { "epoch": 0.98, "learning_rate": 2.0014908373132692e-08, "loss": 2.2651, "step": 9786 }, { "epoch": 0.98, "learning_rate": 1.9810221254323857e-08, "loss": 2.2257, "step": 9787 }, { "epoch": 0.98, "learning_rate": 1.9606585124347654e-08, "loss": 2.3518, "step": 9788 }, { "epoch": 0.98, "learning_rate": 1.9404000004648037e-08, "loss": 2.2648, "step": 9789 }, { "epoch": 0.98, "learning_rate": 1.9202465916557946e-08, "loss": 2.2425, "step": 9790 }, { "epoch": 0.98, "learning_rate": 1.9001982881300394e-08, "loss": 2.2898, "step": 9791 }, { "epoch": 0.98, "learning_rate": 1.8802550919988506e-08, "loss": 2.3756, "step": 9792 }, { "epoch": 0.98, "learning_rate": 1.860417005362325e-08, "loss": 2.3018, "step": 9793 }, { "epoch": 0.98, "learning_rate": 1.8406840303095698e-08, "loss": 2.3054, "step": 9794 }, { "epoch": 0.98, "learning_rate": 1.8210561689187e-08, "loss": 2.2595, "step": 9795 }, { "epoch": 0.98, "learning_rate": 1.8015334232566184e-08, "loss": 2.2682, "step": 9796 }, { "epoch": 0.98, "learning_rate": 1.7821157953791244e-08, "loss": 2.3965, "step": 9797 }, { "epoch": 0.98, "learning_rate": 1.7628032873312496e-08, "loss": 2.2262, "step": 9798 }, { "epoch": 0.98, "learning_rate": 1.7435959011465886e-08, "loss": 2.2584, "step": 9799 }, { "epoch": 0.98, "learning_rate": 1.7244936388477463e-08, "loss": 2.2974, "step": 9800 }, { "epoch": 0.98, "learning_rate": 1.7054965024465576e-08, "loss": 2.2628, "step": 9801 }, { "epoch": 0.98, "learning_rate": 1.6866044939435332e-08, "loss": 2.3179, "step": 9802 }, { "epoch": 0.98, "learning_rate": 1.6678176153279713e-08, "loss": 2.279, "step": 9803 }, { "epoch": 0.98, "learning_rate": 1.6491358685783997e-08, "loss": 2.3322, "step": 9804 }, { "epoch": 0.98, "learning_rate": 1.630559255662023e-08, "loss": 2.2009, "step": 9805 }, { "epoch": 0.98, "learning_rate": 1.6120877785352762e-08, "loss": 2.1631, "step": 9806 }, { "epoch": 0.98, "learning_rate": 1.5937214391431588e-08, "loss": 2.2786, "step": 9807 }, { "epoch": 0.98, "learning_rate": 1.5754602394200124e-08, "loss": 2.1808, "step": 9808 }, { "epoch": 0.98, "learning_rate": 1.5573041812886326e-08, "loss": 2.1421, "step": 9809 }, { "epoch": 0.98, "learning_rate": 1.539253266661156e-08, "loss": 2.3426, "step": 9810 }, { "epoch": 0.98, "learning_rate": 1.5213074974383956e-08, "loss": 2.2511, "step": 9811 }, { "epoch": 0.98, "learning_rate": 1.5034668755102842e-08, "loss": 2.2618, "step": 9812 }, { "epoch": 0.98, "learning_rate": 1.4857314027554304e-08, "loss": 2.2786, "step": 9813 }, { "epoch": 0.98, "learning_rate": 1.468101081041562e-08, "loss": 2.2403, "step": 9814 }, { "epoch": 0.98, "learning_rate": 1.450575912225305e-08, "loss": 2.3995, "step": 9815 }, { "epoch": 0.98, "learning_rate": 1.4331558981521831e-08, "loss": 2.2131, "step": 9816 }, { "epoch": 0.98, "learning_rate": 1.4158410406566181e-08, "loss": 2.3187, "step": 9817 }, { "epoch": 0.98, "learning_rate": 1.398631341562151e-08, "loss": 2.2884, "step": 9818 }, { "epoch": 0.98, "learning_rate": 1.3815268026808882e-08, "loss": 2.2115, "step": 9819 }, { "epoch": 0.98, "learning_rate": 1.364527425814166e-08, "loss": 2.317, "step": 9820 }, { "epoch": 0.98, "learning_rate": 1.3476332127521086e-08, "loss": 2.2135, "step": 9821 }, { "epoch": 0.98, "learning_rate": 1.3308441652738479e-08, "loss": 2.309, "step": 9822 }, { "epoch": 0.98, "learning_rate": 1.3141602851474144e-08, "loss": 2.3983, "step": 9823 }, { "epoch": 0.98, "learning_rate": 1.297581574129625e-08, "loss": 2.2654, "step": 9824 }, { "epoch": 0.98, "learning_rate": 1.2811080339664161e-08, "loss": 2.2939, "step": 9825 }, { "epoch": 0.98, "learning_rate": 1.2647396663926226e-08, "loss": 2.281, "step": 9826 }, { "epoch": 0.98, "learning_rate": 1.2484764731319765e-08, "loss": 2.1443, "step": 9827 }, { "epoch": 0.98, "learning_rate": 1.2323184558969969e-08, "loss": 2.2709, "step": 9828 }, { "epoch": 0.98, "learning_rate": 1.2162656163893228e-08, "loss": 2.2731, "step": 9829 }, { "epoch": 0.98, "learning_rate": 1.2003179562993795e-08, "loss": 2.2603, "step": 9830 }, { "epoch": 0.98, "learning_rate": 1.1844754773066014e-08, "loss": 2.3226, "step": 9831 }, { "epoch": 0.99, "learning_rate": 1.1687381810793208e-08, "loss": 2.4178, "step": 9832 }, { "epoch": 0.99, "learning_rate": 1.1531060692748786e-08, "loss": 2.3204, "step": 9833 }, { "epoch": 0.99, "learning_rate": 1.1375791435392913e-08, "loss": 2.2656, "step": 9834 }, { "epoch": 0.99, "learning_rate": 1.1221574055078065e-08, "loss": 2.3288, "step": 9835 }, { "epoch": 0.99, "learning_rate": 1.1068408568043477e-08, "loss": 2.3463, "step": 9836 }, { "epoch": 0.99, "learning_rate": 1.0916294990419574e-08, "loss": 2.2243, "step": 9837 }, { "epoch": 0.99, "learning_rate": 1.0765233338224657e-08, "loss": 2.2931, "step": 9838 }, { "epoch": 0.99, "learning_rate": 1.0615223627366e-08, "loss": 2.2064, "step": 9839 }, { "epoch": 0.99, "learning_rate": 1.0466265873640968e-08, "loss": 2.3523, "step": 9840 }, { "epoch": 0.99, "learning_rate": 1.0318360092737013e-08, "loss": 2.2451, "step": 9841 }, { "epoch": 0.99, "learning_rate": 1.017150630022834e-08, "loss": 2.308, "step": 9842 }, { "epoch": 0.99, "learning_rate": 1.0025704511580358e-08, "loss": 2.2445, "step": 9843 }, { "epoch": 0.99, "learning_rate": 9.880954742147453e-09, "loss": 2.3088, "step": 9844 }, { "epoch": 0.99, "learning_rate": 9.737257007171875e-09, "loss": 2.2697, "step": 9845 }, { "epoch": 0.99, "learning_rate": 9.594611321787073e-09, "loss": 2.2796, "step": 9846 }, { "epoch": 0.99, "learning_rate": 9.453017701014366e-09, "loss": 2.3344, "step": 9847 }, { "epoch": 0.99, "learning_rate": 9.31247615976516e-09, "loss": 2.3168, "step": 9848 }, { "epoch": 0.99, "learning_rate": 9.172986712838728e-09, "loss": 2.2438, "step": 9849 }, { "epoch": 0.99, "learning_rate": 9.034549374923318e-09, "loss": 2.3038, "step": 9850 }, { "epoch": 0.99, "learning_rate": 8.897164160600603e-09, "loss": 2.3555, "step": 9851 }, { "epoch": 0.99, "learning_rate": 8.760831084334565e-09, "loss": 2.3098, "step": 9852 }, { "epoch": 0.99, "learning_rate": 8.62555016048483e-09, "loss": 2.3324, "step": 9853 }, { "epoch": 0.99, "learning_rate": 8.49132140329667e-09, "loss": 2.3599, "step": 9854 }, { "epoch": 0.99, "learning_rate": 8.358144826904335e-09, "loss": 2.2193, "step": 9855 }, { "epoch": 0.99, "learning_rate": 8.226020445334381e-09, "loss": 2.3457, "step": 9856 }, { "epoch": 0.99, "learning_rate": 8.094948272499015e-09, "loss": 2.2344, "step": 9857 }, { "epoch": 0.99, "learning_rate": 7.964928322201638e-09, "loss": 2.3282, "step": 9858 }, { "epoch": 0.99, "learning_rate": 7.835960608133519e-09, "loss": 2.3068, "step": 9859 }, { "epoch": 0.99, "learning_rate": 7.70804514387713e-09, "loss": 2.2524, "step": 9860 }, { "epoch": 0.99, "learning_rate": 7.581181942901695e-09, "loss": 2.3391, "step": 9861 }, { "epoch": 0.99, "learning_rate": 7.455371018568746e-09, "loss": 2.3417, "step": 9862 }, { "epoch": 0.99, "learning_rate": 7.3306123841243586e-09, "loss": 2.3103, "step": 9863 }, { "epoch": 0.99, "learning_rate": 7.2069060527091285e-09, "loss": 2.3366, "step": 9864 }, { "epoch": 0.99, "learning_rate": 7.084252037349304e-09, "loss": 2.3549, "step": 9865 }, { "epoch": 0.99, "learning_rate": 6.96265035096122e-09, "loss": 2.2704, "step": 9866 }, { "epoch": 0.99, "learning_rate": 6.842101006350188e-09, "loss": 2.2836, "step": 9867 }, { "epoch": 0.99, "learning_rate": 6.722604016210499e-09, "loss": 2.2959, "step": 9868 }, { "epoch": 0.99, "learning_rate": 6.604159393127641e-09, "loss": 2.1567, "step": 9869 }, { "epoch": 0.99, "learning_rate": 6.486767149572748e-09, "loss": 2.3278, "step": 9870 }, { "epoch": 0.99, "learning_rate": 6.370427297910375e-09, "loss": 2.3196, "step": 9871 }, { "epoch": 0.99, "learning_rate": 6.255139850390723e-09, "loss": 2.2217, "step": 9872 }, { "epoch": 0.99, "learning_rate": 6.140904819154081e-09, "loss": 2.3123, "step": 9873 }, { "epoch": 0.99, "learning_rate": 6.027722216230825e-09, "loss": 2.3386, "step": 9874 }, { "epoch": 0.99, "learning_rate": 5.915592053540309e-09, "loss": 2.2921, "step": 9875 }, { "epoch": 0.99, "learning_rate": 5.804514342889755e-09, "loss": 2.3248, "step": 9876 }, { "epoch": 0.99, "learning_rate": 5.694489095976474e-09, "loss": 2.3419, "step": 9877 }, { "epoch": 0.99, "learning_rate": 5.585516324387863e-09, "loss": 2.3784, "step": 9878 }, { "epoch": 0.99, "learning_rate": 5.477596039598076e-09, "loss": 2.2797, "step": 9879 }, { "epoch": 0.99, "learning_rate": 5.370728252974689e-09, "loss": 2.3088, "step": 9880 }, { "epoch": 0.99, "learning_rate": 5.264912975768699e-09, "loss": 2.4121, "step": 9881 }, { "epoch": 0.99, "learning_rate": 5.160150219124527e-09, "loss": 2.2338, "step": 9882 }, { "epoch": 0.99, "learning_rate": 5.056439994074458e-09, "loss": 2.307, "step": 9883 }, { "epoch": 0.99, "learning_rate": 4.953782311540867e-09, "loss": 2.3782, "step": 9884 }, { "epoch": 0.99, "learning_rate": 4.852177182332884e-09, "loss": 2.2329, "step": 9885 }, { "epoch": 0.99, "learning_rate": 4.75162461714973e-09, "loss": 2.3205, "step": 9886 }, { "epoch": 0.99, "learning_rate": 4.652124626582932e-09, "loss": 2.2945, "step": 9887 }, { "epoch": 0.99, "learning_rate": 4.553677221108554e-09, "loss": 2.2531, "step": 9888 }, { "epoch": 0.99, "learning_rate": 4.4562824110938595e-09, "loss": 2.3187, "step": 9889 }, { "epoch": 0.99, "learning_rate": 4.3599402067973085e-09, "loss": 2.2836, "step": 9890 }, { "epoch": 0.99, "learning_rate": 4.264650618361898e-09, "loss": 2.4949, "step": 9891 }, { "epoch": 0.99, "learning_rate": 4.170413655822936e-09, "loss": 2.2467, "step": 9892 }, { "epoch": 0.99, "learning_rate": 4.077229329104704e-09, "loss": 2.3437, "step": 9893 }, { "epoch": 0.99, "learning_rate": 3.9850976480215745e-09, "loss": 2.2237, "step": 9894 }, { "epoch": 0.99, "learning_rate": 3.894018622273565e-09, "loss": 2.2378, "step": 9895 }, { "epoch": 0.99, "learning_rate": 3.803992261451894e-09, "loss": 2.2644, "step": 9896 }, { "epoch": 0.99, "learning_rate": 3.7150185750389757e-09, "loss": 2.2856, "step": 9897 }, { "epoch": 0.99, "learning_rate": 3.6270975724028713e-09, "loss": 2.332, "step": 9898 }, { "epoch": 0.99, "learning_rate": 3.540229262802841e-09, "loss": 2.2436, "step": 9899 }, { "epoch": 0.99, "learning_rate": 3.454413655387123e-09, "loss": 2.3359, "step": 9900 }, { "epoch": 0.99, "learning_rate": 3.3696507591918225e-09, "loss": 2.4168, "step": 9901 }, { "epoch": 0.99, "learning_rate": 3.2859405831442426e-09, "loss": 2.2626, "step": 9902 }, { "epoch": 0.99, "learning_rate": 3.203283136058444e-09, "loss": 2.2765, "step": 9903 }, { "epoch": 0.99, "learning_rate": 3.121678426639685e-09, "loss": 2.3209, "step": 9904 }, { "epoch": 0.99, "learning_rate": 3.041126463481092e-09, "loss": 2.2586, "step": 9905 }, { "epoch": 0.99, "learning_rate": 2.9616272550658797e-09, "loss": 2.3465, "step": 9906 }, { "epoch": 0.99, "learning_rate": 2.8831808097662396e-09, "loss": 2.2532, "step": 9907 }, { "epoch": 0.99, "learning_rate": 2.8057871358422306e-09, "loss": 2.3282, "step": 9908 }, { "epoch": 0.99, "learning_rate": 2.7294462414440002e-09, "loss": 2.2264, "step": 9909 }, { "epoch": 0.99, "learning_rate": 2.654158134611784e-09, "loss": 2.3085, "step": 9910 }, { "epoch": 0.99, "learning_rate": 2.579922823272574e-09, "loss": 2.2874, "step": 9911 }, { "epoch": 0.99, "learning_rate": 2.5067403152456704e-09, "loss": 2.298, "step": 9912 }, { "epoch": 0.99, "learning_rate": 2.434610618236022e-09, "loss": 2.2006, "step": 9913 }, { "epoch": 0.99, "learning_rate": 2.363533739840884e-09, "loss": 2.3501, "step": 9914 }, { "epoch": 0.99, "learning_rate": 2.2935096875442707e-09, "loss": 2.3855, "step": 9915 }, { "epoch": 0.99, "learning_rate": 2.224538468720283e-09, "loss": 2.3755, "step": 9916 }, { "epoch": 0.99, "learning_rate": 2.156620090632e-09, "loss": 2.1951, "step": 9917 }, { "epoch": 0.99, "learning_rate": 2.0897545604325888e-09, "loss": 2.3477, "step": 9918 }, { "epoch": 0.99, "learning_rate": 2.023941885161973e-09, "loss": 2.3147, "step": 9919 }, { "epoch": 0.99, "learning_rate": 1.9591820717523856e-09, "loss": 2.341, "step": 9920 }, { "epoch": 0.99, "learning_rate": 1.8954751270239268e-09, "loss": 2.342, "step": 9921 }, { "epoch": 0.99, "learning_rate": 1.8328210576823436e-09, "loss": 2.2934, "step": 9922 }, { "epoch": 0.99, "learning_rate": 1.7712198703290217e-09, "loss": 2.2508, "step": 9923 }, { "epoch": 0.99, "learning_rate": 1.7106715714487742e-09, "loss": 2.3901, "step": 9924 }, { "epoch": 0.99, "learning_rate": 1.651176167418722e-09, "loss": 2.286, "step": 9925 }, { "epoch": 0.99, "learning_rate": 1.5927336645038538e-09, "loss": 2.3765, "step": 9926 }, { "epoch": 0.99, "learning_rate": 1.535344068859246e-09, "loss": 2.2578, "step": 9927 }, { "epoch": 0.99, "learning_rate": 1.479007386527842e-09, "loss": 2.2726, "step": 9928 }, { "epoch": 0.99, "learning_rate": 1.423723623441564e-09, "loss": 2.3885, "step": 9929 }, { "epoch": 0.99, "learning_rate": 1.369492785424642e-09, "loss": 2.3004, "step": 9930 }, { "epoch": 0.99, "learning_rate": 1.3163148781847323e-09, "loss": 2.3024, "step": 9931 }, { "epoch": 1.0, "learning_rate": 1.2641899073251307e-09, "loss": 2.2902, "step": 9932 }, { "epoch": 1.0, "learning_rate": 1.2131178783325593e-09, "loss": 2.2851, "step": 9933 }, { "epoch": 1.0, "learning_rate": 1.1630987965860485e-09, "loss": 2.2788, "step": 9934 }, { "epoch": 1.0, "learning_rate": 1.1141326673536067e-09, "loss": 2.2305, "step": 9935 }, { "epoch": 1.0, "learning_rate": 1.0662194957911097e-09, "loss": 2.2542, "step": 9936 }, { "epoch": 1.0, "learning_rate": 1.0193592869445212e-09, "loss": 2.3246, "step": 9937 }, { "epoch": 1.0, "learning_rate": 9.735520457476721e-10, "loss": 2.3732, "step": 9938 }, { "epoch": 1.0, "learning_rate": 9.287977770255918e-10, "loss": 2.3529, "step": 9939 }, { "epoch": 1.0, "learning_rate": 8.850964854900668e-10, "loss": 2.25, "step": 9940 }, { "epoch": 1.0, "learning_rate": 8.424481757440817e-10, "loss": 2.4634, "step": 9941 }, { "epoch": 1.0, "learning_rate": 8.008528522795989e-10, "loss": 2.2286, "step": 9942 }, { "epoch": 1.0, "learning_rate": 7.603105194742277e-10, "loss": 2.1819, "step": 9943 }, { "epoch": 1.0, "learning_rate": 7.208211816001065e-10, "loss": 2.3809, "step": 9944 }, { "epoch": 1.0, "learning_rate": 6.823848428150204e-10, "loss": 2.3471, "step": 9945 }, { "epoch": 1.0, "learning_rate": 6.450015071657323e-10, "loss": 2.3137, "step": 9946 }, { "epoch": 1.0, "learning_rate": 6.08671178589093e-10, "loss": 2.2606, "step": 9947 }, { "epoch": 1.0, "learning_rate": 5.733938609120415e-10, "loss": 2.3316, "step": 9948 }, { "epoch": 1.0, "learning_rate": 5.391695578482736e-10, "loss": 2.277, "step": 9949 }, { "epoch": 1.0, "learning_rate": 5.059982730037937e-10, "loss": 2.2726, "step": 9950 }, { "epoch": 1.0, "learning_rate": 4.738800098691432e-10, "loss": 2.3045, "step": 9951 }, { "epoch": 1.0, "learning_rate": 4.428147718282816e-10, "loss": 2.2481, "step": 9952 }, { "epoch": 1.0, "learning_rate": 4.1280256215192607e-10, "loss": 2.1794, "step": 9953 }, { "epoch": 1.0, "learning_rate": 3.8384338400199173e-10, "loss": 2.2247, "step": 9954 }, { "epoch": 1.0, "learning_rate": 3.5593724042604085e-10, "loss": 2.3082, "step": 9955 }, { "epoch": 1.0, "learning_rate": 3.290841343650542e-10, "loss": 2.2955, "step": 9956 }, { "epoch": 1.0, "learning_rate": 3.0328406864454927e-10, "loss": 2.2568, "step": 9957 }, { "epoch": 1.0, "learning_rate": 2.785370459823522e-10, "loss": 2.2581, "step": 9958 }, { "epoch": 1.0, "learning_rate": 2.5484306898526657e-10, "loss": 2.2835, "step": 9959 }, { "epoch": 1.0, "learning_rate": 2.322021401479635e-10, "loss": 2.1314, "step": 9960 }, { "epoch": 1.0, "learning_rate": 2.1061426185409183e-10, "loss": 2.2617, "step": 9961 }, { "epoch": 1.0, "learning_rate": 1.9007943637849858e-10, "loss": 2.3227, "step": 9962 }, { "epoch": 1.0, "learning_rate": 1.705976658816777e-10, "loss": 2.3167, "step": 9963 }, { "epoch": 1.0, "learning_rate": 1.5216895241643159e-10, "loss": 2.2792, "step": 9964 }, { "epoch": 1.0, "learning_rate": 1.347932979234301e-10, "loss": 2.423, "step": 9965 }, { "epoch": 1.0, "learning_rate": 1.1847070423232076e-10, "loss": 2.2157, "step": 9966 }, { "epoch": 1.0, "learning_rate": 1.0320117306172883e-10, "loss": 2.2014, "step": 9967 }, { "epoch": 1.0, "learning_rate": 8.898470602036746e-11, "loss": 2.1911, "step": 9968 }, { "epoch": 1.0, "learning_rate": 7.582130460481729e-11, "loss": 2.277, "step": 9969 }, { "epoch": 1.0, "learning_rate": 6.371097020063666e-11, "loss": 2.2855, "step": 9970 }, { "epoch": 1.0, "learning_rate": 5.2653704084582035e-11, "loss": 2.3621, "step": 9971 }, { "epoch": 1.0, "learning_rate": 4.264950741905693e-11, "loss": 2.3, "step": 9972 }, { "epoch": 1.0, "learning_rate": 3.369838125988345e-11, "loss": 2.3096, "step": 9973 }, { "epoch": 1.0, "learning_rate": 2.5800326548530708e-11, "loss": 2.4055, "step": 9974 }, { "epoch": 1.0, "learning_rate": 1.895534411655575e-11, "loss": 2.3013, "step": 9975 }, { "epoch": 1.0, "learning_rate": 1.3163434684493327e-11, "loss": 2.203, "step": 9976 }, { "epoch": 1.0, "learning_rate": 8.424598864076317e-12, "loss": 2.2529, "step": 9977 }, { "epoch": 1.0, "learning_rate": 4.738837151574416e-12, "loss": 2.2064, "step": 9978 }, { "epoch": 1.0, "learning_rate": 2.1061499377861284e-12, "loss": 2.2497, "step": 9979 }, { "epoch": 1.0, "learning_rate": 5.265374980467641e-13, "loss": 2.2302, "step": 9980 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 2.24, "step": 9981 }, { "epoch": 1.0, "step": 9981, "total_flos": 552640681082880.0, "train_loss": 2.3696637807180476, "train_runtime": 80722.6014, "train_samples_per_second": 15.825, "train_steps_per_second": 0.124 } ], "logging_steps": 1.0, "max_steps": 9981, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 50000, "total_flos": 552640681082880.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }