diff --git "a/Luminia-8B-RP/trainer_log.jsonl" "b/Luminia-8B-RP/trainer_log.jsonl" new file mode 100644--- /dev/null +++ "b/Luminia-8B-RP/trainer_log.jsonl" @@ -0,0 +1,874 @@ +{"current_steps": 10, "total_steps": 8739, "loss": 1.5075, "learning_rate": 5.000000000000001e-07, "epoch": 0.0011442956860052637, "percentage": 0.11, "elapsed_time": "0:00:50", "remaining_time": "12:08:05", "throughput": 1636.89, "total_tokens": 81920} +{"current_steps": 20, "total_steps": 8739, "loss": 1.379, "learning_rate": 1.0000000000000002e-06, "epoch": 0.0022885913720105274, "percentage": 0.23, "elapsed_time": "0:01:33", "remaining_time": "11:22:03", "throughput": 1745.37, "total_tokens": 163840} +{"current_steps": 30, "total_steps": 8739, "loss": 1.6386, "learning_rate": 1.5e-06, "epoch": 0.0034328870580157913, "percentage": 0.34, "elapsed_time": "0:02:17", "remaining_time": "11:04:46", "throughput": 1788.66, "total_tokens": 245760} +{"current_steps": 40, "total_steps": 8739, "loss": 1.5525, "learning_rate": 2.0000000000000003e-06, "epoch": 0.004577182744021055, "percentage": 0.46, "elapsed_time": "0:03:00", "remaining_time": "10:55:44", "throughput": 1811.24, "total_tokens": 327680} +{"current_steps": 50, "total_steps": 8739, "loss": 1.651, "learning_rate": 2.5e-06, "epoch": 0.005721478430026319, "percentage": 0.57, "elapsed_time": "0:03:44", "remaining_time": "10:51:18", "throughput": 1821.47, "total_tokens": 409600} +{"current_steps": 60, "total_steps": 8739, "loss": 1.5067, "learning_rate": 3e-06, "epoch": 0.006865774116031583, "percentage": 0.69, "elapsed_time": "0:04:28", "remaining_time": "10:47:36", "throughput": 1829.78, "total_tokens": 491520} +{"current_steps": 70, "total_steps": 8739, "loss": 1.3367, "learning_rate": 3.5000000000000004e-06, "epoch": 0.008010069802036847, "percentage": 0.8, "elapsed_time": "0:05:12", "remaining_time": "10:44:57", "throughput": 1835.15, "total_tokens": 573440} +{"current_steps": 80, "total_steps": 8739, "loss": 1.6071, "learning_rate": 4.000000000000001e-06, "epoch": 0.00915436548804211, "percentage": 0.92, "elapsed_time": "0:05:56", "remaining_time": "10:42:28", "throughput": 1840.12, "total_tokens": 655360} +{"current_steps": 90, "total_steps": 8739, "loss": 1.522, "learning_rate": 4.5e-06, "epoch": 0.010298661174047374, "percentage": 1.03, "elapsed_time": "0:06:39", "remaining_time": "10:40:39", "throughput": 1843.21, "total_tokens": 737280} +{"current_steps": 100, "total_steps": 8739, "loss": 1.5853, "learning_rate": 5e-06, "epoch": 0.011442956860052637, "percentage": 1.14, "elapsed_time": "0:07:23", "remaining_time": "10:38:56", "throughput": 1846.03, "total_tokens": 819200} +{"current_steps": 110, "total_steps": 8739, "loss": 1.4081, "learning_rate": 5.500000000000001e-06, "epoch": 0.012587252546057902, "percentage": 1.26, "elapsed_time": "0:08:07", "remaining_time": "10:37:11", "throughput": 1848.96, "total_tokens": 901120} +{"current_steps": 120, "total_steps": 8739, "loss": 1.5405, "learning_rate": 6e-06, "epoch": 0.013731548232063165, "percentage": 1.37, "elapsed_time": "0:08:51", "remaining_time": "10:36:02", "throughput": 1850.19, "total_tokens": 983040} +{"current_steps": 130, "total_steps": 8739, "loss": 1.3632, "learning_rate": 6.5000000000000004e-06, "epoch": 0.014875843918068428, "percentage": 1.49, "elapsed_time": "0:09:35", "remaining_time": "10:34:57", "throughput": 1851.19, "total_tokens": 1064960} +{"current_steps": 140, "total_steps": 8739, "loss": 1.128, "learning_rate": 7.000000000000001e-06, "epoch": 0.016020139604073693, "percentage": 1.6, "elapsed_time": "0:10:19", "remaining_time": "10:34:06", "throughput": 1851.49, "total_tokens": 1146880} +{"current_steps": 150, "total_steps": 8739, "loss": 1.3543, "learning_rate": 7.5e-06, "epoch": 0.017164435290078956, "percentage": 1.72, "elapsed_time": "0:11:03", "remaining_time": "10:33:12", "throughput": 1851.99, "total_tokens": 1228800} +{"current_steps": 160, "total_steps": 8739, "loss": 1.3541, "learning_rate": 8.000000000000001e-06, "epoch": 0.01830873097608422, "percentage": 1.83, "elapsed_time": "0:11:47", "remaining_time": "10:32:00", "throughput": 1853.31, "total_tokens": 1310720} +{"current_steps": 170, "total_steps": 8739, "loss": 1.4476, "learning_rate": 8.500000000000002e-06, "epoch": 0.019453026662089482, "percentage": 1.95, "elapsed_time": "0:12:30", "remaining_time": "10:30:49", "throughput": 1854.64, "total_tokens": 1392640} +{"current_steps": 180, "total_steps": 8739, "loss": 1.212, "learning_rate": 9e-06, "epoch": 0.02059732234809475, "percentage": 2.06, "elapsed_time": "0:13:14", "remaining_time": "10:29:44", "throughput": 1855.68, "total_tokens": 1474560} +{"current_steps": 190, "total_steps": 8739, "loss": 1.3312, "learning_rate": 9.5e-06, "epoch": 0.021741618034100012, "percentage": 2.17, "elapsed_time": "0:13:58", "remaining_time": "10:28:44", "throughput": 1856.44, "total_tokens": 1556480} +{"current_steps": 200, "total_steps": 8739, "loss": 1.3266, "learning_rate": 1e-05, "epoch": 0.022885913720105275, "percentage": 2.29, "elapsed_time": "0:14:42", "remaining_time": "10:27:51", "throughput": 1856.86, "total_tokens": 1638400} +{"current_steps": 210, "total_steps": 8739, "loss": 1.3106, "learning_rate": 1.05e-05, "epoch": 0.024030209406110538, "percentage": 2.4, "elapsed_time": "0:15:26", "remaining_time": "10:26:57", "throughput": 1857.38, "total_tokens": 1720320} +{"current_steps": 220, "total_steps": 8739, "loss": 1.4398, "learning_rate": 1.1000000000000001e-05, "epoch": 0.025174505092115804, "percentage": 2.52, "elapsed_time": "0:16:10", "remaining_time": "10:26:03", "throughput": 1857.84, "total_tokens": 1802240} +{"current_steps": 230, "total_steps": 8739, "loss": 1.1946, "learning_rate": 1.1500000000000002e-05, "epoch": 0.026318800778121067, "percentage": 2.63, "elapsed_time": "0:16:53", "remaining_time": "10:25:07", "throughput": 1858.47, "total_tokens": 1884160} +{"current_steps": 240, "total_steps": 8739, "loss": 1.2912, "learning_rate": 1.2e-05, "epoch": 0.02746309646412633, "percentage": 2.75, "elapsed_time": "0:17:37", "remaining_time": "10:24:11", "throughput": 1859.04, "total_tokens": 1966080} +{"current_steps": 250, "total_steps": 8739, "loss": 1.5374, "learning_rate": 1.25e-05, "epoch": 0.028607392150131594, "percentage": 2.86, "elapsed_time": "0:18:21", "remaining_time": "10:23:17", "throughput": 1859.52, "total_tokens": 2048000} +{"current_steps": 260, "total_steps": 8739, "loss": 1.4559, "learning_rate": 1.3000000000000001e-05, "epoch": 0.029751687836136857, "percentage": 2.98, "elapsed_time": "0:19:05", "remaining_time": "10:22:21", "throughput": 1860.13, "total_tokens": 2129920} +{"current_steps": 270, "total_steps": 8739, "loss": 1.4361, "learning_rate": 1.3500000000000001e-05, "epoch": 0.030895983522142123, "percentage": 3.09, "elapsed_time": "0:19:48", "remaining_time": "10:21:32", "throughput": 1860.39, "total_tokens": 2211840} +{"current_steps": 280, "total_steps": 8739, "loss": 1.7506, "learning_rate": 1.4000000000000001e-05, "epoch": 0.032040279208147386, "percentage": 3.2, "elapsed_time": "0:20:32", "remaining_time": "10:20:41", "throughput": 1860.75, "total_tokens": 2293760} +{"current_steps": 290, "total_steps": 8739, "loss": 1.5946, "learning_rate": 1.45e-05, "epoch": 0.03318457489415265, "percentage": 3.32, "elapsed_time": "0:21:16", "remaining_time": "10:19:57", "throughput": 1860.74, "total_tokens": 2375680} +{"current_steps": 300, "total_steps": 8739, "loss": 1.386, "learning_rate": 1.5e-05, "epoch": 0.03432887058015791, "percentage": 3.43, "elapsed_time": "0:22:00", "remaining_time": "10:19:01", "throughput": 1861.35, "total_tokens": 2457600} +{"current_steps": 310, "total_steps": 8739, "loss": 1.1091, "learning_rate": 1.55e-05, "epoch": 0.035473166266163175, "percentage": 3.55, "elapsed_time": "0:22:44", "remaining_time": "10:18:11", "throughput": 1861.63, "total_tokens": 2539520} +{"current_steps": 320, "total_steps": 8739, "loss": 1.3287, "learning_rate": 1.6000000000000003e-05, "epoch": 0.03661746195216844, "percentage": 3.66, "elapsed_time": "0:23:28", "remaining_time": "10:17:24", "throughput": 1861.77, "total_tokens": 2621440} +{"current_steps": 330, "total_steps": 8739, "loss": 1.2537, "learning_rate": 1.65e-05, "epoch": 0.0377617576381737, "percentage": 3.78, "elapsed_time": "0:24:11", "remaining_time": "10:16:30", "throughput": 1862.29, "total_tokens": 2703360} +{"current_steps": 340, "total_steps": 8739, "loss": 1.4166, "learning_rate": 1.7000000000000003e-05, "epoch": 0.038906053324178964, "percentage": 3.89, "elapsed_time": "0:24:55", "remaining_time": "10:15:46", "throughput": 1862.27, "total_tokens": 2785280} +{"current_steps": 350, "total_steps": 8739, "loss": 1.298, "learning_rate": 1.75e-05, "epoch": 0.040050349010184234, "percentage": 4.01, "elapsed_time": "0:25:39", "remaining_time": "10:15:02", "throughput": 1862.29, "total_tokens": 2867200} +{"current_steps": 360, "total_steps": 8739, "loss": 1.4127, "learning_rate": 1.8e-05, "epoch": 0.0411946446961895, "percentage": 4.12, "elapsed_time": "0:26:23", "remaining_time": "10:14:18", "throughput": 1862.25, "total_tokens": 2949120} +{"current_steps": 370, "total_steps": 8739, "loss": 1.1462, "learning_rate": 1.85e-05, "epoch": 0.04233894038219476, "percentage": 4.23, "elapsed_time": "0:27:07", "remaining_time": "10:13:34", "throughput": 1862.29, "total_tokens": 3031040} +{"current_steps": 380, "total_steps": 8739, "loss": 1.5957, "learning_rate": 1.9e-05, "epoch": 0.043483236068200024, "percentage": 4.35, "elapsed_time": "0:27:51", "remaining_time": "10:12:47", "throughput": 1862.44, "total_tokens": 3112960} +{"current_steps": 390, "total_steps": 8739, "loss": 1.3672, "learning_rate": 1.9500000000000003e-05, "epoch": 0.04462753175420529, "percentage": 4.46, "elapsed_time": "0:28:35", "remaining_time": "10:11:58", "throughput": 1862.66, "total_tokens": 3194880} +{"current_steps": 400, "total_steps": 8739, "loss": 1.2616, "learning_rate": 2e-05, "epoch": 0.04577182744021055, "percentage": 4.58, "elapsed_time": "0:29:19", "remaining_time": "10:11:15", "throughput": 1862.62, "total_tokens": 3276800} +{"current_steps": 410, "total_steps": 8739, "loss": 1.1038, "learning_rate": 2.05e-05, "epoch": 0.04691612312621581, "percentage": 4.69, "elapsed_time": "0:30:02", "remaining_time": "10:10:26", "throughput": 1862.87, "total_tokens": 3358720} +{"current_steps": 420, "total_steps": 8739, "loss": 1.3898, "learning_rate": 2.1e-05, "epoch": 0.048060418812221076, "percentage": 4.81, "elapsed_time": "0:30:46", "remaining_time": "10:09:38", "throughput": 1863.11, "total_tokens": 3440640} +{"current_steps": 430, "total_steps": 8739, "loss": 1.2665, "learning_rate": 2.15e-05, "epoch": 0.04920471449822634, "percentage": 4.92, "elapsed_time": "0:31:31", "remaining_time": "10:09:03", "throughput": 1862.66, "total_tokens": 3522560} +{"current_steps": 440, "total_steps": 8739, "loss": 1.188, "learning_rate": 2.2000000000000003e-05, "epoch": 0.05034901018423161, "percentage": 5.03, "elapsed_time": "0:32:15", "remaining_time": "10:08:18", "throughput": 1862.71, "total_tokens": 3604480} +{"current_steps": 450, "total_steps": 8739, "loss": 1.4607, "learning_rate": 2.25e-05, "epoch": 0.05149330587023687, "percentage": 5.15, "elapsed_time": "0:32:58", "remaining_time": "10:07:30", "throughput": 1862.92, "total_tokens": 3686400} +{"current_steps": 460, "total_steps": 8739, "loss": 1.1622, "learning_rate": 2.3000000000000003e-05, "epoch": 0.052637601556242135, "percentage": 5.26, "elapsed_time": "0:33:42", "remaining_time": "10:06:45", "throughput": 1862.97, "total_tokens": 3768320} +{"current_steps": 470, "total_steps": 8739, "loss": 1.3681, "learning_rate": 2.35e-05, "epoch": 0.0537818972422474, "percentage": 5.38, "elapsed_time": "0:34:26", "remaining_time": "10:05:59", "throughput": 1863.03, "total_tokens": 3850240} +{"current_steps": 480, "total_steps": 8739, "loss": 1.341, "learning_rate": 2.4e-05, "epoch": 0.05492619292825266, "percentage": 5.49, "elapsed_time": "0:35:10", "remaining_time": "10:05:13", "throughput": 1863.15, "total_tokens": 3932160} +{"current_steps": 490, "total_steps": 8739, "loss": 1.0104, "learning_rate": 2.45e-05, "epoch": 0.056070488614257924, "percentage": 5.61, "elapsed_time": "0:35:54", "remaining_time": "10:04:29", "throughput": 1863.18, "total_tokens": 4014080} +{"current_steps": 500, "total_steps": 8739, "loss": 1.4473, "learning_rate": 2.5e-05, "epoch": 0.05721478430026319, "percentage": 5.72, "elapsed_time": "0:36:38", "remaining_time": "10:03:42", "throughput": 1863.33, "total_tokens": 4096000} +{"current_steps": 510, "total_steps": 8739, "loss": 1.5255, "learning_rate": 2.5500000000000003e-05, "epoch": 0.05835907998626845, "percentage": 5.84, "elapsed_time": "0:37:22", "remaining_time": "10:03:09", "throughput": 1862.76, "total_tokens": 4177920} +{"current_steps": 520, "total_steps": 8739, "loss": 1.3778, "learning_rate": 2.6000000000000002e-05, "epoch": 0.05950337567227371, "percentage": 5.95, "elapsed_time": "0:38:06", "remaining_time": "10:02:19", "throughput": 1863.05, "total_tokens": 4259840} +{"current_steps": 530, "total_steps": 8739, "loss": 1.1477, "learning_rate": 2.6500000000000004e-05, "epoch": 0.060647671358278976, "percentage": 6.06, "elapsed_time": "0:38:50", "remaining_time": "10:01:34", "throughput": 1863.13, "total_tokens": 4341760} +{"current_steps": 540, "total_steps": 8739, "loss": 1.4827, "learning_rate": 2.7000000000000002e-05, "epoch": 0.061791967044284246, "percentage": 6.18, "elapsed_time": "0:39:34", "remaining_time": "10:00:48", "throughput": 1863.2, "total_tokens": 4423680} +{"current_steps": 550, "total_steps": 8739, "loss": 1.635, "learning_rate": 2.7500000000000004e-05, "epoch": 0.0629362627302895, "percentage": 6.29, "elapsed_time": "0:40:17", "remaining_time": "10:00:00", "throughput": 1863.41, "total_tokens": 4505600} +{"current_steps": 560, "total_steps": 8739, "loss": 1.2354, "learning_rate": 2.8000000000000003e-05, "epoch": 0.06408055841629477, "percentage": 6.41, "elapsed_time": "0:41:01", "remaining_time": "9:59:15", "throughput": 1863.49, "total_tokens": 4587520} +{"current_steps": 570, "total_steps": 8739, "loss": 1.3294, "learning_rate": 2.8499999999999998e-05, "epoch": 0.06522485410230003, "percentage": 6.52, "elapsed_time": "0:41:45", "remaining_time": "9:58:28", "throughput": 1863.62, "total_tokens": 4669440} +{"current_steps": 580, "total_steps": 8739, "loss": 1.3841, "learning_rate": 2.9e-05, "epoch": 0.0663691497883053, "percentage": 6.64, "elapsed_time": "0:42:29", "remaining_time": "9:57:47", "throughput": 1863.5, "total_tokens": 4751360} +{"current_steps": 590, "total_steps": 8739, "loss": 1.3379, "learning_rate": 2.95e-05, "epoch": 0.06751344547431057, "percentage": 6.75, "elapsed_time": "0:43:13", "remaining_time": "9:56:59", "throughput": 1863.7, "total_tokens": 4833280} +{"current_steps": 600, "total_steps": 8739, "loss": 1.187, "learning_rate": 3e-05, "epoch": 0.06865774116031582, "percentage": 6.87, "elapsed_time": "0:43:57", "remaining_time": "9:56:14", "throughput": 1863.72, "total_tokens": 4915200} +{"current_steps": 610, "total_steps": 8739, "loss": 1.5078, "learning_rate": 3.05e-05, "epoch": 0.0698020368463211, "percentage": 6.98, "elapsed_time": "0:44:41", "remaining_time": "9:55:31", "throughput": 1863.7, "total_tokens": 4997120} +{"current_steps": 620, "total_steps": 8739, "loss": 1.4624, "learning_rate": 3.1e-05, "epoch": 0.07094633253232635, "percentage": 7.09, "elapsed_time": "0:45:25", "remaining_time": "9:54:47", "throughput": 1863.72, "total_tokens": 5079040} +{"current_steps": 630, "total_steps": 8739, "loss": 1.2244, "learning_rate": 3.15e-05, "epoch": 0.07209062821833162, "percentage": 7.21, "elapsed_time": "0:46:08", "remaining_time": "9:53:56", "throughput": 1864.06, "total_tokens": 5160960} +{"current_steps": 640, "total_steps": 8739, "loss": 1.4688, "learning_rate": 3.2000000000000005e-05, "epoch": 0.07323492390433688, "percentage": 7.32, "elapsed_time": "0:46:52", "remaining_time": "9:53:14", "throughput": 1863.96, "total_tokens": 5242880} +{"current_steps": 650, "total_steps": 8739, "loss": 1.1677, "learning_rate": 3.2500000000000004e-05, "epoch": 0.07437921959034215, "percentage": 7.44, "elapsed_time": "0:47:36", "remaining_time": "9:52:30", "throughput": 1863.99, "total_tokens": 5324800} +{"current_steps": 660, "total_steps": 8739, "loss": 1.2562, "learning_rate": 3.3e-05, "epoch": 0.0755235152763474, "percentage": 7.55, "elapsed_time": "0:48:20", "remaining_time": "9:51:44", "throughput": 1864.1, "total_tokens": 5406720} +{"current_steps": 670, "total_steps": 8739, "loss": 1.3111, "learning_rate": 3.35e-05, "epoch": 0.07666781096235267, "percentage": 7.67, "elapsed_time": "0:49:04", "remaining_time": "9:50:59", "throughput": 1864.12, "total_tokens": 5488640} +{"current_steps": 680, "total_steps": 8739, "loss": 1.2953, "learning_rate": 3.4000000000000007e-05, "epoch": 0.07781210664835793, "percentage": 7.78, "elapsed_time": "0:49:48", "remaining_time": "9:50:14", "throughput": 1864.22, "total_tokens": 5570560} +{"current_steps": 690, "total_steps": 8739, "loss": 1.2493, "learning_rate": 3.45e-05, "epoch": 0.0789564023343632, "percentage": 7.9, "elapsed_time": "0:50:32", "remaining_time": "9:49:30", "throughput": 1864.18, "total_tokens": 5652480} +{"current_steps": 700, "total_steps": 8739, "loss": 1.3966, "learning_rate": 3.5e-05, "epoch": 0.08010069802036847, "percentage": 8.01, "elapsed_time": "0:51:16", "remaining_time": "9:48:46", "throughput": 1864.17, "total_tokens": 5734400} +{"current_steps": 710, "total_steps": 8739, "loss": 1.1898, "learning_rate": 3.55e-05, "epoch": 0.08124499370637372, "percentage": 8.12, "elapsed_time": "0:51:59", "remaining_time": "9:47:59", "throughput": 1864.35, "total_tokens": 5816320} +{"current_steps": 720, "total_steps": 8739, "loss": 1.3558, "learning_rate": 3.6e-05, "epoch": 0.082389289392379, "percentage": 8.24, "elapsed_time": "0:52:43", "remaining_time": "9:47:14", "throughput": 1864.39, "total_tokens": 5898240} +{"current_steps": 730, "total_steps": 8739, "loss": 1.6577, "learning_rate": 3.65e-05, "epoch": 0.08353358507838425, "percentage": 8.35, "elapsed_time": "0:53:27", "remaining_time": "9:46:30", "throughput": 1864.44, "total_tokens": 5980160} +{"current_steps": 740, "total_steps": 8739, "loss": 1.2571, "learning_rate": 3.7e-05, "epoch": 0.08467788076438952, "percentage": 8.47, "elapsed_time": "0:54:11", "remaining_time": "9:45:42", "throughput": 1864.64, "total_tokens": 6062080} +{"current_steps": 750, "total_steps": 8739, "loss": 1.3735, "learning_rate": 3.7500000000000003e-05, "epoch": 0.08582217645039478, "percentage": 8.58, "elapsed_time": "0:54:55", "remaining_time": "9:45:00", "throughput": 1864.55, "total_tokens": 6144000} +{"current_steps": 760, "total_steps": 8739, "loss": 1.2731, "learning_rate": 3.8e-05, "epoch": 0.08696647213640005, "percentage": 8.7, "elapsed_time": "0:55:39", "remaining_time": "9:44:17", "throughput": 1864.49, "total_tokens": 6225920} +{"current_steps": 770, "total_steps": 8739, "loss": 1.543, "learning_rate": 3.85e-05, "epoch": 0.0881107678224053, "percentage": 8.81, "elapsed_time": "0:56:23", "remaining_time": "9:43:32", "throughput": 1864.51, "total_tokens": 6307840} +{"current_steps": 780, "total_steps": 8739, "loss": 1.1869, "learning_rate": 3.9000000000000006e-05, "epoch": 0.08925506350841057, "percentage": 8.93, "elapsed_time": "0:57:06", "remaining_time": "9:42:46", "throughput": 1864.64, "total_tokens": 6389760} +{"current_steps": 790, "total_steps": 8739, "loss": 1.6793, "learning_rate": 3.9500000000000005e-05, "epoch": 0.09039935919441584, "percentage": 9.04, "elapsed_time": "0:57:50", "remaining_time": "9:42:03", "throughput": 1864.59, "total_tokens": 6471680} +{"current_steps": 800, "total_steps": 8739, "loss": 1.7236, "learning_rate": 4e-05, "epoch": 0.0915436548804211, "percentage": 9.15, "elapsed_time": "0:58:34", "remaining_time": "9:41:17", "throughput": 1864.73, "total_tokens": 6553600} +{"current_steps": 810, "total_steps": 8739, "loss": 1.1466, "learning_rate": 4.05e-05, "epoch": 0.09268795056642637, "percentage": 9.27, "elapsed_time": "0:59:18", "remaining_time": "9:40:33", "throughput": 1864.7, "total_tokens": 6635520} +{"current_steps": 820, "total_steps": 8739, "loss": 1.308, "learning_rate": 4.1e-05, "epoch": 0.09383224625243163, "percentage": 9.38, "elapsed_time": "1:00:02", "remaining_time": "9:39:46", "throughput": 1864.87, "total_tokens": 6717440} +{"current_steps": 830, "total_steps": 8739, "loss": 1.1448, "learning_rate": 4.15e-05, "epoch": 0.0949765419384369, "percentage": 9.5, "elapsed_time": "1:00:45", "remaining_time": "9:39:00", "throughput": 1864.96, "total_tokens": 6799360} +{"current_steps": 840, "total_steps": 8739, "loss": 1.1618, "learning_rate": 4.2e-05, "epoch": 0.09612083762444215, "percentage": 9.61, "elapsed_time": "1:01:29", "remaining_time": "9:38:16", "throughput": 1864.98, "total_tokens": 6881280} +{"current_steps": 850, "total_steps": 8739, "loss": 1.3667, "learning_rate": 4.25e-05, "epoch": 0.09726513331044742, "percentage": 9.73, "elapsed_time": "1:02:13", "remaining_time": "9:37:35", "throughput": 1864.82, "total_tokens": 6963200} +{"current_steps": 860, "total_steps": 8739, "loss": 1.3752, "learning_rate": 4.3e-05, "epoch": 0.09840942899645268, "percentage": 9.84, "elapsed_time": "1:02:57", "remaining_time": "9:36:50", "throughput": 1864.89, "total_tokens": 7045120} +{"current_steps": 870, "total_steps": 8739, "loss": 1.3973, "learning_rate": 4.35e-05, "epoch": 0.09955372468245795, "percentage": 9.96, "elapsed_time": "1:03:41", "remaining_time": "9:36:06", "throughput": 1864.89, "total_tokens": 7127040} +{"current_steps": 880, "total_steps": 8739, "loss": 1.3936, "learning_rate": 4.4000000000000006e-05, "epoch": 0.10069802036846322, "percentage": 10.07, "elapsed_time": "1:04:25", "remaining_time": "9:35:21", "throughput": 1864.98, "total_tokens": 7208960} +{"current_steps": 890, "total_steps": 8739, "loss": 1.2224, "learning_rate": 4.4500000000000004e-05, "epoch": 0.10184231605446847, "percentage": 10.18, "elapsed_time": "1:05:09", "remaining_time": "9:34:38", "throughput": 1864.92, "total_tokens": 7290880} +{"current_steps": 900, "total_steps": 8739, "loss": 1.0594, "learning_rate": 4.5e-05, "epoch": 0.10298661174047374, "percentage": 10.3, "elapsed_time": "1:05:53", "remaining_time": "9:33:54", "throughput": 1864.92, "total_tokens": 7372800} +{"current_steps": 910, "total_steps": 8739, "loss": 1.122, "learning_rate": 4.55e-05, "epoch": 0.104130907426479, "percentage": 10.41, "elapsed_time": "1:06:37", "remaining_time": "9:33:10", "throughput": 1864.91, "total_tokens": 7454720} +{"current_steps": 920, "total_steps": 8739, "loss": 1.2711, "learning_rate": 4.600000000000001e-05, "epoch": 0.10527520311248427, "percentage": 10.53, "elapsed_time": "1:07:21", "remaining_time": "9:32:26", "throughput": 1864.93, "total_tokens": 7536640} +{"current_steps": 930, "total_steps": 8739, "loss": 1.3302, "learning_rate": 4.6500000000000005e-05, "epoch": 0.10641949879848953, "percentage": 10.64, "elapsed_time": "1:08:05", "remaining_time": "9:31:41", "throughput": 1864.97, "total_tokens": 7618560} +{"current_steps": 940, "total_steps": 8739, "loss": 1.2869, "learning_rate": 4.7e-05, "epoch": 0.1075637944844948, "percentage": 10.76, "elapsed_time": "1:08:48", "remaining_time": "9:30:56", "throughput": 1865.02, "total_tokens": 7700480} +{"current_steps": 950, "total_steps": 8739, "loss": 1.2435, "learning_rate": 4.75e-05, "epoch": 0.10870809017050005, "percentage": 10.87, "elapsed_time": "1:09:32", "remaining_time": "9:30:11", "throughput": 1865.12, "total_tokens": 7782400} +{"current_steps": 960, "total_steps": 8739, "loss": 1.0464, "learning_rate": 4.8e-05, "epoch": 0.10985238585650532, "percentage": 10.99, "elapsed_time": "1:10:16", "remaining_time": "9:29:24", "throughput": 1865.25, "total_tokens": 7864320} +{"current_steps": 970, "total_steps": 8739, "loss": 1.2715, "learning_rate": 4.85e-05, "epoch": 0.11099668154251058, "percentage": 11.1, "elapsed_time": "1:11:00", "remaining_time": "9:28:39", "throughput": 1865.31, "total_tokens": 7946240} +{"current_steps": 980, "total_steps": 8739, "loss": 1.4746, "learning_rate": 4.9e-05, "epoch": 0.11214097722851585, "percentage": 11.21, "elapsed_time": "1:11:43", "remaining_time": "9:27:54", "throughput": 1865.38, "total_tokens": 8028160} +{"current_steps": 990, "total_steps": 8739, "loss": 1.1464, "learning_rate": 4.9500000000000004e-05, "epoch": 0.11328527291452112, "percentage": 11.33, "elapsed_time": "1:12:27", "remaining_time": "9:27:08", "throughput": 1865.51, "total_tokens": 8110080} +{"current_steps": 1000, "total_steps": 8739, "loss": 1.3901, "learning_rate": 5e-05, "epoch": 0.11442956860052637, "percentage": 11.44, "elapsed_time": "1:13:11", "remaining_time": "9:26:22", "throughput": 1865.61, "total_tokens": 8192000} +{"current_steps": 1010, "total_steps": 8739, "loss": 1.3986, "learning_rate": 4.999979401316311e-05, "epoch": 0.11557386428653164, "percentage": 11.56, "elapsed_time": "1:14:11", "remaining_time": "9:27:47", "throughput": 1858.55, "total_tokens": 8273920} +{"current_steps": 1020, "total_steps": 8739, "loss": 1.3841, "learning_rate": 4.999917605604688e-05, "epoch": 0.1167181599725369, "percentage": 11.67, "elapsed_time": "1:14:55", "remaining_time": "9:27:02", "throughput": 1858.62, "total_tokens": 8355840} +{"current_steps": 1030, "total_steps": 8739, "loss": 1.6034, "learning_rate": 4.999814613883459e-05, "epoch": 0.11786245565854217, "percentage": 11.79, "elapsed_time": "1:15:39", "remaining_time": "9:26:16", "throughput": 1858.71, "total_tokens": 8437760} +{"current_steps": 1040, "total_steps": 8739, "loss": 1.5685, "learning_rate": 4.9996704278498185e-05, "epoch": 0.11900675134454743, "percentage": 11.9, "elapsed_time": "1:16:23", "remaining_time": "9:25:31", "throughput": 1858.73, "total_tokens": 8519680} +{"current_steps": 1050, "total_steps": 8739, "loss": 1.4407, "learning_rate": 4.9994850498798026e-05, "epoch": 0.1201510470305527, "percentage": 12.02, "elapsed_time": "1:17:07", "remaining_time": "9:24:46", "throughput": 1858.82, "total_tokens": 8601600} +{"current_steps": 1060, "total_steps": 8739, "loss": 1.2713, "learning_rate": 4.999258483028243e-05, "epoch": 0.12129534271655795, "percentage": 12.13, "elapsed_time": "1:17:51", "remaining_time": "9:24:00", "throughput": 1858.93, "total_tokens": 8683520} +{"current_steps": 1070, "total_steps": 8739, "loss": 1.2696, "learning_rate": 4.9989907310287243e-05, "epoch": 0.12243963840256322, "percentage": 12.24, "elapsed_time": "1:18:34", "remaining_time": "9:23:13", "throughput": 1859.06, "total_tokens": 8765440} +{"current_steps": 1080, "total_steps": 8739, "loss": 1.1279, "learning_rate": 4.998681798293516e-05, "epoch": 0.12358393408856849, "percentage": 12.36, "elapsed_time": "1:19:18", "remaining_time": "9:22:28", "throughput": 1859.13, "total_tokens": 8847360} +{"current_steps": 1090, "total_steps": 8739, "loss": 1.3104, "learning_rate": 4.998331689913506e-05, "epoch": 0.12472822977457375, "percentage": 12.47, "elapsed_time": "1:20:02", "remaining_time": "9:21:41", "throughput": 1859.31, "total_tokens": 8929280} +{"current_steps": 1100, "total_steps": 8739, "loss": 1.2877, "learning_rate": 4.9979404116581104e-05, "epoch": 0.125872525460579, "percentage": 12.59, "elapsed_time": "1:20:46", "remaining_time": "9:20:55", "throughput": 1859.39, "total_tokens": 9011200} +{"current_steps": 1110, "total_steps": 8739, "loss": 1.2768, "learning_rate": 4.9975079699751825e-05, "epoch": 0.12701682114658427, "percentage": 12.7, "elapsed_time": "1:21:30", "remaining_time": "9:20:09", "throughput": 1859.49, "total_tokens": 9093120} +{"current_steps": 1120, "total_steps": 8739, "loss": 1.5502, "learning_rate": 4.997034371990907e-05, "epoch": 0.12816111683258954, "percentage": 12.82, "elapsed_time": "1:22:13", "remaining_time": "9:19:22", "throughput": 1859.63, "total_tokens": 9175040} +{"current_steps": 1130, "total_steps": 8739, "loss": 1.3732, "learning_rate": 4.99651962550968e-05, "epoch": 0.12930541251859481, "percentage": 12.93, "elapsed_time": "1:22:57", "remaining_time": "9:18:38", "throughput": 1859.65, "total_tokens": 9256960} +{"current_steps": 1140, "total_steps": 8739, "loss": 1.1296, "learning_rate": 4.9959637390139814e-05, "epoch": 0.13044970820460006, "percentage": 13.04, "elapsed_time": "1:23:41", "remaining_time": "9:17:52", "throughput": 1859.75, "total_tokens": 9338880} +{"current_steps": 1150, "total_steps": 8739, "loss": 1.1064, "learning_rate": 4.995366721664234e-05, "epoch": 0.13159400389060533, "percentage": 13.16, "elapsed_time": "1:24:25", "remaining_time": "9:17:06", "throughput": 1859.85, "total_tokens": 9420800} +{"current_steps": 1160, "total_steps": 8739, "loss": 1.3228, "learning_rate": 4.9947285832986553e-05, "epoch": 0.1327382995766106, "percentage": 13.27, "elapsed_time": "1:25:08", "remaining_time": "9:16:20", "throughput": 1860.0, "total_tokens": 9502720} +{"current_steps": 1170, "total_steps": 8739, "loss": 1.3161, "learning_rate": 4.994049334433095e-05, "epoch": 0.13388259526261587, "percentage": 13.39, "elapsed_time": "1:25:52", "remaining_time": "9:15:35", "throughput": 1860.02, "total_tokens": 9584640} +{"current_steps": 1180, "total_steps": 8739, "loss": 1.4789, "learning_rate": 4.9933289862608584e-05, "epoch": 0.13502689094862114, "percentage": 13.5, "elapsed_time": "1:26:36", "remaining_time": "9:14:51", "throughput": 1860.05, "total_tokens": 9666560} +{"current_steps": 1190, "total_steps": 8739, "loss": 1.3033, "learning_rate": 4.992567550652525e-05, "epoch": 0.13617118663462638, "percentage": 13.62, "elapsed_time": "1:27:20", "remaining_time": "9:14:05", "throughput": 1860.13, "total_tokens": 9748480} +{"current_steps": 1200, "total_steps": 8739, "loss": 1.1661, "learning_rate": 4.9917650401557505e-05, "epoch": 0.13731548232063165, "percentage": 13.73, "elapsed_time": "1:28:04", "remaining_time": "9:13:19", "throughput": 1860.26, "total_tokens": 9830400} +{"current_steps": 1210, "total_steps": 8739, "loss": 1.3148, "learning_rate": 4.990921467995064e-05, "epoch": 0.13845977800663692, "percentage": 13.85, "elapsed_time": "1:28:48", "remaining_time": "9:12:33", "throughput": 1860.34, "total_tokens": 9912320} +{"current_steps": 1220, "total_steps": 8739, "loss": 1.186, "learning_rate": 4.9900368480716466e-05, "epoch": 0.1396040736926422, "percentage": 13.96, "elapsed_time": "1:29:32", "remaining_time": "9:11:49", "throughput": 1860.37, "total_tokens": 9994240} +{"current_steps": 1230, "total_steps": 8739, "loss": 1.0854, "learning_rate": 4.9891111949631023e-05, "epoch": 0.14074836937864743, "percentage": 14.07, "elapsed_time": "1:30:15", "remaining_time": "9:11:02", "throughput": 1860.5, "total_tokens": 10076160} +{"current_steps": 1240, "total_steps": 8739, "loss": 1.2775, "learning_rate": 4.988144523923221e-05, "epoch": 0.1418926650646527, "percentage": 14.19, "elapsed_time": "1:30:59", "remaining_time": "9:10:18", "throughput": 1860.53, "total_tokens": 10158080} +{"current_steps": 1250, "total_steps": 8739, "loss": 1.3006, "learning_rate": 4.987136850881721e-05, "epoch": 0.14303696075065797, "percentage": 14.3, "elapsed_time": "1:31:43", "remaining_time": "9:09:33", "throughput": 1860.56, "total_tokens": 10240000} +{"current_steps": 1260, "total_steps": 8739, "loss": 1.0796, "learning_rate": 4.986088192443995e-05, "epoch": 0.14418125643666324, "percentage": 14.42, "elapsed_time": "1:32:27", "remaining_time": "9:08:50", "throughput": 1860.53, "total_tokens": 10321920} +{"current_steps": 1270, "total_steps": 8739, "loss": 1.2881, "learning_rate": 4.9849985658908296e-05, "epoch": 0.1453255521226685, "percentage": 14.53, "elapsed_time": "1:33:11", "remaining_time": "9:08:05", "throughput": 1860.58, "total_tokens": 10403840} +{"current_steps": 1280, "total_steps": 8739, "loss": 1.2889, "learning_rate": 4.9838679891781214e-05, "epoch": 0.14646984780867375, "percentage": 14.65, "elapsed_time": "1:33:55", "remaining_time": "9:07:19", "throughput": 1860.71, "total_tokens": 10485760} +{"current_steps": 1290, "total_steps": 8739, "loss": 1.0391, "learning_rate": 4.982696480936586e-05, "epoch": 0.14761414349467902, "percentage": 14.76, "elapsed_time": "1:34:39", "remaining_time": "9:06:36", "throughput": 1860.65, "total_tokens": 10567680} +{"current_steps": 1300, "total_steps": 8739, "loss": 1.0809, "learning_rate": 4.981484060471444e-05, "epoch": 0.1487584391806843, "percentage": 14.88, "elapsed_time": "1:35:23", "remaining_time": "9:05:51", "throughput": 1860.66, "total_tokens": 10649600} +{"current_steps": 1310, "total_steps": 8739, "loss": 1.1128, "learning_rate": 4.9802307477621084e-05, "epoch": 0.14990273486668956, "percentage": 14.99, "elapsed_time": "1:36:07", "remaining_time": "9:05:05", "throughput": 1860.78, "total_tokens": 10731520} +{"current_steps": 1320, "total_steps": 8739, "loss": 1.2888, "learning_rate": 4.978936563461854e-05, "epoch": 0.1510470305526948, "percentage": 15.1, "elapsed_time": "1:36:50", "remaining_time": "9:04:20", "throughput": 1860.87, "total_tokens": 10813440} +{"current_steps": 1330, "total_steps": 8739, "loss": 1.3032, "learning_rate": 4.9776015288974736e-05, "epoch": 0.15219132623870008, "percentage": 15.22, "elapsed_time": "1:37:34", "remaining_time": "9:03:35", "throughput": 1860.9, "total_tokens": 10895360} +{"current_steps": 1340, "total_steps": 8739, "loss": 0.9843, "learning_rate": 4.976225666068932e-05, "epoch": 0.15333562192470535, "percentage": 15.33, "elapsed_time": "1:38:18", "remaining_time": "9:02:50", "throughput": 1860.99, "total_tokens": 10977280} +{"current_steps": 1350, "total_steps": 8739, "loss": 1.3003, "learning_rate": 4.9748089976489996e-05, "epoch": 0.15447991761071062, "percentage": 15.45, "elapsed_time": "1:39:02", "remaining_time": "9:02:05", "throughput": 1861.05, "total_tokens": 11059200} +{"current_steps": 1360, "total_steps": 8739, "loss": 1.4718, "learning_rate": 4.9733515469828795e-05, "epoch": 0.15562421329671586, "percentage": 15.56, "elapsed_time": "1:39:46", "remaining_time": "9:01:20", "throughput": 1861.08, "total_tokens": 11141120} +{"current_steps": 1370, "total_steps": 8739, "loss": 1.3703, "learning_rate": 4.971853338087825e-05, "epoch": 0.15676850898272113, "percentage": 15.68, "elapsed_time": "1:40:30", "remaining_time": "9:00:35", "throughput": 1861.11, "total_tokens": 11223040} +{"current_steps": 1380, "total_steps": 8739, "loss": 1.0876, "learning_rate": 4.97031439565274e-05, "epoch": 0.1579128046687264, "percentage": 15.79, "elapsed_time": "1:41:14", "remaining_time": "8:59:50", "throughput": 1861.17, "total_tokens": 11304960} +{"current_steps": 1390, "total_steps": 8739, "loss": 1.2873, "learning_rate": 4.9687347450377755e-05, "epoch": 0.15905710035473167, "percentage": 15.91, "elapsed_time": "1:41:57", "remaining_time": "8:59:05", "throughput": 1861.27, "total_tokens": 11386880} +{"current_steps": 1400, "total_steps": 8739, "loss": 1.4622, "learning_rate": 4.9671144122739106e-05, "epoch": 0.16020139604073694, "percentage": 16.02, "elapsed_time": "1:42:41", "remaining_time": "8:58:20", "throughput": 1861.32, "total_tokens": 11468800} +{"current_steps": 1410, "total_steps": 8739, "loss": 1.0993, "learning_rate": 4.9654534240625225e-05, "epoch": 0.16134569172674218, "percentage": 16.13, "elapsed_time": "1:43:25", "remaining_time": "8:57:35", "throughput": 1861.35, "total_tokens": 11550720} +{"current_steps": 1420, "total_steps": 8739, "loss": 1.156, "learning_rate": 4.9637518077749476e-05, "epoch": 0.16248998741274745, "percentage": 16.25, "elapsed_time": "1:44:09", "remaining_time": "8:56:49", "throughput": 1861.45, "total_tokens": 11632640} +{"current_steps": 1430, "total_steps": 8739, "loss": 1.266, "learning_rate": 4.962009591452032e-05, "epoch": 0.16363428309875272, "percentage": 16.36, "elapsed_time": "1:44:53", "remaining_time": "8:56:06", "throughput": 1861.42, "total_tokens": 11714560} +{"current_steps": 1440, "total_steps": 8739, "loss": 1.2794, "learning_rate": 4.960226803803664e-05, "epoch": 0.164778578784758, "percentage": 16.48, "elapsed_time": "1:45:37", "remaining_time": "8:55:21", "throughput": 1861.45, "total_tokens": 11796480} +{"current_steps": 1450, "total_steps": 8739, "loss": 1.2099, "learning_rate": 4.958403474208308e-05, "epoch": 0.16592287447076323, "percentage": 16.59, "elapsed_time": "1:46:21", "remaining_time": "8:54:38", "throughput": 1861.41, "total_tokens": 11878400} +{"current_steps": 1460, "total_steps": 8739, "loss": 1.3631, "learning_rate": 4.9565396327125155e-05, "epoch": 0.1670671701567685, "percentage": 16.71, "elapsed_time": "1:47:05", "remaining_time": "8:53:53", "throughput": 1861.48, "total_tokens": 11960320} +{"current_steps": 1470, "total_steps": 8739, "loss": 1.1778, "learning_rate": 4.95463531003043e-05, "epoch": 0.16821146584277377, "percentage": 16.82, "elapsed_time": "1:47:49", "remaining_time": "8:53:08", "throughput": 1861.51, "total_tokens": 12042240} +{"current_steps": 1480, "total_steps": 8739, "loss": 1.3796, "learning_rate": 4.952690537543287e-05, "epoch": 0.16935576152877904, "percentage": 16.94, "elapsed_time": "1:48:33", "remaining_time": "8:52:24", "throughput": 1861.51, "total_tokens": 12124160} +{"current_steps": 1490, "total_steps": 8739, "loss": 1.2806, "learning_rate": 4.9507053472988867e-05, "epoch": 0.1705000572147843, "percentage": 17.05, "elapsed_time": "1:49:16", "remaining_time": "8:51:39", "throughput": 1861.58, "total_tokens": 12206080} +{"current_steps": 1500, "total_steps": 8739, "loss": 1.3344, "learning_rate": 4.9486797720110746e-05, "epoch": 0.17164435290078955, "percentage": 17.16, "elapsed_time": "1:50:00", "remaining_time": "8:50:54", "throughput": 1861.66, "total_tokens": 12288000} +{"current_steps": 1510, "total_steps": 8739, "loss": 1.2448, "learning_rate": 4.946613845059199e-05, "epoch": 0.17278864858679482, "percentage": 17.28, "elapsed_time": "1:50:44", "remaining_time": "8:50:10", "throughput": 1861.65, "total_tokens": 12369920} +{"current_steps": 1520, "total_steps": 8739, "loss": 1.2916, "learning_rate": 4.9445076004875596e-05, "epoch": 0.1739329442728001, "percentage": 17.39, "elapsed_time": "1:51:28", "remaining_time": "8:49:26", "throughput": 1861.63, "total_tokens": 12451840} +{"current_steps": 1530, "total_steps": 8739, "loss": 1.3731, "learning_rate": 4.9423610730048495e-05, "epoch": 0.17507723995880536, "percentage": 17.51, "elapsed_time": "1:52:12", "remaining_time": "8:48:41", "throughput": 1861.69, "total_tokens": 12533760} +{"current_steps": 1540, "total_steps": 8739, "loss": 1.3654, "learning_rate": 4.940174297983581e-05, "epoch": 0.1762215356448106, "percentage": 17.62, "elapsed_time": "1:52:56", "remaining_time": "8:47:57", "throughput": 1861.72, "total_tokens": 12615680} +{"current_steps": 1550, "total_steps": 8739, "loss": 1.2584, "learning_rate": 4.937947311459503e-05, "epoch": 0.17736583133081588, "percentage": 17.74, "elapsed_time": "1:53:40", "remaining_time": "8:47:12", "throughput": 1861.75, "total_tokens": 12697600} +{"current_steps": 1560, "total_steps": 8739, "loss": 1.372, "learning_rate": 4.9356801501310105e-05, "epoch": 0.17851012701682115, "percentage": 17.85, "elapsed_time": "1:54:24", "remaining_time": "8:46:28", "throughput": 1861.76, "total_tokens": 12779520} +{"current_steps": 1570, "total_steps": 8739, "loss": 1.562, "learning_rate": 4.933372851358532e-05, "epoch": 0.17965442270282642, "percentage": 17.97, "elapsed_time": "1:55:07", "remaining_time": "8:45:43", "throughput": 1861.84, "total_tokens": 12861440} +{"current_steps": 1580, "total_steps": 8739, "loss": 1.2423, "learning_rate": 4.9310254531639235e-05, "epoch": 0.1807987183888317, "percentage": 18.08, "elapsed_time": "1:55:51", "remaining_time": "8:44:58", "throughput": 1861.9, "total_tokens": 12943360} +{"current_steps": 1590, "total_steps": 8739, "loss": 1.3979, "learning_rate": 4.928637994229834e-05, "epoch": 0.18194301407483693, "percentage": 18.19, "elapsed_time": "1:56:35", "remaining_time": "8:44:14", "throughput": 1861.88, "total_tokens": 13025280} +{"current_steps": 1600, "total_steps": 8739, "loss": 1.3811, "learning_rate": 4.9262105138990745e-05, "epoch": 0.1830873097608422, "percentage": 18.31, "elapsed_time": "1:57:19", "remaining_time": "8:43:30", "throughput": 1861.89, "total_tokens": 13107200} +{"current_steps": 1610, "total_steps": 8739, "loss": 1.4006, "learning_rate": 4.9237430521739626e-05, "epoch": 0.18423160544684747, "percentage": 18.42, "elapsed_time": "1:58:03", "remaining_time": "8:42:46", "throughput": 1861.86, "total_tokens": 13189120} +{"current_steps": 1620, "total_steps": 8739, "loss": 1.2214, "learning_rate": 4.92123564971567e-05, "epoch": 0.18537590113285274, "percentage": 18.54, "elapsed_time": "1:58:47", "remaining_time": "8:42:02", "throughput": 1861.9, "total_tokens": 13271040} +{"current_steps": 1630, "total_steps": 8739, "loss": 1.2192, "learning_rate": 4.918688347843549e-05, "epoch": 0.18652019681885798, "percentage": 18.65, "elapsed_time": "1:59:31", "remaining_time": "8:41:18", "throughput": 1861.89, "total_tokens": 13352960} +{"current_steps": 1640, "total_steps": 8739, "loss": 1.4384, "learning_rate": 4.916101188534452e-05, "epoch": 0.18766449250486325, "percentage": 18.77, "elapsed_time": "2:00:15", "remaining_time": "8:40:32", "throughput": 1861.98, "total_tokens": 13434880} +{"current_steps": 1650, "total_steps": 8739, "loss": 1.2473, "learning_rate": 4.9134742144220394e-05, "epoch": 0.18880878819086852, "percentage": 18.88, "elapsed_time": "2:00:59", "remaining_time": "8:39:47", "throughput": 1862.06, "total_tokens": 13516800} +{"current_steps": 1660, "total_steps": 8739, "loss": 1.277, "learning_rate": 4.910807468796079e-05, "epoch": 0.1899530838768738, "percentage": 19.0, "elapsed_time": "2:01:42", "remaining_time": "8:39:02", "throughput": 1862.15, "total_tokens": 13598720} +{"current_steps": 1670, "total_steps": 8739, "loss": 1.31, "learning_rate": 4.90810099560173e-05, "epoch": 0.19109737956287906, "percentage": 19.11, "elapsed_time": "2:02:26", "remaining_time": "8:38:17", "throughput": 1862.19, "total_tokens": 13680640} +{"current_steps": 1680, "total_steps": 8739, "loss": 1.2949, "learning_rate": 4.90535483943882e-05, "epoch": 0.1922416752488843, "percentage": 19.22, "elapsed_time": "2:03:10", "remaining_time": "8:37:32", "throughput": 1862.23, "total_tokens": 13762560} +{"current_steps": 1690, "total_steps": 8739, "loss": 1.3735, "learning_rate": 4.902569045561113e-05, "epoch": 0.19338597093488957, "percentage": 19.34, "elapsed_time": "2:03:54", "remaining_time": "8:36:49", "throughput": 1862.19, "total_tokens": 13844480} +{"current_steps": 1700, "total_steps": 8739, "loss": 1.2904, "learning_rate": 4.899743659875556e-05, "epoch": 0.19453026662089484, "percentage": 19.45, "elapsed_time": "2:05:51", "remaining_time": "8:41:07", "throughput": 1844.17, "total_tokens": 13926400} +{"current_steps": 1710, "total_steps": 8739, "loss": 1.3387, "learning_rate": 4.896878728941531e-05, "epoch": 0.1956745623069001, "percentage": 19.57, "elapsed_time": "2:07:42", "remaining_time": "8:44:57", "throughput": 1828.13, "total_tokens": 14008320} +{"current_steps": 1720, "total_steps": 8739, "loss": 1.1596, "learning_rate": 4.893974299970082e-05, "epoch": 0.19681885799290535, "percentage": 19.68, "elapsed_time": "2:08:40", "remaining_time": "8:45:06", "throughput": 1825.01, "total_tokens": 14090240} +{"current_steps": 1730, "total_steps": 8739, "loss": 1.296, "learning_rate": 4.891030420823142e-05, "epoch": 0.19796315367891062, "percentage": 19.8, "elapsed_time": "2:09:39", "remaining_time": "8:45:17", "throughput": 1821.77, "total_tokens": 14172160} +{"current_steps": 1740, "total_steps": 8739, "loss": 1.3196, "learning_rate": 4.888047140012737e-05, "epoch": 0.1991074493649159, "percentage": 19.91, "elapsed_time": "2:10:36", "remaining_time": "8:45:22", "throughput": 1818.9, "total_tokens": 14254080} +{"current_steps": 1750, "total_steps": 8739, "loss": 1.1085, "learning_rate": 4.885024506700195e-05, "epoch": 0.20025174505092116, "percentage": 20.03, "elapsed_time": "2:11:34", "remaining_time": "8:45:28", "throughput": 1815.91, "total_tokens": 14336000} +{"current_steps": 1760, "total_steps": 8739, "loss": 1.3757, "learning_rate": 4.8819625706953286e-05, "epoch": 0.20139604073692643, "percentage": 20.14, "elapsed_time": "2:12:33", "remaining_time": "8:45:36", "throughput": 1812.86, "total_tokens": 14417920} +{"current_steps": 1770, "total_steps": 8739, "loss": 1.1697, "learning_rate": 4.8788613824556194e-05, "epoch": 0.20254033642293168, "percentage": 20.25, "elapsed_time": "2:13:31", "remaining_time": "8:45:41", "throughput": 1809.98, "total_tokens": 14499840} +{"current_steps": 1780, "total_steps": 8739, "loss": 1.2916, "learning_rate": 4.875720993085384e-05, "epoch": 0.20368463210893695, "percentage": 20.37, "elapsed_time": "2:14:28", "remaining_time": "8:45:42", "throughput": 1807.33, "total_tokens": 14581760} +{"current_steps": 1790, "total_steps": 8739, "loss": 1.1496, "learning_rate": 4.8725414543349326e-05, "epoch": 0.20482892779494222, "percentage": 20.48, "elapsed_time": "2:15:25", "remaining_time": "8:45:44", "throughput": 1804.62, "total_tokens": 14663680} +{"current_steps": 1800, "total_steps": 8739, "loss": 1.265, "learning_rate": 4.869322818599714e-05, "epoch": 0.2059732234809475, "percentage": 20.6, "elapsed_time": "2:16:23", "remaining_time": "8:45:48", "throughput": 1801.81, "total_tokens": 14745600} +{"current_steps": 1810, "total_steps": 8739, "loss": 1.293, "learning_rate": 4.8660651389194576e-05, "epoch": 0.20711751916695273, "percentage": 20.71, "elapsed_time": "2:17:20", "remaining_time": "8:45:47", "throughput": 1799.27, "total_tokens": 14827520} +{"current_steps": 1820, "total_steps": 8739, "loss": 1.3073, "learning_rate": 4.862768468977293e-05, "epoch": 0.208261814852958, "percentage": 20.83, "elapsed_time": "2:18:18", "remaining_time": "8:45:48", "throughput": 1796.63, "total_tokens": 14909440} +{"current_steps": 1830, "total_steps": 8739, "loss": 1.171, "learning_rate": 4.8594328630988696e-05, "epoch": 0.20940611053896327, "percentage": 20.94, "elapsed_time": "2:19:16", "remaining_time": "8:45:49", "throughput": 1793.98, "total_tokens": 14991360} +{"current_steps": 1840, "total_steps": 8739, "loss": 1.2818, "learning_rate": 4.8560583762514594e-05, "epoch": 0.21055040622496854, "percentage": 21.06, "elapsed_time": "2:20:14", "remaining_time": "8:45:49", "throughput": 1791.39, "total_tokens": 15073280} +{"current_steps": 1850, "total_steps": 8739, "loss": 1.0901, "learning_rate": 4.852645064043053e-05, "epoch": 0.2116947019109738, "percentage": 21.17, "elapsed_time": "2:21:11", "remaining_time": "8:45:46", "throughput": 1788.94, "total_tokens": 15155200} +{"current_steps": 1860, "total_steps": 8739, "loss": 1.2341, "learning_rate": 4.84919298272144e-05, "epoch": 0.21283899759697905, "percentage": 21.28, "elapsed_time": "2:22:09", "remaining_time": "8:45:44", "throughput": 1786.45, "total_tokens": 15237120} +{"current_steps": 1870, "total_steps": 8739, "loss": 1.415, "learning_rate": 4.8457021891732866e-05, "epoch": 0.21398329328298432, "percentage": 21.4, "elapsed_time": "2:23:07", "remaining_time": "8:45:45", "throughput": 1783.78, "total_tokens": 15319040} +{"current_steps": 1880, "total_steps": 8739, "loss": 1.5628, "learning_rate": 4.842172740923194e-05, "epoch": 0.2151275889689896, "percentage": 21.51, "elapsed_time": "2:24:06", "remaining_time": "8:45:44", "throughput": 1781.25, "total_tokens": 15400960} +{"current_steps": 1890, "total_steps": 8739, "loss": 1.4214, "learning_rate": 4.838604696132753e-05, "epoch": 0.21627188465499486, "percentage": 21.63, "elapsed_time": "2:25:03", "remaining_time": "8:45:40", "throughput": 1778.88, "total_tokens": 15482880} +{"current_steps": 1900, "total_steps": 8739, "loss": 1.2436, "learning_rate": 4.8349981135995826e-05, "epoch": 0.2174161803410001, "percentage": 21.74, "elapsed_time": "2:26:01", "remaining_time": "8:45:35", "throughput": 1776.56, "total_tokens": 15564800} +{"current_steps": 1910, "total_steps": 8739, "loss": 1.3363, "learning_rate": 4.831353052756367e-05, "epoch": 0.21856047602700537, "percentage": 21.86, "elapsed_time": "2:26:58", "remaining_time": "8:45:30", "throughput": 1774.24, "total_tokens": 15646720} +{"current_steps": 1920, "total_steps": 8739, "loss": 1.3984, "learning_rate": 4.8276695736698704e-05, "epoch": 0.21970477171301064, "percentage": 21.97, "elapsed_time": "2:27:53", "remaining_time": "8:45:16", "throughput": 1772.46, "total_tokens": 15728640} +{"current_steps": 1930, "total_steps": 8739, "loss": 1.2282, "learning_rate": 4.823947737039948e-05, "epoch": 0.2208490673990159, "percentage": 22.08, "elapsed_time": "2:28:49", "remaining_time": "8:45:04", "throughput": 1770.52, "total_tokens": 15810560} +{"current_steps": 1940, "total_steps": 8739, "loss": 1.32, "learning_rate": 4.8201876041985496e-05, "epoch": 0.22199336308502116, "percentage": 22.2, "elapsed_time": "2:29:45", "remaining_time": "8:44:49", "throughput": 1768.75, "total_tokens": 15892480} +{"current_steps": 1950, "total_steps": 8739, "loss": 1.2447, "learning_rate": 4.8163892371087045e-05, "epoch": 0.22313765877102643, "percentage": 22.31, "elapsed_time": "2:30:40", "remaining_time": "8:44:34", "throughput": 1767.0, "total_tokens": 15974400} +{"current_steps": 1960, "total_steps": 8739, "loss": 1.1607, "learning_rate": 4.812552698363502e-05, "epoch": 0.2242819544570317, "percentage": 22.43, "elapsed_time": "2:31:35", "remaining_time": "8:44:19", "throughput": 1765.24, "total_tokens": 16056320} +{"current_steps": 1970, "total_steps": 8739, "loss": 1.3617, "learning_rate": 4.8086780511850606e-05, "epoch": 0.22542625014303697, "percentage": 22.54, "elapsed_time": "2:32:31", "remaining_time": "8:44:03", "throughput": 1763.53, "total_tokens": 16138240} +{"current_steps": 1980, "total_steps": 8739, "loss": 1.1251, "learning_rate": 4.8047653594234855e-05, "epoch": 0.22657054582904224, "percentage": 22.66, "elapsed_time": "2:33:25", "remaining_time": "8:43:44", "throughput": 1761.99, "total_tokens": 16220160} +{"current_steps": 1990, "total_steps": 8739, "loss": 1.193, "learning_rate": 4.800814687555817e-05, "epoch": 0.22771484151504748, "percentage": 22.77, "elapsed_time": "2:34:18", "remaining_time": "8:43:21", "throughput": 1760.7, "total_tokens": 16302080} +{"current_steps": 2000, "total_steps": 8739, "loss": 1.1411, "learning_rate": 4.796826100684967e-05, "epoch": 0.22885913720105275, "percentage": 22.89, "elapsed_time": "2:35:11", "remaining_time": "8:42:56", "throughput": 1759.47, "total_tokens": 16384000} +{"current_steps": 2010, "total_steps": 8739, "loss": 1.2578, "learning_rate": 4.7927996645386476e-05, "epoch": 0.23000343288705802, "percentage": 23.0, "elapsed_time": "2:36:18", "remaining_time": "8:43:18", "throughput": 1755.63, "total_tokens": 16465920} +{"current_steps": 2020, "total_steps": 8739, "loss": 1.1249, "learning_rate": 4.7887354454682854e-05, "epoch": 0.2311477285730633, "percentage": 23.11, "elapsed_time": "2:37:12", "remaining_time": "8:42:53", "throughput": 1754.4, "total_tokens": 16547840} +{"current_steps": 2030, "total_steps": 8739, "loss": 1.1754, "learning_rate": 4.784633510447932e-05, "epoch": 0.23229202425906853, "percentage": 23.23, "elapsed_time": "2:38:05", "remaining_time": "8:42:29", "throughput": 1753.12, "total_tokens": 16629760} +{"current_steps": 2040, "total_steps": 8739, "loss": 1.2965, "learning_rate": 4.7804939270731564e-05, "epoch": 0.2334363199450738, "percentage": 23.34, "elapsed_time": "2:38:59", "remaining_time": "8:42:04", "throughput": 1751.92, "total_tokens": 16711680} +{"current_steps": 2050, "total_steps": 8739, "loss": 1.2211, "learning_rate": 4.776316763559933e-05, "epoch": 0.23458061563107907, "percentage": 23.46, "elapsed_time": "2:39:52", "remaining_time": "8:41:39", "throughput": 1750.68, "total_tokens": 16793600} +{"current_steps": 2060, "total_steps": 8739, "loss": 1.0741, "learning_rate": 4.7721020887435186e-05, "epoch": 0.23572491131708434, "percentage": 23.57, "elapsed_time": "2:40:45", "remaining_time": "8:41:14", "throughput": 1749.49, "total_tokens": 16875520} +{"current_steps": 2070, "total_steps": 8739, "loss": 1.1755, "learning_rate": 4.767849972077315e-05, "epoch": 0.2368692070030896, "percentage": 23.69, "elapsed_time": "2:41:39", "remaining_time": "8:40:48", "throughput": 1748.31, "total_tokens": 16957440} +{"current_steps": 2080, "total_steps": 8739, "loss": 1.2918, "learning_rate": 4.763560483631728e-05, "epoch": 0.23801350268909485, "percentage": 23.8, "elapsed_time": "2:42:32", "remaining_time": "8:40:22", "throughput": 1747.13, "total_tokens": 17039360} +{"current_steps": 2090, "total_steps": 8739, "loss": 1.2861, "learning_rate": 4.75923369409301e-05, "epoch": 0.23915779837510012, "percentage": 23.92, "elapsed_time": "2:43:26", "remaining_time": "8:39:58", "throughput": 1745.87, "total_tokens": 17121280} +{"current_steps": 2100, "total_steps": 8739, "loss": 1.2797, "learning_rate": 4.7548696747620956e-05, "epoch": 0.2403020940611054, "percentage": 24.03, "elapsed_time": "2:44:20", "remaining_time": "8:39:32", "throughput": 1744.71, "total_tokens": 17203200} +{"current_steps": 2110, "total_steps": 8739, "loss": 1.2802, "learning_rate": 4.750468497553429e-05, "epoch": 0.24144638974711066, "percentage": 24.14, "elapsed_time": "2:45:13", "remaining_time": "8:39:05", "throughput": 1743.56, "total_tokens": 17285120} +{"current_steps": 2120, "total_steps": 8739, "loss": 1.2026, "learning_rate": 4.746030234993775e-05, "epoch": 0.2425906854331159, "percentage": 24.26, "elapsed_time": "2:46:07", "remaining_time": "8:38:38", "throughput": 1742.45, "total_tokens": 17367040} +{"current_steps": 2130, "total_steps": 8739, "loss": 1.4968, "learning_rate": 4.741554960221027e-05, "epoch": 0.24373498111912117, "percentage": 24.37, "elapsed_time": "2:47:00", "remaining_time": "8:38:10", "throughput": 1741.38, "total_tokens": 17448960} +{"current_steps": 2140, "total_steps": 8739, "loss": 1.4157, "learning_rate": 4.7370427469830016e-05, "epoch": 0.24487927680512644, "percentage": 24.49, "elapsed_time": "2:47:53", "remaining_time": "8:37:42", "throughput": 1740.31, "total_tokens": 17530880} +{"current_steps": 2150, "total_steps": 8739, "loss": 1.2478, "learning_rate": 4.73249366963622e-05, "epoch": 0.24602357249113171, "percentage": 24.6, "elapsed_time": "2:48:46", "remaining_time": "8:37:13", "throughput": 1739.3, "total_tokens": 17612800} +{"current_steps": 2160, "total_steps": 8739, "loss": 1.4627, "learning_rate": 4.727907803144686e-05, "epoch": 0.24716786817713698, "percentage": 24.72, "elapsed_time": "2:49:39", "remaining_time": "8:36:45", "throughput": 1738.27, "total_tokens": 17694720} +{"current_steps": 2170, "total_steps": 8739, "loss": 1.2206, "learning_rate": 4.723285223078653e-05, "epoch": 0.24831216386314223, "percentage": 24.83, "elapsed_time": "2:50:32", "remaining_time": "8:36:15", "throughput": 1737.26, "total_tokens": 17776640} +{"current_steps": 2180, "total_steps": 8739, "loss": 1.1268, "learning_rate": 4.71862600561337e-05, "epoch": 0.2494564595491475, "percentage": 24.95, "elapsed_time": "2:51:25", "remaining_time": "8:35:47", "throughput": 1736.21, "total_tokens": 17858560} +{"current_steps": 2190, "total_steps": 8739, "loss": 1.0187, "learning_rate": 4.713930227527836e-05, "epoch": 0.25060075523515274, "percentage": 25.06, "elapsed_time": "2:52:19", "remaining_time": "8:35:18", "throughput": 1735.17, "total_tokens": 17940480} +{"current_steps": 2200, "total_steps": 8739, "loss": 0.875, "learning_rate": 4.709197966203528e-05, "epoch": 0.251745050921158, "percentage": 25.17, "elapsed_time": "2:53:13", "remaining_time": "8:34:51", "throughput": 1734.06, "total_tokens": 18022400} +{"current_steps": 2210, "total_steps": 8739, "loss": 1.2277, "learning_rate": 4.704429299623129e-05, "epoch": 0.2528893466071633, "percentage": 25.29, "elapsed_time": "2:54:06", "remaining_time": "8:34:21", "throughput": 1733.11, "total_tokens": 18104320} +{"current_steps": 2220, "total_steps": 8739, "loss": 1.4153, "learning_rate": 4.6996243063692446e-05, "epoch": 0.25403364229316855, "percentage": 25.4, "elapsed_time": "2:54:59", "remaining_time": "8:33:51", "throughput": 1732.1, "total_tokens": 18186240} +{"current_steps": 2230, "total_steps": 8739, "loss": 1.1905, "learning_rate": 4.694783065623102e-05, "epoch": 0.2551779379791738, "percentage": 25.52, "elapsed_time": "2:55:52", "remaining_time": "8:33:21", "throughput": 1731.16, "total_tokens": 18268160} +{"current_steps": 2240, "total_steps": 8739, "loss": 1.363, "learning_rate": 4.68990565716325e-05, "epoch": 0.2563222336651791, "percentage": 25.63, "elapsed_time": "2:56:45", "remaining_time": "8:32:50", "throughput": 1730.23, "total_tokens": 18350080} +{"current_steps": 2250, "total_steps": 8739, "loss": 1.3028, "learning_rate": 4.6849921613642456e-05, "epoch": 0.25746652935118436, "percentage": 25.75, "elapsed_time": "2:57:38", "remaining_time": "8:32:18", "throughput": 1729.34, "total_tokens": 18432000} +{"current_steps": 2260, "total_steps": 8739, "loss": 1.0479, "learning_rate": 4.680042659195325e-05, "epoch": 0.25861082503718963, "percentage": 25.86, "elapsed_time": "2:58:31", "remaining_time": "8:31:48", "throughput": 1728.4, "total_tokens": 18513920} +{"current_steps": 2270, "total_steps": 8739, "loss": 1.4381, "learning_rate": 4.6750572322190716e-05, "epoch": 0.2597551207231949, "percentage": 25.98, "elapsed_time": "2:59:24", "remaining_time": "8:31:17", "throughput": 1727.44, "total_tokens": 18595840} +{"current_steps": 2280, "total_steps": 8739, "loss": 1.1211, "learning_rate": 4.6700359625900724e-05, "epoch": 0.2608994164092001, "percentage": 26.09, "elapsed_time": "3:00:18", "remaining_time": "8:30:46", "throughput": 1726.54, "total_tokens": 18677760} +{"current_steps": 2290, "total_steps": 8739, "loss": 1.1206, "learning_rate": 4.664978933053562e-05, "epoch": 0.2620437120952054, "percentage": 26.2, "elapsed_time": "3:01:11", "remaining_time": "8:30:15", "throughput": 1725.6, "total_tokens": 18759680} +{"current_steps": 2300, "total_steps": 8739, "loss": 1.2446, "learning_rate": 4.659886226944063e-05, "epoch": 0.26318800778121065, "percentage": 26.32, "elapsed_time": "3:02:04", "remaining_time": "8:29:44", "throughput": 1724.66, "total_tokens": 18841600} +{"current_steps": 2310, "total_steps": 8739, "loss": 1.1047, "learning_rate": 4.65475792818401e-05, "epoch": 0.2643323034672159, "percentage": 26.43, "elapsed_time": "3:02:57", "remaining_time": "8:29:12", "throughput": 1723.8, "total_tokens": 18923520} +{"current_steps": 2320, "total_steps": 8739, "loss": 1.175, "learning_rate": 4.6495941212823644e-05, "epoch": 0.2654765991532212, "percentage": 26.55, "elapsed_time": "3:03:51", "remaining_time": "8:28:41", "throughput": 1722.88, "total_tokens": 19005440} +{"current_steps": 2330, "total_steps": 8739, "loss": 1.1473, "learning_rate": 4.644394891333227e-05, "epoch": 0.26662089483922646, "percentage": 26.66, "elapsed_time": "3:04:44", "remaining_time": "8:28:09", "throughput": 1722.0, "total_tokens": 19087360} +{"current_steps": 2340, "total_steps": 8739, "loss": 1.1003, "learning_rate": 4.639160324014433e-05, "epoch": 0.26776519052523173, "percentage": 26.78, "elapsed_time": "3:05:37", "remaining_time": "8:27:36", "throughput": 1721.16, "total_tokens": 19169280} +{"current_steps": 2350, "total_steps": 8739, "loss": 1.5043, "learning_rate": 4.633890505586139e-05, "epoch": 0.268909486211237, "percentage": 26.89, "elapsed_time": "3:06:30", "remaining_time": "8:27:04", "throughput": 1720.3, "total_tokens": 19251200} +{"current_steps": 2360, "total_steps": 8739, "loss": 1.3875, "learning_rate": 4.6285855228894025e-05, "epoch": 0.2700537818972423, "percentage": 27.01, "elapsed_time": "3:07:24", "remaining_time": "8:26:32", "throughput": 1719.38, "total_tokens": 19333120} +{"current_steps": 2370, "total_steps": 8739, "loss": 1.2485, "learning_rate": 4.623245463344753e-05, "epoch": 0.2711980775832475, "percentage": 27.12, "elapsed_time": "3:08:17", "remaining_time": "8:26:00", "throughput": 1718.51, "total_tokens": 19415040} +{"current_steps": 2380, "total_steps": 8739, "loss": 1.6017, "learning_rate": 4.617870414950748e-05, "epoch": 0.27234237326925276, "percentage": 27.23, "elapsed_time": "3:09:11", "remaining_time": "8:25:28", "throughput": 1717.62, "total_tokens": 19496960} +{"current_steps": 2390, "total_steps": 8739, "loss": 1.1282, "learning_rate": 4.612460466282525e-05, "epoch": 0.273486668955258, "percentage": 27.35, "elapsed_time": "3:10:04", "remaining_time": "8:24:55", "throughput": 1716.81, "total_tokens": 19578880} +{"current_steps": 2400, "total_steps": 8739, "loss": 1.1795, "learning_rate": 4.607015706490341e-05, "epoch": 0.2746309646412633, "percentage": 27.46, "elapsed_time": "3:10:57", "remaining_time": "8:24:22", "throughput": 1715.97, "total_tokens": 19660800} +{"current_steps": 2410, "total_steps": 8739, "loss": 1.111, "learning_rate": 4.601536225298104e-05, "epoch": 0.27577526032726857, "percentage": 27.58, "elapsed_time": "3:11:51", "remaining_time": "8:23:49", "throughput": 1715.12, "total_tokens": 19742720} +{"current_steps": 2420, "total_steps": 8739, "loss": 1.1325, "learning_rate": 4.5960221130018946e-05, "epoch": 0.27691955601327384, "percentage": 27.69, "elapsed_time": "3:12:44", "remaining_time": "8:23:15", "throughput": 1714.32, "total_tokens": 19824640} +{"current_steps": 2430, "total_steps": 8739, "loss": 1.2953, "learning_rate": 4.590473460468475e-05, "epoch": 0.2780638516992791, "percentage": 27.81, "elapsed_time": "3:13:37", "remaining_time": "8:22:42", "throughput": 1713.5, "total_tokens": 19906560} +{"current_steps": 2440, "total_steps": 8739, "loss": 1.168, "learning_rate": 4.584890359133797e-05, "epoch": 0.2792081473852844, "percentage": 27.92, "elapsed_time": "3:14:31", "remaining_time": "8:22:09", "throughput": 1712.65, "total_tokens": 19988480} +{"current_steps": 2450, "total_steps": 8739, "loss": 1.3607, "learning_rate": 4.579272901001491e-05, "epoch": 0.28035244307128965, "percentage": 28.04, "elapsed_time": "3:15:24", "remaining_time": "8:21:35", "throughput": 1711.89, "total_tokens": 20070400} +{"current_steps": 2460, "total_steps": 8739, "loss": 1.293, "learning_rate": 4.5736211786413524e-05, "epoch": 0.28149673875729486, "percentage": 28.15, "elapsed_time": "3:16:17", "remaining_time": "8:21:00", "throughput": 1711.14, "total_tokens": 20152320} +{"current_steps": 2470, "total_steps": 8739, "loss": 1.3167, "learning_rate": 4.5679352851878135e-05, "epoch": 0.28264103444330013, "percentage": 28.26, "elapsed_time": "3:17:10", "remaining_time": "8:20:26", "throughput": 1710.33, "total_tokens": 20234240} +{"current_steps": 2480, "total_steps": 8739, "loss": 1.3806, "learning_rate": 4.562215314338411e-05, "epoch": 0.2837853301293054, "percentage": 28.38, "elapsed_time": "3:18:03", "remaining_time": "8:19:52", "throughput": 1709.57, "total_tokens": 20316160} +{"current_steps": 2490, "total_steps": 8739, "loss": 1.0428, "learning_rate": 4.556461360352241e-05, "epoch": 0.28492962581531067, "percentage": 28.49, "elapsed_time": "3:18:56", "remaining_time": "8:19:17", "throughput": 1708.82, "total_tokens": 20398080} +{"current_steps": 2500, "total_steps": 8739, "loss": 1.0979, "learning_rate": 4.550673518048405e-05, "epoch": 0.28607392150131594, "percentage": 28.61, "elapsed_time": "3:19:50", "remaining_time": "8:18:42", "throughput": 1708.09, "total_tokens": 20480000} +{"current_steps": 2510, "total_steps": 8739, "loss": 1.2309, "learning_rate": 4.5448518828044515e-05, "epoch": 0.2872182171873212, "percentage": 28.72, "elapsed_time": "3:20:43", "remaining_time": "8:18:07", "throughput": 1707.35, "total_tokens": 20561920} +{"current_steps": 2520, "total_steps": 8739, "loss": 1.1428, "learning_rate": 4.538996550554798e-05, "epoch": 0.2883625128733265, "percentage": 28.84, "elapsed_time": "3:21:36", "remaining_time": "8:17:31", "throughput": 1706.62, "total_tokens": 20643840} +{"current_steps": 2530, "total_steps": 8739, "loss": 1.5423, "learning_rate": 4.5331076177891527e-05, "epoch": 0.28950680855933175, "percentage": 28.95, "elapsed_time": "3:22:29", "remaining_time": "8:16:56", "throughput": 1705.89, "total_tokens": 20725760} +{"current_steps": 2540, "total_steps": 8739, "loss": 1.31, "learning_rate": 4.527185181550928e-05, "epoch": 0.290651104245337, "percentage": 29.07, "elapsed_time": "3:23:22", "remaining_time": "8:16:20", "throughput": 1705.21, "total_tokens": 20807680} +{"current_steps": 2550, "total_steps": 8739, "loss": 1.0873, "learning_rate": 4.5212293394356356e-05, "epoch": 0.29179539993134224, "percentage": 29.18, "elapsed_time": "3:24:15", "remaining_time": "8:15:45", "throughput": 1704.49, "total_tokens": 20889600} +{"current_steps": 2560, "total_steps": 8739, "loss": 1.1553, "learning_rate": 4.515240189589282e-05, "epoch": 0.2929396956173475, "percentage": 29.29, "elapsed_time": "3:25:08", "remaining_time": "8:15:09", "throughput": 1703.79, "total_tokens": 20971520} +{"current_steps": 2570, "total_steps": 8739, "loss": 1.267, "learning_rate": 4.509217830706749e-05, "epoch": 0.2940839913033528, "percentage": 29.41, "elapsed_time": "3:26:02", "remaining_time": "8:14:33", "throughput": 1703.07, "total_tokens": 21053440} +{"current_steps": 2580, "total_steps": 8739, "loss": 1.074, "learning_rate": 4.50316236203017e-05, "epoch": 0.29522828698935805, "percentage": 29.52, "elapsed_time": "3:26:55", "remaining_time": "8:13:58", "throughput": 1702.34, "total_tokens": 21135360} +{"current_steps": 2590, "total_steps": 8739, "loss": 1.238, "learning_rate": 4.497073883347293e-05, "epoch": 0.2963725826753633, "percentage": 29.64, "elapsed_time": "3:27:49", "remaining_time": "8:13:23", "throughput": 1701.6, "total_tokens": 21217280} +{"current_steps": 2600, "total_steps": 8739, "loss": 1.2223, "learning_rate": 4.490952494989834e-05, "epoch": 0.2975168783613686, "percentage": 29.75, "elapsed_time": "3:28:42", "remaining_time": "8:12:46", "throughput": 1700.92, "total_tokens": 21299200} +{"current_steps": 2610, "total_steps": 8739, "loss": 1.2797, "learning_rate": 4.484798297831826e-05, "epoch": 0.29866117404737386, "percentage": 29.87, "elapsed_time": "3:29:35", "remaining_time": "8:12:10", "throughput": 1700.25, "total_tokens": 21381120} +{"current_steps": 2620, "total_steps": 8739, "loss": 1.1556, "learning_rate": 4.4786113932879605e-05, "epoch": 0.2998054697333791, "percentage": 29.98, "elapsed_time": "3:30:29", "remaining_time": "8:11:35", "throughput": 1699.48, "total_tokens": 21463040} +{"current_steps": 2630, "total_steps": 8739, "loss": 1.156, "learning_rate": 4.472391883311906e-05, "epoch": 0.3009497654193844, "percentage": 30.09, "elapsed_time": "3:31:22", "remaining_time": "8:10:58", "throughput": 1698.83, "total_tokens": 21544960} +{"current_steps": 2640, "total_steps": 8739, "loss": 1.1363, "learning_rate": 4.4661398703946396e-05, "epoch": 0.3020940611053896, "percentage": 30.21, "elapsed_time": "3:32:15", "remaining_time": "8:10:21", "throughput": 1698.17, "total_tokens": 21626880} +{"current_steps": 2650, "total_steps": 8739, "loss": 1.4523, "learning_rate": 4.4598554575627495e-05, "epoch": 0.3032383567913949, "percentage": 30.32, "elapsed_time": "3:33:08", "remaining_time": "8:09:45", "throughput": 1697.47, "total_tokens": 21708800} +{"current_steps": 2660, "total_steps": 8739, "loss": 0.9537, "learning_rate": 4.453538748376742e-05, "epoch": 0.30438265247740015, "percentage": 30.44, "elapsed_time": "3:34:02", "remaining_time": "8:09:09", "throughput": 1696.79, "total_tokens": 21790720} +{"current_steps": 2670, "total_steps": 8739, "loss": 1.1622, "learning_rate": 4.4471898469293324e-05, "epoch": 0.3055269481634054, "percentage": 30.55, "elapsed_time": "3:34:55", "remaining_time": "8:08:32", "throughput": 1696.09, "total_tokens": 21872640} +{"current_steps": 2680, "total_steps": 8739, "loss": 1.3041, "learning_rate": 4.44080885784373e-05, "epoch": 0.3066712438494107, "percentage": 30.67, "elapsed_time": "3:35:49", "remaining_time": "8:07:55", "throughput": 1695.44, "total_tokens": 21954560} +{"current_steps": 2690, "total_steps": 8739, "loss": 1.3722, "learning_rate": 4.434395886271917e-05, "epoch": 0.30781553953541596, "percentage": 30.78, "elapsed_time": "3:36:42", "remaining_time": "8:07:19", "throughput": 1694.77, "total_tokens": 22036480} +{"current_steps": 2700, "total_steps": 8739, "loss": 1.4421, "learning_rate": 4.427951037892911e-05, "epoch": 0.30895983522142123, "percentage": 30.9, "elapsed_time": "3:37:35", "remaining_time": "8:06:41", "throughput": 1694.16, "total_tokens": 22118400} +{"current_steps": 2710, "total_steps": 8739, "loss": 1.5259, "learning_rate": 4.4214744189110266e-05, "epoch": 0.3101041309074265, "percentage": 31.01, "elapsed_time": "3:38:28", "remaining_time": "8:06:03", "throughput": 1693.53, "total_tokens": 22200320} +{"current_steps": 2720, "total_steps": 8739, "loss": 1.1897, "learning_rate": 4.414966136054125e-05, "epoch": 0.3112484265934317, "percentage": 31.12, "elapsed_time": "3:39:22", "remaining_time": "8:05:26", "throughput": 1692.9, "total_tokens": 22282240} +{"current_steps": 2730, "total_steps": 8739, "loss": 1.0431, "learning_rate": 4.408426296571852e-05, "epoch": 0.312392722279437, "percentage": 31.24, "elapsed_time": "3:40:15", "remaining_time": "8:04:48", "throughput": 1692.27, "total_tokens": 22364160} +{"current_steps": 2740, "total_steps": 8739, "loss": 1.3437, "learning_rate": 4.401855008233879e-05, "epoch": 0.31353701796544226, "percentage": 31.35, "elapsed_time": "3:41:08", "remaining_time": "8:04:11", "throughput": 1691.63, "total_tokens": 22446080} +{"current_steps": 2750, "total_steps": 8739, "loss": 1.4596, "learning_rate": 4.395252379328115e-05, "epoch": 0.3146813136514475, "percentage": 31.47, "elapsed_time": "3:42:01", "remaining_time": "8:03:32", "throughput": 1691.04, "total_tokens": 22528000} +{"current_steps": 2760, "total_steps": 8739, "loss": 1.1596, "learning_rate": 4.388618518658932e-05, "epoch": 0.3158256093374528, "percentage": 31.58, "elapsed_time": "3:42:55", "remaining_time": "8:02:54", "throughput": 1690.46, "total_tokens": 22609920} +{"current_steps": 2770, "total_steps": 8739, "loss": 1.2776, "learning_rate": 4.381953535545369e-05, "epoch": 0.31696990502345807, "percentage": 31.7, "elapsed_time": "3:43:48", "remaining_time": "8:02:16", "throughput": 1689.85, "total_tokens": 22691840} +{"current_steps": 2780, "total_steps": 8739, "loss": 1.1147, "learning_rate": 4.375257539819328e-05, "epoch": 0.31811420070946334, "percentage": 31.81, "elapsed_time": "3:44:41", "remaining_time": "8:01:38", "throughput": 1689.23, "total_tokens": 22773760} +{"current_steps": 2790, "total_steps": 8739, "loss": 1.1802, "learning_rate": 4.368530641823769e-05, "epoch": 0.3192584963954686, "percentage": 31.93, "elapsed_time": "3:45:34", "remaining_time": "8:00:59", "throughput": 1688.67, "total_tokens": 22855680} +{"current_steps": 2800, "total_steps": 8739, "loss": 1.0881, "learning_rate": 4.361772952410886e-05, "epoch": 0.3204027920814739, "percentage": 32.04, "elapsed_time": "3:46:28", "remaining_time": "8:00:21", "throughput": 1688.04, "total_tokens": 22937600} +{"current_steps": 2810, "total_steps": 8739, "loss": 1.1945, "learning_rate": 4.354984582940285e-05, "epoch": 0.3215470877674791, "percentage": 32.15, "elapsed_time": "3:47:21", "remaining_time": "7:59:43", "throughput": 1687.41, "total_tokens": 23019520} +{"current_steps": 2820, "total_steps": 8739, "loss": 1.3629, "learning_rate": 4.348165645277145e-05, "epoch": 0.32269138345348436, "percentage": 32.27, "elapsed_time": "3:48:14", "remaining_time": "7:59:04", "throughput": 1686.9, "total_tokens": 23101440} +{"current_steps": 2830, "total_steps": 8739, "loss": 1.3362, "learning_rate": 4.34131625179038e-05, "epoch": 0.32383567913948963, "percentage": 32.38, "elapsed_time": "3:49:08", "remaining_time": "7:58:25", "throughput": 1686.3, "total_tokens": 23183360} +{"current_steps": 2840, "total_steps": 8739, "loss": 1.2316, "learning_rate": 4.334436515350779e-05, "epoch": 0.3249799748254949, "percentage": 32.5, "elapsed_time": "3:50:00", "remaining_time": "7:57:45", "throughput": 1685.79, "total_tokens": 23265280} +{"current_steps": 2850, "total_steps": 8739, "loss": 1.7573, "learning_rate": 4.327526549329157e-05, "epoch": 0.32612427051150017, "percentage": 32.61, "elapsed_time": "3:50:53", "remaining_time": "7:57:06", "throughput": 1685.23, "total_tokens": 23347200} +{"current_steps": 2860, "total_steps": 8739, "loss": 1.4037, "learning_rate": 4.320586467594476e-05, "epoch": 0.32726856619750544, "percentage": 32.73, "elapsed_time": "3:51:47", "remaining_time": "7:56:27", "throughput": 1684.67, "total_tokens": 23429120} +{"current_steps": 2870, "total_steps": 8739, "loss": 1.4623, "learning_rate": 4.313616384511976e-05, "epoch": 0.3284128618835107, "percentage": 32.84, "elapsed_time": "3:52:40", "remaining_time": "7:55:48", "throughput": 1684.13, "total_tokens": 23511040} +{"current_steps": 2880, "total_steps": 8739, "loss": 1.1027, "learning_rate": 4.3066164149412844e-05, "epoch": 0.329557157569516, "percentage": 32.96, "elapsed_time": "3:53:33", "remaining_time": "7:55:08", "throughput": 1683.6, "total_tokens": 23592960} +{"current_steps": 2890, "total_steps": 8739, "loss": 1.2341, "learning_rate": 4.299586674234529e-05, "epoch": 0.33070145325552125, "percentage": 33.07, "elapsed_time": "3:54:26", "remaining_time": "7:54:29", "throughput": 1683.06, "total_tokens": 23674880} +{"current_steps": 2900, "total_steps": 8739, "loss": 1.2661, "learning_rate": 4.292527278234435e-05, "epoch": 0.33184574894152646, "percentage": 33.18, "elapsed_time": "3:55:19", "remaining_time": "7:53:49", "throughput": 1682.54, "total_tokens": 23756800} +{"current_steps": 2910, "total_steps": 8739, "loss": 1.375, "learning_rate": 4.285438343272414e-05, "epoch": 0.33299004462753173, "percentage": 33.3, "elapsed_time": "3:56:13", "remaining_time": "7:53:09", "throughput": 1681.98, "total_tokens": 23838720} +{"current_steps": 2920, "total_steps": 8739, "loss": 1.2119, "learning_rate": 4.278319986166649e-05, "epoch": 0.334134340313537, "percentage": 33.41, "elapsed_time": "3:57:06", "remaining_time": "7:52:30", "throughput": 1681.43, "total_tokens": 23920640} +{"current_steps": 2930, "total_steps": 8739, "loss": 1.322, "learning_rate": 4.2711723242201695e-05, "epoch": 0.3352786359995423, "percentage": 33.53, "elapsed_time": "3:57:59", "remaining_time": "7:51:50", "throughput": 1680.89, "total_tokens": 24002560} +{"current_steps": 2940, "total_steps": 8739, "loss": 1.4806, "learning_rate": 4.263995475218917e-05, "epoch": 0.33642293168554754, "percentage": 33.64, "elapsed_time": "3:58:52", "remaining_time": "7:51:10", "throughput": 1680.37, "total_tokens": 24084480} +{"current_steps": 2950, "total_steps": 8739, "loss": 1.6319, "learning_rate": 4.256789557429806e-05, "epoch": 0.3375672273715528, "percentage": 33.76, "elapsed_time": "3:59:46", "remaining_time": "7:50:31", "throughput": 1679.79, "total_tokens": 24166400} +{"current_steps": 2960, "total_steps": 8739, "loss": 1.2252, "learning_rate": 4.2495546895987724e-05, "epoch": 0.3387115230575581, "percentage": 33.87, "elapsed_time": "4:00:39", "remaining_time": "7:49:51", "throughput": 1679.26, "total_tokens": 24248320} +{"current_steps": 2970, "total_steps": 8739, "loss": 1.1941, "learning_rate": 4.242290990948821e-05, "epoch": 0.33985581874356335, "percentage": 33.99, "elapsed_time": "4:01:33", "remaining_time": "7:49:11", "throughput": 1678.74, "total_tokens": 24330240} +{"current_steps": 2980, "total_steps": 8739, "loss": 1.2853, "learning_rate": 4.234998581178056e-05, "epoch": 0.3410001144295686, "percentage": 34.1, "elapsed_time": "4:02:26", "remaining_time": "7:48:31", "throughput": 1678.23, "total_tokens": 24412160} +{"current_steps": 2990, "total_steps": 8739, "loss": 1.157, "learning_rate": 4.227677580457711e-05, "epoch": 0.34214441011557384, "percentage": 34.21, "elapsed_time": "4:03:20", "remaining_time": "7:47:53", "throughput": 1677.61, "total_tokens": 24494080} +{"current_steps": 3000, "total_steps": 8739, "loss": 1.1064, "learning_rate": 4.220328109430167e-05, "epoch": 0.3432887058015791, "percentage": 34.33, "elapsed_time": "4:04:14", "remaining_time": "7:47:13", "throughput": 1677.07, "total_tokens": 24576000} +{"current_steps": 3010, "total_steps": 8739, "loss": 1.3768, "learning_rate": 4.21295028920697e-05, "epoch": 0.3444330014875844, "percentage": 34.44, "elapsed_time": "4:05:14", "remaining_time": "7:46:46", "throughput": 1675.73, "total_tokens": 24657920} +{"current_steps": 3020, "total_steps": 8739, "loss": 1.1968, "learning_rate": 4.2055442413668264e-05, "epoch": 0.34557729717358965, "percentage": 34.56, "elapsed_time": "4:06:08", "remaining_time": "7:46:06", "throughput": 1675.22, "total_tokens": 24739840} +{"current_steps": 3030, "total_steps": 8739, "loss": 1.3736, "learning_rate": 4.198110087953606e-05, "epoch": 0.3467215928595949, "percentage": 34.67, "elapsed_time": "4:07:01", "remaining_time": "7:45:25", "throughput": 1674.77, "total_tokens": 24821760} +{"current_steps": 3040, "total_steps": 8739, "loss": 1.2485, "learning_rate": 4.190647951474328e-05, "epoch": 0.3478658885456002, "percentage": 34.79, "elapsed_time": "4:07:54", "remaining_time": "7:44:44", "throughput": 1674.29, "total_tokens": 24903680} +{"current_steps": 3050, "total_steps": 8739, "loss": 1.1501, "learning_rate": 4.183157954897144e-05, "epoch": 0.34901018423160546, "percentage": 34.9, "elapsed_time": "4:08:47", "remaining_time": "7:44:03", "throughput": 1673.82, "total_tokens": 24985600} +{"current_steps": 3060, "total_steps": 8739, "loss": 1.1709, "learning_rate": 4.1756402216493115e-05, "epoch": 0.35015447991761073, "percentage": 35.02, "elapsed_time": "4:09:40", "remaining_time": "7:43:21", "throughput": 1673.36, "total_tokens": 25067520} +{"current_steps": 3070, "total_steps": 8739, "loss": 1.2692, "learning_rate": 4.1680948756151564e-05, "epoch": 0.351298775603616, "percentage": 35.13, "elapsed_time": "4:10:33", "remaining_time": "7:42:40", "throughput": 1672.89, "total_tokens": 25149440} +{"current_steps": 3080, "total_steps": 8739, "loss": 1.2124, "learning_rate": 4.160522041134035e-05, "epoch": 0.3524430712896212, "percentage": 35.24, "elapsed_time": "4:11:26", "remaining_time": "7:41:59", "throughput": 1672.44, "total_tokens": 25231360} +{"current_steps": 3090, "total_steps": 8739, "loss": 1.1728, "learning_rate": 4.152921842998287e-05, "epoch": 0.3535873669756265, "percentage": 35.36, "elapsed_time": "4:12:19", "remaining_time": "7:41:17", "throughput": 1671.97, "total_tokens": 25313280} +{"current_steps": 3100, "total_steps": 8739, "loss": 1.309, "learning_rate": 4.145294406451173e-05, "epoch": 0.35473166266163175, "percentage": 35.47, "elapsed_time": "4:13:13", "remaining_time": "7:40:36", "throughput": 1671.5, "total_tokens": 25395200} +{"current_steps": 3110, "total_steps": 8739, "loss": 1.3163, "learning_rate": 4.137639857184815e-05, "epoch": 0.355875958347637, "percentage": 35.59, "elapsed_time": "4:14:06", "remaining_time": "7:39:54", "throughput": 1671.07, "total_tokens": 25477120} +{"current_steps": 3120, "total_steps": 8739, "loss": 1.1725, "learning_rate": 4.129958321338127e-05, "epoch": 0.3570202540336423, "percentage": 35.7, "elapsed_time": "4:14:59", "remaining_time": "7:39:13", "throughput": 1670.61, "total_tokens": 25559040} +{"current_steps": 3130, "total_steps": 8739, "loss": 1.1192, "learning_rate": 4.122249925494726e-05, "epoch": 0.35816454971964756, "percentage": 35.82, "elapsed_time": "4:15:52", "remaining_time": "7:38:31", "throughput": 1670.15, "total_tokens": 25640960} +{"current_steps": 3140, "total_steps": 8739, "loss": 1.2959, "learning_rate": 4.114514796680862e-05, "epoch": 0.35930884540565283, "percentage": 35.93, "elapsed_time": "4:16:45", "remaining_time": "7:37:50", "throughput": 1669.68, "total_tokens": 25722880} +{"current_steps": 3150, "total_steps": 8739, "loss": 1.2905, "learning_rate": 4.106753062363311e-05, "epoch": 0.3604531410916581, "percentage": 36.05, "elapsed_time": "4:17:39", "remaining_time": "7:37:09", "throughput": 1669.22, "total_tokens": 25804800} +{"current_steps": 3160, "total_steps": 8739, "loss": 1.315, "learning_rate": 4.098964850447281e-05, "epoch": 0.3615974367776634, "percentage": 36.16, "elapsed_time": "4:18:32", "remaining_time": "7:36:26", "throughput": 1668.81, "total_tokens": 25886720} +{"current_steps": 3170, "total_steps": 8739, "loss": 1.28, "learning_rate": 4.0911502892743035e-05, "epoch": 0.3627417324636686, "percentage": 36.27, "elapsed_time": "4:19:25", "remaining_time": "7:35:45", "throughput": 1668.33, "total_tokens": 25968640} +{"current_steps": 3180, "total_steps": 8739, "loss": 1.2515, "learning_rate": 4.083309507620118e-05, "epoch": 0.36388602814967386, "percentage": 36.39, "elapsed_time": "4:20:18", "remaining_time": "7:35:02", "throughput": 1667.93, "total_tokens": 26050560} +{"current_steps": 3190, "total_steps": 8739, "loss": 1.1768, "learning_rate": 4.075442634692548e-05, "epoch": 0.3650303238356791, "percentage": 36.5, "elapsed_time": "4:21:11", "remaining_time": "7:34:20", "throughput": 1667.53, "total_tokens": 26132480} +{"current_steps": 3200, "total_steps": 8739, "loss": 1.2891, "learning_rate": 4.067549800129375e-05, "epoch": 0.3661746195216844, "percentage": 36.62, "elapsed_time": "4:22:04", "remaining_time": "7:33:38", "throughput": 1667.08, "total_tokens": 26214400} +{"current_steps": 3210, "total_steps": 8739, "loss": 1.3888, "learning_rate": 4.059631133996203e-05, "epoch": 0.36731891520768967, "percentage": 36.73, "elapsed_time": "4:22:58", "remaining_time": "7:32:57", "throughput": 1666.6, "total_tokens": 26296320} +{"current_steps": 3220, "total_steps": 8739, "loss": 0.9946, "learning_rate": 4.05168676678431e-05, "epoch": 0.36846321089369494, "percentage": 36.85, "elapsed_time": "4:23:51", "remaining_time": "7:32:15", "throughput": 1666.16, "total_tokens": 26378240} +{"current_steps": 3230, "total_steps": 8739, "loss": 1.4232, "learning_rate": 4.0437168294085013e-05, "epoch": 0.3696075065797002, "percentage": 36.96, "elapsed_time": "4:24:45", "remaining_time": "7:31:33", "throughput": 1665.72, "total_tokens": 26460160} +{"current_steps": 3240, "total_steps": 8739, "loss": 1.1119, "learning_rate": 4.0357214532049535e-05, "epoch": 0.3707518022657055, "percentage": 37.08, "elapsed_time": "4:25:38", "remaining_time": "7:30:50", "throughput": 1665.3, "total_tokens": 26542080} +{"current_steps": 3250, "total_steps": 8739, "loss": 1.1302, "learning_rate": 4.027700769929046e-05, "epoch": 0.37189609795171075, "percentage": 37.19, "elapsed_time": "4:26:31", "remaining_time": "7:30:08", "throughput": 1664.87, "total_tokens": 26624000} +{"current_steps": 3260, "total_steps": 8739, "loss": 1.2648, "learning_rate": 4.019654911753193e-05, "epoch": 0.37304039363771596, "percentage": 37.3, "elapsed_time": "4:27:24", "remaining_time": "7:29:26", "throughput": 1664.46, "total_tokens": 26705920} +{"current_steps": 3270, "total_steps": 8739, "loss": 1.204, "learning_rate": 4.011584011264665e-05, "epoch": 0.37418468932372123, "percentage": 37.42, "elapsed_time": "4:28:18", "remaining_time": "7:28:43", "throughput": 1664.05, "total_tokens": 26787840} +{"current_steps": 3280, "total_steps": 8739, "loss": 1.3242, "learning_rate": 4.0034882014634015e-05, "epoch": 0.3753289850097265, "percentage": 37.53, "elapsed_time": "4:29:11", "remaining_time": "7:28:00", "throughput": 1663.64, "total_tokens": 26869760} +{"current_steps": 3290, "total_steps": 8739, "loss": 1.235, "learning_rate": 3.995367615759825e-05, "epoch": 0.37647328069573177, "percentage": 37.65, "elapsed_time": "4:30:04", "remaining_time": "7:27:18", "throughput": 1663.24, "total_tokens": 26951680} +{"current_steps": 3300, "total_steps": 8739, "loss": 1.1119, "learning_rate": 3.9872223879726356e-05, "epoch": 0.37761757638173704, "percentage": 37.76, "elapsed_time": "4:30:57", "remaining_time": "7:26:35", "throughput": 1662.81, "total_tokens": 27033600} +{"current_steps": 3310, "total_steps": 8739, "loss": 1.2295, "learning_rate": 3.979052652326609e-05, "epoch": 0.3787618720677423, "percentage": 37.88, "elapsed_time": "4:31:51", "remaining_time": "7:25:53", "throughput": 1662.37, "total_tokens": 27115520} +{"current_steps": 3320, "total_steps": 8739, "loss": 1.4858, "learning_rate": 3.970858543450387e-05, "epoch": 0.3799061677537476, "percentage": 37.99, "elapsed_time": "4:32:44", "remaining_time": "7:25:11", "throughput": 1661.95, "total_tokens": 27197440} +{"current_steps": 3330, "total_steps": 8739, "loss": 1.1919, "learning_rate": 3.962640196374254e-05, "epoch": 0.38105046343975285, "percentage": 38.11, "elapsed_time": "4:33:38", "remaining_time": "7:24:28", "throughput": 1661.54, "total_tokens": 27279360} +{"current_steps": 3340, "total_steps": 8739, "loss": 1.1531, "learning_rate": 3.954397746527916e-05, "epoch": 0.3821947591257581, "percentage": 38.22, "elapsed_time": "4:34:31", "remaining_time": "7:23:45", "throughput": 1661.15, "total_tokens": 27361280} +{"current_steps": 3350, "total_steps": 8739, "loss": 1.1539, "learning_rate": 3.9461313297382666e-05, "epoch": 0.38333905481176334, "percentage": 38.33, "elapsed_time": "4:35:24", "remaining_time": "7:23:02", "throughput": 1660.75, "total_tokens": 27443200} +{"current_steps": 3360, "total_steps": 8739, "loss": 1.6298, "learning_rate": 3.93784108222715e-05, "epoch": 0.3844833504977686, "percentage": 38.45, "elapsed_time": "4:36:18", "remaining_time": "7:22:19", "throughput": 1660.32, "total_tokens": 27525120} +{"current_steps": 3370, "total_steps": 8739, "loss": 1.2188, "learning_rate": 3.929527140609115e-05, "epoch": 0.3856276461837739, "percentage": 38.56, "elapsed_time": "4:37:11", "remaining_time": "7:21:36", "throughput": 1659.94, "total_tokens": 27607040} +{"current_steps": 3380, "total_steps": 8739, "loss": 1.2925, "learning_rate": 3.921189641889163e-05, "epoch": 0.38677194186977915, "percentage": 38.68, "elapsed_time": "4:38:04", "remaining_time": "7:20:53", "throughput": 1659.55, "total_tokens": 27688960} +{"current_steps": 3390, "total_steps": 8739, "loss": 1.3113, "learning_rate": 3.912828723460495e-05, "epoch": 0.3879162375557844, "percentage": 38.79, "elapsed_time": "4:38:57", "remaining_time": "7:20:09", "throughput": 1659.19, "total_tokens": 27770880} +{"current_steps": 3400, "total_steps": 8739, "loss": 1.2155, "learning_rate": 3.904444523102242e-05, "epoch": 0.3890605332417897, "percentage": 38.91, "elapsed_time": "4:39:50", "remaining_time": "7:19:26", "throughput": 1658.79, "total_tokens": 27852800} +{"current_steps": 3410, "total_steps": 8739, "loss": 1.4058, "learning_rate": 3.896037178977196e-05, "epoch": 0.39020482892779496, "percentage": 39.02, "elapsed_time": "4:40:44", "remaining_time": "7:18:43", "throughput": 1658.4, "total_tokens": 27934720} +{"current_steps": 3420, "total_steps": 8739, "loss": 1.2582, "learning_rate": 3.887606829629536e-05, "epoch": 0.3913491246138002, "percentage": 39.13, "elapsed_time": "4:41:37", "remaining_time": "7:18:00", "throughput": 1658.03, "total_tokens": 28016640} +{"current_steps": 3430, "total_steps": 8739, "loss": 1.2471, "learning_rate": 3.87915361398254e-05, "epoch": 0.3924934202998055, "percentage": 39.25, "elapsed_time": "4:42:30", "remaining_time": "7:17:16", "throughput": 1657.67, "total_tokens": 28098560} +{"current_steps": 3440, "total_steps": 8739, "loss": 1.2815, "learning_rate": 3.8706776713363025e-05, "epoch": 0.3936377159858107, "percentage": 39.36, "elapsed_time": "4:43:23", "remaining_time": "7:16:32", "throughput": 1657.3, "total_tokens": 28180480} +{"current_steps": 3450, "total_steps": 8739, "loss": 1.4604, "learning_rate": 3.862179141365431e-05, "epoch": 0.394782011671816, "percentage": 39.48, "elapsed_time": "4:44:16", "remaining_time": "7:15:49", "throughput": 1656.94, "total_tokens": 28262400} +{"current_steps": 3460, "total_steps": 8739, "loss": 1.2577, "learning_rate": 3.8536581641167506e-05, "epoch": 0.39592630735782125, "percentage": 39.59, "elapsed_time": "4:45:10", "remaining_time": "7:15:05", "throughput": 1656.57, "total_tokens": 28344320} +{"current_steps": 3470, "total_steps": 8739, "loss": 1.2211, "learning_rate": 3.845114880006994e-05, "epoch": 0.3970706030438265, "percentage": 39.71, "elapsed_time": "4:46:03", "remaining_time": "7:14:21", "throughput": 1656.2, "total_tokens": 28426240} +{"current_steps": 3480, "total_steps": 8739, "loss": 1.2543, "learning_rate": 3.836549429820485e-05, "epoch": 0.3982148987298318, "percentage": 39.82, "elapsed_time": "4:46:56", "remaining_time": "7:13:38", "throughput": 1655.84, "total_tokens": 28508160} +{"current_steps": 3490, "total_steps": 8739, "loss": 1.2716, "learning_rate": 3.827961954706825e-05, "epoch": 0.39935919441583706, "percentage": 39.94, "elapsed_time": "4:47:50", "remaining_time": "7:12:54", "throughput": 1655.46, "total_tokens": 28590080} +{"current_steps": 3500, "total_steps": 8739, "loss": 0.9854, "learning_rate": 3.8193525961785584e-05, "epoch": 0.40050349010184233, "percentage": 40.05, "elapsed_time": "4:48:43", "remaining_time": "7:12:10", "throughput": 1655.13, "total_tokens": 28672000} +{"current_steps": 3510, "total_steps": 8739, "loss": 1.1416, "learning_rate": 3.81072149610885e-05, "epoch": 0.4016477857878476, "percentage": 40.16, "elapsed_time": "4:49:36", "remaining_time": "7:11:26", "throughput": 1654.74, "total_tokens": 28753920} +{"current_steps": 3520, "total_steps": 8739, "loss": 1.3587, "learning_rate": 3.802068796729139e-05, "epoch": 0.40279208147385287, "percentage": 40.28, "elapsed_time": "4:50:30", "remaining_time": "7:10:43", "throughput": 1654.37, "total_tokens": 28835840} +{"current_steps": 3530, "total_steps": 8739, "loss": 1.2926, "learning_rate": 3.7933946406268e-05, "epoch": 0.4039363771598581, "percentage": 40.39, "elapsed_time": "4:51:23", "remaining_time": "7:09:59", "throughput": 1654.02, "total_tokens": 28917760} +{"current_steps": 3540, "total_steps": 8739, "loss": 1.2945, "learning_rate": 3.7846991707427905e-05, "epoch": 0.40508067284586335, "percentage": 40.51, "elapsed_time": "4:52:16", "remaining_time": "7:09:14", "throughput": 1653.68, "total_tokens": 28999680} +{"current_steps": 3550, "total_steps": 8739, "loss": 1.2348, "learning_rate": 3.775982530369298e-05, "epoch": 0.4062249685318686, "percentage": 40.62, "elapsed_time": "4:53:09", "remaining_time": "7:08:30", "throughput": 1653.33, "total_tokens": 29081600} +{"current_steps": 3560, "total_steps": 8739, "loss": 1.2022, "learning_rate": 3.767244863147377e-05, "epoch": 0.4073692642178739, "percentage": 40.74, "elapsed_time": "4:54:02", "remaining_time": "7:07:46", "throughput": 1652.99, "total_tokens": 29163520} +{"current_steps": 3570, "total_steps": 8739, "loss": 1.5009, "learning_rate": 3.75848631306458e-05, "epoch": 0.40851355990387916, "percentage": 40.85, "elapsed_time": "4:54:55", "remaining_time": "7:07:02", "throughput": 1652.66, "total_tokens": 29245440} +{"current_steps": 3580, "total_steps": 8739, "loss": 1.2186, "learning_rate": 3.7497070244525925e-05, "epoch": 0.40965785558988443, "percentage": 40.97, "elapsed_time": "4:55:49", "remaining_time": "7:06:17", "throughput": 1652.33, "total_tokens": 29327360} +{"current_steps": 3590, "total_steps": 8739, "loss": 1.3161, "learning_rate": 3.7409071419848436e-05, "epoch": 0.4108021512758897, "percentage": 41.08, "elapsed_time": "4:56:42", "remaining_time": "7:05:32", "throughput": 1652.02, "total_tokens": 29409280} +{"current_steps": 3600, "total_steps": 8739, "loss": 1.0534, "learning_rate": 3.73208681067413e-05, "epoch": 0.411946446961895, "percentage": 41.19, "elapsed_time": "4:57:35", "remaining_time": "7:04:48", "throughput": 1651.67, "total_tokens": 29491200} +{"current_steps": 3610, "total_steps": 8739, "loss": 1.3398, "learning_rate": 3.7232461758702244e-05, "epoch": 0.41309074264790024, "percentage": 41.31, "elapsed_time": "4:58:28", "remaining_time": "7:04:03", "throughput": 1651.36, "total_tokens": 29573120} +{"current_steps": 3620, "total_steps": 8739, "loss": 1.1538, "learning_rate": 3.714385383257477e-05, "epoch": 0.41423503833390546, "percentage": 41.42, "elapsed_time": "4:59:21", "remaining_time": "7:03:19", "throughput": 1651.02, "total_tokens": 29655040} +{"current_steps": 3630, "total_steps": 8739, "loss": 1.0701, "learning_rate": 3.7055045788524214e-05, "epoch": 0.41537933401991073, "percentage": 41.54, "elapsed_time": "5:00:14", "remaining_time": "7:02:34", "throughput": 1650.69, "total_tokens": 29736960} +{"current_steps": 3640, "total_steps": 8739, "loss": 1.4487, "learning_rate": 3.696603909001361e-05, "epoch": 0.416523629705916, "percentage": 41.65, "elapsed_time": "5:01:08", "remaining_time": "7:01:50", "throughput": 1650.34, "total_tokens": 29818880} +{"current_steps": 3650, "total_steps": 8739, "loss": 1.3053, "learning_rate": 3.6876835203779615e-05, "epoch": 0.41766792539192127, "percentage": 41.77, "elapsed_time": "5:02:01", "remaining_time": "7:01:06", "throughput": 1649.99, "total_tokens": 29900800} +{"current_steps": 3660, "total_steps": 8739, "loss": 1.4515, "learning_rate": 3.678743559980835e-05, "epoch": 0.41881222107792654, "percentage": 41.88, "elapsed_time": "5:02:55", "remaining_time": "7:00:21", "throughput": 1649.64, "total_tokens": 29982720} +{"current_steps": 3670, "total_steps": 8739, "loss": 1.4384, "learning_rate": 3.669784175131115e-05, "epoch": 0.4199565167639318, "percentage": 42.0, "elapsed_time": "5:03:48", "remaining_time": "6:59:37", "throughput": 1649.33, "total_tokens": 30064640} +{"current_steps": 3680, "total_steps": 8739, "loss": 1.4419, "learning_rate": 3.660805513470027e-05, "epoch": 0.4211008124499371, "percentage": 42.11, "elapsed_time": "5:04:41", "remaining_time": "6:58:52", "throughput": 1649.01, "total_tokens": 30146560} +{"current_steps": 3690, "total_steps": 8739, "loss": 1.2246, "learning_rate": 3.651807722956462e-05, "epoch": 0.42224510813594235, "percentage": 42.22, "elapsed_time": "5:05:34", "remaining_time": "6:58:07", "throughput": 1648.69, "total_tokens": 30228480} +{"current_steps": 3700, "total_steps": 8739, "loss": 1.0901, "learning_rate": 3.642790951864532e-05, "epoch": 0.4233894038219476, "percentage": 42.34, "elapsed_time": "5:06:28", "remaining_time": "6:57:22", "throughput": 1648.37, "total_tokens": 30310400} +{"current_steps": 3710, "total_steps": 8739, "loss": 1.2148, "learning_rate": 3.63375534878113e-05, "epoch": 0.42453369950795283, "percentage": 42.45, "elapsed_time": "5:07:21", "remaining_time": "6:56:37", "throughput": 1648.04, "total_tokens": 30392320} +{"current_steps": 3720, "total_steps": 8739, "loss": 1.3764, "learning_rate": 3.6247010626034795e-05, "epoch": 0.4256779951939581, "percentage": 42.57, "elapsed_time": "5:08:14", "remaining_time": "6:55:53", "throughput": 1647.72, "total_tokens": 30474240} +{"current_steps": 3730, "total_steps": 8739, "loss": 1.216, "learning_rate": 3.615628242536682e-05, "epoch": 0.4268222908799634, "percentage": 42.68, "elapsed_time": "5:09:08", "remaining_time": "6:55:08", "throughput": 1647.4, "total_tokens": 30556160} +{"current_steps": 3740, "total_steps": 8739, "loss": 1.2571, "learning_rate": 3.6065370380912587e-05, "epoch": 0.42796658656596864, "percentage": 42.8, "elapsed_time": "5:10:01", "remaining_time": "6:54:23", "throughput": 1647.09, "total_tokens": 30638080} +{"current_steps": 3750, "total_steps": 8739, "loss": 1.1939, "learning_rate": 3.5974275990806846e-05, "epoch": 0.4291108822519739, "percentage": 42.91, "elapsed_time": "5:10:54", "remaining_time": "6:53:37", "throughput": 1646.79, "total_tokens": 30720000} +{"current_steps": 3760, "total_steps": 8739, "loss": 1.1014, "learning_rate": 3.588300075618922e-05, "epoch": 0.4302551779379792, "percentage": 43.03, "elapsed_time": "5:11:47", "remaining_time": "6:52:52", "throughput": 1646.5, "total_tokens": 30801920} +{"current_steps": 3770, "total_steps": 8739, "loss": 1.1029, "learning_rate": 3.579154618117946e-05, "epoch": 0.43139947362398445, "percentage": 43.14, "elapsed_time": "5:12:40", "remaining_time": "6:52:07", "throughput": 1646.19, "total_tokens": 30883840} +{"current_steps": 3780, "total_steps": 8739, "loss": 1.3753, "learning_rate": 3.5699913772852664e-05, "epoch": 0.4325437693099897, "percentage": 43.25, "elapsed_time": "5:13:34", "remaining_time": "6:51:23", "throughput": 1645.82, "total_tokens": 30965760} +{"current_steps": 3790, "total_steps": 8739, "loss": 1.405, "learning_rate": 3.560810504121441e-05, "epoch": 0.43368806499599494, "percentage": 43.37, "elapsed_time": "5:14:28", "remaining_time": "6:50:38", "throughput": 1645.51, "total_tokens": 31047680} +{"current_steps": 3800, "total_steps": 8739, "loss": 1.1393, "learning_rate": 3.551612149917593e-05, "epoch": 0.4348323606820002, "percentage": 43.48, "elapsed_time": "5:15:20", "remaining_time": "6:49:52", "throughput": 1645.25, "total_tokens": 31129600} +{"current_steps": 3810, "total_steps": 8739, "loss": 1.3569, "learning_rate": 3.542396466252913e-05, "epoch": 0.4359766563680055, "percentage": 43.6, "elapsed_time": "5:16:14", "remaining_time": "6:49:06", "throughput": 1644.95, "total_tokens": 31211520} +{"current_steps": 3820, "total_steps": 8739, "loss": 1.4194, "learning_rate": 3.533163604992163e-05, "epoch": 0.43712095205401075, "percentage": 43.71, "elapsed_time": "5:17:07", "remaining_time": "6:48:21", "throughput": 1644.65, "total_tokens": 31293440} +{"current_steps": 3830, "total_steps": 8739, "loss": 1.2899, "learning_rate": 3.523913718283175e-05, "epoch": 0.438265247740016, "percentage": 43.83, "elapsed_time": "5:18:00", "remaining_time": "6:47:35", "throughput": 1644.38, "total_tokens": 31375360} +{"current_steps": 3840, "total_steps": 8739, "loss": 1.3624, "learning_rate": 3.514646958554339e-05, "epoch": 0.4394095434260213, "percentage": 43.94, "elapsed_time": "5:18:53", "remaining_time": "6:46:49", "throughput": 1644.11, "total_tokens": 31457280} +{"current_steps": 3850, "total_steps": 8739, "loss": 1.1517, "learning_rate": 3.5053634785121e-05, "epoch": 0.44055383911202656, "percentage": 44.06, "elapsed_time": "5:19:46", "remaining_time": "6:46:04", "throughput": 1643.84, "total_tokens": 31539200} +{"current_steps": 3860, "total_steps": 8739, "loss": 1.2125, "learning_rate": 3.496063431138431e-05, "epoch": 0.4416981347980318, "percentage": 44.17, "elapsed_time": "5:20:39", "remaining_time": "6:45:18", "throughput": 1643.57, "total_tokens": 31621120} +{"current_steps": 3870, "total_steps": 8739, "loss": 1.287, "learning_rate": 3.4867469696883204e-05, "epoch": 0.4428424304840371, "percentage": 44.28, "elapsed_time": "5:21:32", "remaining_time": "6:44:32", "throughput": 1643.31, "total_tokens": 31703040} +{"current_steps": 3880, "total_steps": 8739, "loss": 1.0745, "learning_rate": 3.477414247687241e-05, "epoch": 0.4439867261700423, "percentage": 44.4, "elapsed_time": "5:22:24", "remaining_time": "6:43:46", "throughput": 1643.07, "total_tokens": 31784960} +{"current_steps": 3890, "total_steps": 8739, "loss": 1.146, "learning_rate": 3.468065418928625e-05, "epoch": 0.4451310218560476, "percentage": 44.51, "elapsed_time": "5:23:18", "remaining_time": "6:43:00", "throughput": 1642.79, "total_tokens": 31866880} +{"current_steps": 3900, "total_steps": 8739, "loss": 1.0793, "learning_rate": 3.458700637471325e-05, "epoch": 0.44627531754205285, "percentage": 44.63, "elapsed_time": "5:24:10", "remaining_time": "6:42:14", "throughput": 1642.53, "total_tokens": 31948800} +{"current_steps": 3910, "total_steps": 8739, "loss": 1.1415, "learning_rate": 3.4493200576370776e-05, "epoch": 0.4474196132280581, "percentage": 44.74, "elapsed_time": "5:25:04", "remaining_time": "6:41:28", "throughput": 1642.25, "total_tokens": 32030720} +{"current_steps": 3920, "total_steps": 8739, "loss": 1.2075, "learning_rate": 3.4399238340079607e-05, "epoch": 0.4485639089140634, "percentage": 44.86, "elapsed_time": "5:25:57", "remaining_time": "6:40:42", "throughput": 1641.99, "total_tokens": 32112640} +{"current_steps": 3930, "total_steps": 8739, "loss": 1.1582, "learning_rate": 3.4305121214238446e-05, "epoch": 0.44970820460006866, "percentage": 44.97, "elapsed_time": "5:26:50", "remaining_time": "6:39:56", "throughput": 1641.74, "total_tokens": 32194560} +{"current_steps": 3940, "total_steps": 8739, "loss": 1.3309, "learning_rate": 3.4210850749798415e-05, "epoch": 0.45085250028607393, "percentage": 45.09, "elapsed_time": "5:27:43", "remaining_time": "6:39:10", "throughput": 1641.47, "total_tokens": 32276480} +{"current_steps": 3950, "total_steps": 8739, "loss": 1.2072, "learning_rate": 3.411642850023751e-05, "epoch": 0.4519967959720792, "percentage": 45.2, "elapsed_time": "5:28:36", "remaining_time": "6:38:24", "throughput": 1641.21, "total_tokens": 32358400} +{"current_steps": 3960, "total_steps": 8739, "loss": 1.1731, "learning_rate": 3.402185602153495e-05, "epoch": 0.45314109165808447, "percentage": 45.31, "elapsed_time": "5:29:29", "remaining_time": "6:37:38", "throughput": 1640.94, "total_tokens": 32440320} +{"current_steps": 3970, "total_steps": 8739, "loss": 1.1238, "learning_rate": 3.392713487214561e-05, "epoch": 0.4542853873440897, "percentage": 45.43, "elapsed_time": "5:30:22", "remaining_time": "6:36:51", "throughput": 1640.69, "total_tokens": 32522240} +{"current_steps": 3980, "total_steps": 8739, "loss": 1.1262, "learning_rate": 3.38322666129743e-05, "epoch": 0.45542968303009496, "percentage": 45.54, "elapsed_time": "5:31:15", "remaining_time": "6:36:05", "throughput": 1640.44, "total_tokens": 32604160} +{"current_steps": 3990, "total_steps": 8739, "loss": 1.2084, "learning_rate": 3.373725280735e-05, "epoch": 0.4565739787161002, "percentage": 45.66, "elapsed_time": "5:32:08", "remaining_time": "6:35:19", "throughput": 1640.18, "total_tokens": 32686080} +{"current_steps": 4000, "total_steps": 8739, "loss": 1.2836, "learning_rate": 3.3642095021000184e-05, "epoch": 0.4577182744021055, "percentage": 45.77, "elapsed_time": "5:33:01", "remaining_time": "6:34:33", "throughput": 1639.9, "total_tokens": 32768000} +{"current_steps": 4010, "total_steps": 8739, "loss": 1.295, "learning_rate": 3.3546794822024976e-05, "epoch": 0.45886257008811077, "percentage": 45.89, "elapsed_time": "5:34:11", "remaining_time": "6:34:07", "throughput": 1638.26, "total_tokens": 32849920} +{"current_steps": 4020, "total_steps": 8739, "loss": 1.3341, "learning_rate": 3.3451353780871286e-05, "epoch": 0.46000686577411604, "percentage": 46.0, "elapsed_time": "5:35:05", "remaining_time": "6:33:20", "throughput": 1637.99, "total_tokens": 32931840} +{"current_steps": 4030, "total_steps": 8739, "loss": 1.2892, "learning_rate": 3.335577347030697e-05, "epoch": 0.4611511614601213, "percentage": 46.12, "elapsed_time": "5:35:58", "remaining_time": "6:32:35", "throughput": 1637.7, "total_tokens": 33013760} +{"current_steps": 4040, "total_steps": 8739, "loss": 1.5631, "learning_rate": 3.32600554653949e-05, "epoch": 0.4622954571461266, "percentage": 46.23, "elapsed_time": "5:36:51", "remaining_time": "6:31:48", "throughput": 1637.45, "total_tokens": 33095680} +{"current_steps": 4050, "total_steps": 8739, "loss": 0.9705, "learning_rate": 3.316420134346701e-05, "epoch": 0.46343975283213185, "percentage": 46.34, "elapsed_time": "5:37:44", "remaining_time": "6:31:02", "throughput": 1637.21, "total_tokens": 33177600} +{"current_steps": 4060, "total_steps": 8739, "loss": 1.3763, "learning_rate": 3.306821268409827e-05, "epoch": 0.46458404851813706, "percentage": 46.46, "elapsed_time": "5:38:37", "remaining_time": "6:30:15", "throughput": 1636.98, "total_tokens": 33259520} +{"current_steps": 4070, "total_steps": 8739, "loss": 1.2818, "learning_rate": 3.297209106908072e-05, "epoch": 0.46572834420414233, "percentage": 46.57, "elapsed_time": "5:39:30", "remaining_time": "6:29:28", "throughput": 1636.74, "total_tokens": 33341440} +{"current_steps": 4080, "total_steps": 8739, "loss": 1.1623, "learning_rate": 3.287583808239735e-05, "epoch": 0.4668726398901476, "percentage": 46.69, "elapsed_time": "5:40:23", "remaining_time": "6:28:42", "throughput": 1636.5, "total_tokens": 33423360} +{"current_steps": 4090, "total_steps": 8739, "loss": 1.5152, "learning_rate": 3.277945531019601e-05, "epoch": 0.46801693557615287, "percentage": 46.8, "elapsed_time": "5:41:17", "remaining_time": "6:27:55", "throughput": 1636.23, "total_tokens": 33505280} +{"current_steps": 4100, "total_steps": 8739, "loss": 1.5291, "learning_rate": 3.268294434076332e-05, "epoch": 0.46916123126215814, "percentage": 46.92, "elapsed_time": "5:42:10", "remaining_time": "6:27:09", "throughput": 1635.99, "total_tokens": 33587200} +{"current_steps": 4110, "total_steps": 8739, "loss": 1.1453, "learning_rate": 3.2586306764498395e-05, "epoch": 0.4703055269481634, "percentage": 47.03, "elapsed_time": "5:43:03", "remaining_time": "6:26:22", "throughput": 1635.72, "total_tokens": 33669120} +{"current_steps": 4120, "total_steps": 8739, "loss": 1.398, "learning_rate": 3.2489544173886745e-05, "epoch": 0.4714498226341687, "percentage": 47.14, "elapsed_time": "5:43:56", "remaining_time": "6:25:36", "throughput": 1635.47, "total_tokens": 33751040} +{"current_steps": 4130, "total_steps": 8739, "loss": 1.0819, "learning_rate": 3.239265816347397e-05, "epoch": 0.47259411832017395, "percentage": 47.26, "elapsed_time": "5:44:50", "remaining_time": "6:24:50", "throughput": 1635.2, "total_tokens": 33832960} +{"current_steps": 4140, "total_steps": 8739, "loss": 1.3502, "learning_rate": 3.2295650329839474e-05, "epoch": 0.4737384140061792, "percentage": 47.37, "elapsed_time": "5:45:43", "remaining_time": "6:24:03", "throughput": 1634.96, "total_tokens": 33914880} +{"current_steps": 4150, "total_steps": 8739, "loss": 1.1419, "learning_rate": 3.219852227157022e-05, "epoch": 0.47488270969218443, "percentage": 47.49, "elapsed_time": "5:46:36", "remaining_time": "6:23:16", "throughput": 1634.73, "total_tokens": 33996800} +{"current_steps": 4160, "total_steps": 8739, "loss": 1.3278, "learning_rate": 3.210127558923434e-05, "epoch": 0.4760270053781897, "percentage": 47.6, "elapsed_time": "5:47:29", "remaining_time": "6:22:29", "throughput": 1634.48, "total_tokens": 34078720} +{"current_steps": 4170, "total_steps": 8739, "loss": 1.2711, "learning_rate": 3.200391188535472e-05, "epoch": 0.477171301064195, "percentage": 47.72, "elapsed_time": "5:48:23", "remaining_time": "6:21:43", "throughput": 1634.22, "total_tokens": 34160640} +{"current_steps": 4180, "total_steps": 8739, "loss": 1.4901, "learning_rate": 3.1906432764382695e-05, "epoch": 0.47831559675020024, "percentage": 47.83, "elapsed_time": "5:49:16", "remaining_time": "6:20:56", "throughput": 1633.99, "total_tokens": 34242560} +{"current_steps": 4190, "total_steps": 8739, "loss": 1.4351, "learning_rate": 3.1808839832671523e-05, "epoch": 0.4794598924362055, "percentage": 47.95, "elapsed_time": "5:50:09", "remaining_time": "6:20:09", "throughput": 1633.75, "total_tokens": 34324480} +{"current_steps": 4200, "total_steps": 8739, "loss": 1.1299, "learning_rate": 3.1711134698449946e-05, "epoch": 0.4806041881222108, "percentage": 48.06, "elapsed_time": "5:51:02", "remaining_time": "6:19:22", "throughput": 1633.51, "total_tokens": 34406400} +{"current_steps": 4210, "total_steps": 8739, "loss": 1.3597, "learning_rate": 3.161331897179568e-05, "epoch": 0.48174848380821605, "percentage": 48.17, "elapsed_time": "5:51:55", "remaining_time": "6:18:35", "throughput": 1633.31, "total_tokens": 34488320} +{"current_steps": 4220, "total_steps": 8739, "loss": 1.4977, "learning_rate": 3.151539426460892e-05, "epoch": 0.4828927794942213, "percentage": 48.29, "elapsed_time": "5:52:48", "remaining_time": "6:17:48", "throughput": 1633.07, "total_tokens": 34570240} +{"current_steps": 4230, "total_steps": 8739, "loss": 1.1672, "learning_rate": 3.14173621905857e-05, "epoch": 0.4840370751802266, "percentage": 48.4, "elapsed_time": "5:53:41", "remaining_time": "6:17:01", "throughput": 1632.85, "total_tokens": 34652160} +{"current_steps": 4240, "total_steps": 8739, "loss": 1.495, "learning_rate": 3.1319224365191366e-05, "epoch": 0.4851813708662318, "percentage": 48.52, "elapsed_time": "5:54:35", "remaining_time": "6:16:14", "throughput": 1632.62, "total_tokens": 34734080} +{"current_steps": 4250, "total_steps": 8739, "loss": 1.6386, "learning_rate": 3.122098240563396e-05, "epoch": 0.4863256665522371, "percentage": 48.63, "elapsed_time": "5:55:28", "remaining_time": "6:15:27", "throughput": 1632.38, "total_tokens": 34816000} +{"current_steps": 4260, "total_steps": 8739, "loss": 1.2742, "learning_rate": 3.1122637930837486e-05, "epoch": 0.48746996223824235, "percentage": 48.75, "elapsed_time": "5:56:21", "remaining_time": "6:14:40", "throughput": 1632.14, "total_tokens": 34897920} +{"current_steps": 4270, "total_steps": 8739, "loss": 1.2173, "learning_rate": 3.102419256141536e-05, "epoch": 0.4886142579242476, "percentage": 48.86, "elapsed_time": "5:57:15", "remaining_time": "6:13:54", "throughput": 1631.89, "total_tokens": 34979840} +{"current_steps": 4280, "total_steps": 8739, "loss": 1.187, "learning_rate": 3.092564791964358e-05, "epoch": 0.4897585536102529, "percentage": 48.98, "elapsed_time": "5:58:08", "remaining_time": "6:13:06", "throughput": 1631.67, "total_tokens": 35061760} +{"current_steps": 4290, "total_steps": 8739, "loss": 1.5849, "learning_rate": 3.082700562943409e-05, "epoch": 0.49090284929625816, "percentage": 49.09, "elapsed_time": "5:59:01", "remaining_time": "6:12:19", "throughput": 1631.44, "total_tokens": 35143680} +{"current_steps": 4300, "total_steps": 8739, "loss": 1.2716, "learning_rate": 3.0728267316307945e-05, "epoch": 0.49204714498226343, "percentage": 49.2, "elapsed_time": "5:59:54", "remaining_time": "6:11:32", "throughput": 1631.23, "total_tokens": 35225600} +{"current_steps": 4310, "total_steps": 8739, "loss": 1.2538, "learning_rate": 3.062943460736857e-05, "epoch": 0.4931914406682687, "percentage": 49.32, "elapsed_time": "6:00:47", "remaining_time": "6:10:45", "throughput": 1631.02, "total_tokens": 35307520} +{"current_steps": 4320, "total_steps": 8739, "loss": 1.1509, "learning_rate": 3.0530509131274935e-05, "epoch": 0.49433573635427397, "percentage": 49.43, "elapsed_time": "6:01:40", "remaining_time": "6:09:58", "throughput": 1630.79, "total_tokens": 35389440} +{"current_steps": 4330, "total_steps": 8739, "loss": 1.1693, "learning_rate": 3.04314925182147e-05, "epoch": 0.4954800320402792, "percentage": 49.55, "elapsed_time": "6:02:33", "remaining_time": "6:09:10", "throughput": 1630.57, "total_tokens": 35471360} +{"current_steps": 4340, "total_steps": 8739, "loss": 1.2192, "learning_rate": 3.03323863998774e-05, "epoch": 0.49662432772628445, "percentage": 49.66, "elapsed_time": "6:03:27", "remaining_time": "6:08:23", "throughput": 1630.35, "total_tokens": 35553280} +{"current_steps": 4350, "total_steps": 8739, "loss": 1.2383, "learning_rate": 3.0233192409427492e-05, "epoch": 0.4977686234122897, "percentage": 49.78, "elapsed_time": "6:04:20", "remaining_time": "6:07:36", "throughput": 1630.08, "total_tokens": 35635200} +{"current_steps": 4360, "total_steps": 8739, "loss": 1.1951, "learning_rate": 3.0133912181477475e-05, "epoch": 0.498912919098295, "percentage": 49.89, "elapsed_time": "6:05:14", "remaining_time": "6:06:50", "throughput": 1629.82, "total_tokens": 35717120} +{"current_steps": 4370, "total_steps": 8739, "loss": 1.4106, "learning_rate": 3.003454735206097e-05, "epoch": 0.5000572147843002, "percentage": 50.01, "elapsed_time": "6:06:08", "remaining_time": "6:06:03", "throughput": 1629.59, "total_tokens": 35799040} +{"current_steps": 4380, "total_steps": 8739, "loss": 1.2978, "learning_rate": 2.9935099558605728e-05, "epoch": 0.5012015104703055, "percentage": 50.12, "elapsed_time": "6:07:01", "remaining_time": "6:05:15", "throughput": 1629.37, "total_tokens": 35880960} +{"current_steps": 4390, "total_steps": 8739, "loss": 1.1646, "learning_rate": 2.9835570439906657e-05, "epoch": 0.5023458061563107, "percentage": 50.23, "elapsed_time": "6:07:54", "remaining_time": "6:04:28", "throughput": 1629.16, "total_tokens": 35962880} +{"current_steps": 4400, "total_steps": 8739, "loss": 1.2874, "learning_rate": 2.973596163609883e-05, "epoch": 0.503490101842316, "percentage": 50.35, "elapsed_time": "6:08:47", "remaining_time": "6:03:40", "throughput": 1628.94, "total_tokens": 36044800} +{"current_steps": 4410, "total_steps": 8739, "loss": 1.2198, "learning_rate": 2.9636274788630437e-05, "epoch": 0.5046343975283213, "percentage": 50.46, "elapsed_time": "6:09:40", "remaining_time": "6:02:52", "throughput": 1628.77, "total_tokens": 36126720} +{"current_steps": 4420, "total_steps": 8739, "loss": 1.2435, "learning_rate": 2.9536511540235744e-05, "epoch": 0.5057786932143266, "percentage": 50.58, "elapsed_time": "6:10:33", "remaining_time": "6:02:05", "throughput": 1628.58, "total_tokens": 36208640} +{"current_steps": 4430, "total_steps": 8739, "loss": 1.367, "learning_rate": 2.9436673534908044e-05, "epoch": 0.5069229889003318, "percentage": 50.69, "elapsed_time": "6:11:27", "remaining_time": "6:01:18", "throughput": 1628.32, "total_tokens": 36290560} +{"current_steps": 4440, "total_steps": 8739, "loss": 1.1908, "learning_rate": 2.9336762417872516e-05, "epoch": 0.5080672845863371, "percentage": 50.81, "elapsed_time": "6:12:20", "remaining_time": "6:00:31", "throughput": 1628.09, "total_tokens": 36372480} +{"current_steps": 4450, "total_steps": 8739, "loss": 1.2709, "learning_rate": 2.9236779835559165e-05, "epoch": 0.5092115802723424, "percentage": 50.92, "elapsed_time": "6:13:14", "remaining_time": "5:59:43", "throughput": 1627.85, "total_tokens": 36454400} +{"current_steps": 4460, "total_steps": 8739, "loss": 1.1411, "learning_rate": 2.913672743557565e-05, "epoch": 0.5103558759583476, "percentage": 51.04, "elapsed_time": "6:14:07", "remaining_time": "5:58:56", "throughput": 1627.63, "total_tokens": 36536320} +{"current_steps": 4470, "total_steps": 8739, "loss": 1.1795, "learning_rate": 2.9036606866680187e-05, "epoch": 0.5115001716443529, "percentage": 51.15, "elapsed_time": "6:15:01", "remaining_time": "5:58:09", "throughput": 1627.4, "total_tokens": 36618240} +{"current_steps": 4480, "total_steps": 8739, "loss": 1.4518, "learning_rate": 2.8936419778754294e-05, "epoch": 0.5126444673303582, "percentage": 51.26, "elapsed_time": "6:15:54", "remaining_time": "5:57:22", "throughput": 1627.15, "total_tokens": 36700160} +{"current_steps": 4490, "total_steps": 8739, "loss": 1.1565, "learning_rate": 2.883616782277569e-05, "epoch": 0.5137887630163634, "percentage": 51.38, "elapsed_time": "6:16:47", "remaining_time": "5:56:34", "throughput": 1626.96, "total_tokens": 36782080} +{"current_steps": 4500, "total_steps": 8739, "loss": 1.1245, "learning_rate": 2.8735852650791035e-05, "epoch": 0.5149330587023687, "percentage": 51.49, "elapsed_time": "6:17:41", "remaining_time": "5:55:47", "throughput": 1626.73, "total_tokens": 36864000} +{"current_steps": 4510, "total_steps": 8739, "loss": 1.2498, "learning_rate": 2.8635475915888732e-05, "epoch": 0.516077354388374, "percentage": 51.61, "elapsed_time": "6:18:34", "remaining_time": "5:54:59", "throughput": 1626.54, "total_tokens": 36945920} +{"current_steps": 4520, "total_steps": 8739, "loss": 1.222, "learning_rate": 2.853503927217167e-05, "epoch": 0.5172216500743793, "percentage": 51.72, "elapsed_time": "6:19:27", "remaining_time": "5:54:11", "throughput": 1626.34, "total_tokens": 37027840} +{"current_steps": 4530, "total_steps": 8739, "loss": 1.3003, "learning_rate": 2.8434544374729965e-05, "epoch": 0.5183659457603845, "percentage": 51.84, "elapsed_time": "6:20:20", "remaining_time": "5:53:23", "throughput": 1626.14, "total_tokens": 37109760} +{"current_steps": 4540, "total_steps": 8739, "loss": 1.1049, "learning_rate": 2.8333992879613712e-05, "epoch": 0.5195102414463898, "percentage": 51.95, "elapsed_time": "6:21:14", "remaining_time": "5:52:36", "throughput": 1625.91, "total_tokens": 37191680} +{"current_steps": 4550, "total_steps": 8739, "loss": 1.2885, "learning_rate": 2.823338644380566e-05, "epoch": 0.520654537132395, "percentage": 52.07, "elapsed_time": "6:22:07", "remaining_time": "5:51:48", "throughput": 1625.71, "total_tokens": 37273600} +{"current_steps": 4560, "total_steps": 8739, "loss": 1.3466, "learning_rate": 2.8132726725193926e-05, "epoch": 0.5217988328184002, "percentage": 52.18, "elapsed_time": "6:23:01", "remaining_time": "5:51:01", "throughput": 1625.48, "total_tokens": 37355520} +{"current_steps": 4570, "total_steps": 8739, "loss": 1.3192, "learning_rate": 2.803201538254467e-05, "epoch": 0.5229431285044055, "percentage": 52.29, "elapsed_time": "6:23:54", "remaining_time": "5:50:12", "throughput": 1625.31, "total_tokens": 37437440} +{"current_steps": 4580, "total_steps": 8739, "loss": 1.2215, "learning_rate": 2.7931254075474768e-05, "epoch": 0.5240874241904108, "percentage": 52.41, "elapsed_time": "6:24:47", "remaining_time": "5:49:24", "throughput": 1625.12, "total_tokens": 37519360} +{"current_steps": 4590, "total_steps": 8739, "loss": 1.1609, "learning_rate": 2.7830444464424466e-05, "epoch": 0.525231719876416, "percentage": 52.52, "elapsed_time": "6:25:40", "remaining_time": "5:48:37", "throughput": 1624.93, "total_tokens": 37601280} +{"current_steps": 4600, "total_steps": 8739, "loss": 1.0642, "learning_rate": 2.772958821062997e-05, "epoch": 0.5263760155624213, "percentage": 52.64, "elapsed_time": "6:26:33", "remaining_time": "5:47:49", "throughput": 1624.71, "total_tokens": 37683200} +{"current_steps": 4610, "total_steps": 8739, "loss": 1.1454, "learning_rate": 2.7628686976096164e-05, "epoch": 0.5275203112484266, "percentage": 52.75, "elapsed_time": "6:27:26", "remaining_time": "5:47:01", "throughput": 1624.54, "total_tokens": 37765120} +{"current_steps": 4620, "total_steps": 8739, "loss": 1.1747, "learning_rate": 2.7527742423569124e-05, "epoch": 0.5286646069344318, "percentage": 52.87, "elapsed_time": "6:28:19", "remaining_time": "5:46:13", "throughput": 1624.36, "total_tokens": 37847040} +{"current_steps": 4630, "total_steps": 8739, "loss": 1.1861, "learning_rate": 2.7426756216508776e-05, "epoch": 0.5298089026204371, "percentage": 52.98, "elapsed_time": "6:29:12", "remaining_time": "5:45:24", "throughput": 1624.18, "total_tokens": 37928960} +{"current_steps": 4640, "total_steps": 8739, "loss": 1.3794, "learning_rate": 2.7325730019061474e-05, "epoch": 0.5309531983064424, "percentage": 53.1, "elapsed_time": "6:30:06", "remaining_time": "5:44:37", "throughput": 1623.96, "total_tokens": 38010880} +{"current_steps": 4650, "total_steps": 8739, "loss": 1.1395, "learning_rate": 2.7224665496032565e-05, "epoch": 0.5320974939924477, "percentage": 53.21, "elapsed_time": "6:30:59", "remaining_time": "5:43:48", "throughput": 1623.8, "total_tokens": 38092800} +{"current_steps": 4660, "total_steps": 8739, "loss": 1.1517, "learning_rate": 2.712356431285896e-05, "epoch": 0.5332417896784529, "percentage": 53.32, "elapsed_time": "6:31:52", "remaining_time": "5:43:00", "throughput": 1623.62, "total_tokens": 38174720} +{"current_steps": 4670, "total_steps": 8739, "loss": 1.2753, "learning_rate": 2.70224281355817e-05, "epoch": 0.5343860853644582, "percentage": 53.44, "elapsed_time": "6:32:45", "remaining_time": "5:42:12", "throughput": 1623.44, "total_tokens": 38256640} +{"current_steps": 4680, "total_steps": 8739, "loss": 1.1533, "learning_rate": 2.6921258630818475e-05, "epoch": 0.5355303810504635, "percentage": 53.55, "elapsed_time": "6:33:38", "remaining_time": "5:41:24", "throughput": 1623.25, "total_tokens": 38338560} +{"current_steps": 4690, "total_steps": 8739, "loss": 1.1615, "learning_rate": 2.6820057465736197e-05, "epoch": 0.5366746767364687, "percentage": 53.67, "elapsed_time": "6:34:31", "remaining_time": "5:40:36", "throughput": 1623.08, "total_tokens": 38420480} +{"current_steps": 4700, "total_steps": 8739, "loss": 1.1366, "learning_rate": 2.6718826308023487e-05, "epoch": 0.537818972422474, "percentage": 53.78, "elapsed_time": "6:35:24", "remaining_time": "5:39:47", "throughput": 1622.9, "total_tokens": 38502400} +{"current_steps": 4710, "total_steps": 8739, "loss": 1.129, "learning_rate": 2.6617566825863237e-05, "epoch": 0.5389632681084793, "percentage": 53.9, "elapsed_time": "6:36:17", "remaining_time": "5:38:59", "throughput": 1622.74, "total_tokens": 38584320} +{"current_steps": 4720, "total_steps": 8739, "loss": 1.0386, "learning_rate": 2.651628068790507e-05, "epoch": 0.5401075637944845, "percentage": 54.01, "elapsed_time": "6:37:10", "remaining_time": "5:38:10", "throughput": 1622.58, "total_tokens": 38666240} +{"current_steps": 4730, "total_steps": 8739, "loss": 1.0903, "learning_rate": 2.6414969563237874e-05, "epoch": 0.5412518594804897, "percentage": 54.13, "elapsed_time": "6:38:03", "remaining_time": "5:37:22", "throughput": 1622.39, "total_tokens": 38748160} +{"current_steps": 4740, "total_steps": 8739, "loss": 1.2361, "learning_rate": 2.6313635121362322e-05, "epoch": 0.542396155166495, "percentage": 54.24, "elapsed_time": "6:38:56", "remaining_time": "5:36:34", "throughput": 1622.19, "total_tokens": 38830080} +{"current_steps": 4750, "total_steps": 8739, "loss": 1.5279, "learning_rate": 2.6212279032163283e-05, "epoch": 0.5435404508525002, "percentage": 54.35, "elapsed_time": "6:39:50", "remaining_time": "5:35:46", "throughput": 1622.0, "total_tokens": 38912000} +{"current_steps": 4760, "total_steps": 8739, "loss": 1.3035, "learning_rate": 2.6110902965882383e-05, "epoch": 0.5446847465385055, "percentage": 54.47, "elapsed_time": "6:40:43", "remaining_time": "5:34:58", "throughput": 1621.82, "total_tokens": 38993920} +{"current_steps": 4770, "total_steps": 8739, "loss": 1.2656, "learning_rate": 2.6009508593090448e-05, "epoch": 0.5458290422245108, "percentage": 54.58, "elapsed_time": "6:41:36", "remaining_time": "5:34:10", "throughput": 1621.63, "total_tokens": 39075840} +{"current_steps": 4780, "total_steps": 8739, "loss": 1.3347, "learning_rate": 2.590809758465995e-05, "epoch": 0.546973337910516, "percentage": 54.7, "elapsed_time": "6:42:29", "remaining_time": "5:33:21", "throughput": 1621.45, "total_tokens": 39157760} +{"current_steps": 4790, "total_steps": 8739, "loss": 1.0816, "learning_rate": 2.580667161173753e-05, "epoch": 0.5481176335965213, "percentage": 54.81, "elapsed_time": "6:43:22", "remaining_time": "5:32:33", "throughput": 1621.29, "total_tokens": 39239680} +{"current_steps": 4800, "total_steps": 8739, "loss": 1.072, "learning_rate": 2.570523234571642e-05, "epoch": 0.5492619292825266, "percentage": 54.93, "elapsed_time": "6:44:16", "remaining_time": "5:31:45", "throughput": 1621.1, "total_tokens": 39321600} +{"current_steps": 4810, "total_steps": 8739, "loss": 1.105, "learning_rate": 2.5603781458208885e-05, "epoch": 0.5504062249685319, "percentage": 55.04, "elapsed_time": "6:45:09", "remaining_time": "5:30:56", "throughput": 1620.93, "total_tokens": 39403520} +{"current_steps": 4820, "total_steps": 8739, "loss": 1.1652, "learning_rate": 2.5502320621018732e-05, "epoch": 0.5515505206545371, "percentage": 55.16, "elapsed_time": "6:46:02", "remaining_time": "5:30:08", "throughput": 1620.73, "total_tokens": 39485440} +{"current_steps": 4830, "total_steps": 8739, "loss": 1.2073, "learning_rate": 2.5400851506113728e-05, "epoch": 0.5526948163405424, "percentage": 55.27, "elapsed_time": "6:46:55", "remaining_time": "5:29:20", "throughput": 1620.56, "total_tokens": 39567360} +{"current_steps": 4840, "total_steps": 8739, "loss": 1.2457, "learning_rate": 2.5299375785598005e-05, "epoch": 0.5538391120265477, "percentage": 55.38, "elapsed_time": "6:47:48", "remaining_time": "5:28:31", "throughput": 1620.4, "total_tokens": 39649280} +{"current_steps": 4850, "total_steps": 8739, "loss": 1.3313, "learning_rate": 2.519789513168459e-05, "epoch": 0.554983407712553, "percentage": 55.5, "elapsed_time": "6:48:42", "remaining_time": "5:27:43", "throughput": 1620.2, "total_tokens": 39731200} +{"current_steps": 4860, "total_steps": 8739, "loss": 1.1312, "learning_rate": 2.509641121666781e-05, "epoch": 0.5561277033985582, "percentage": 55.61, "elapsed_time": "6:49:35", "remaining_time": "5:26:54", "throughput": 1620.04, "total_tokens": 39813120} +{"current_steps": 4870, "total_steps": 8739, "loss": 1.1891, "learning_rate": 2.4994925712895697e-05, "epoch": 0.5572719990845635, "percentage": 55.73, "elapsed_time": "6:50:28", "remaining_time": "5:26:06", "throughput": 1619.88, "total_tokens": 39895040} +{"current_steps": 4880, "total_steps": 8739, "loss": 1.4017, "learning_rate": 2.489344029274249e-05, "epoch": 0.5584162947705688, "percentage": 55.84, "elapsed_time": "6:51:22", "remaining_time": "5:25:18", "throughput": 1619.67, "total_tokens": 39976960} +{"current_steps": 4890, "total_steps": 8739, "loss": 1.1554, "learning_rate": 2.479195662858105e-05, "epoch": 0.559560590456574, "percentage": 55.96, "elapsed_time": "6:52:15", "remaining_time": "5:24:29", "throughput": 1619.49, "total_tokens": 40058880} +{"current_steps": 4900, "total_steps": 8739, "loss": 1.3402, "learning_rate": 2.4690476392755298e-05, "epoch": 0.5607048861425793, "percentage": 56.07, "elapsed_time": "6:53:08", "remaining_time": "5:23:41", "throughput": 1619.33, "total_tokens": 40140800} +{"current_steps": 4910, "total_steps": 8739, "loss": 1.288, "learning_rate": 2.4589001257552637e-05, "epoch": 0.5618491818285845, "percentage": 56.18, "elapsed_time": "6:54:01", "remaining_time": "5:22:52", "throughput": 1619.15, "total_tokens": 40222720} +{"current_steps": 4920, "total_steps": 8739, "loss": 1.2969, "learning_rate": 2.4487532895176457e-05, "epoch": 0.5629934775145897, "percentage": 56.3, "elapsed_time": "6:54:55", "remaining_time": "5:22:04", "throughput": 1618.95, "total_tokens": 40304640} +{"current_steps": 4930, "total_steps": 8739, "loss": 1.346, "learning_rate": 2.4386072977718503e-05, "epoch": 0.564137773200595, "percentage": 56.41, "elapsed_time": "6:55:48", "remaining_time": "5:21:15", "throughput": 1618.79, "total_tokens": 40386560} +{"current_steps": 4940, "total_steps": 8739, "loss": 1.2043, "learning_rate": 2.4284623177131395e-05, "epoch": 0.5652820688866003, "percentage": 56.53, "elapsed_time": "6:56:41", "remaining_time": "5:20:27", "throughput": 1618.62, "total_tokens": 40468480} +{"current_steps": 4950, "total_steps": 8739, "loss": 1.1418, "learning_rate": 2.4183185165200998e-05, "epoch": 0.5664263645726055, "percentage": 56.64, "elapsed_time": "6:57:35", "remaining_time": "5:19:38", "throughput": 1618.42, "total_tokens": 40550400} +{"current_steps": 4960, "total_steps": 8739, "loss": 1.0886, "learning_rate": 2.4081760613518924e-05, "epoch": 0.5675706602586108, "percentage": 56.76, "elapsed_time": "6:58:28", "remaining_time": "5:18:50", "throughput": 1618.27, "total_tokens": 40632320} +{"current_steps": 4970, "total_steps": 8739, "loss": 1.3159, "learning_rate": 2.3980351193455e-05, "epoch": 0.5687149559446161, "percentage": 56.87, "elapsed_time": "6:59:21", "remaining_time": "5:18:01", "throughput": 1618.1, "total_tokens": 40714240} +{"current_steps": 4980, "total_steps": 8739, "loss": 1.2942, "learning_rate": 2.3878958576129664e-05, "epoch": 0.5698592516306213, "percentage": 56.99, "elapsed_time": "7:00:14", "remaining_time": "5:17:12", "throughput": 1617.93, "total_tokens": 40796160} +{"current_steps": 4990, "total_steps": 8739, "loss": 1.3472, "learning_rate": 2.3777584432386474e-05, "epoch": 0.5710035473166266, "percentage": 57.1, "elapsed_time": "7:01:08", "remaining_time": "5:16:24", "throughput": 1617.74, "total_tokens": 40878080} +{"current_steps": 5000, "total_steps": 8739, "loss": 1.1461, "learning_rate": 2.367623043276459e-05, "epoch": 0.5721478430026319, "percentage": 57.21, "elapsed_time": "7:02:02", "remaining_time": "5:15:35", "throughput": 1617.55, "total_tokens": 40960000} +{"current_steps": 5010, "total_steps": 8739, "loss": 0.997, "learning_rate": 2.3574898247471167e-05, "epoch": 0.5732921386886372, "percentage": 57.33, "elapsed_time": "7:03:10", "remaining_time": "5:14:58", "throughput": 1616.41, "total_tokens": 41041920} +{"current_steps": 5020, "total_steps": 8739, "loss": 1.2608, "learning_rate": 2.347358954635393e-05, "epoch": 0.5744364343746424, "percentage": 57.44, "elapsed_time": "7:04:04", "remaining_time": "5:14:10", "throughput": 1616.23, "total_tokens": 41123840} +{"current_steps": 5030, "total_steps": 8739, "loss": 1.1886, "learning_rate": 2.337230599887358e-05, "epoch": 0.5755807300606477, "percentage": 57.56, "elapsed_time": "7:04:57", "remaining_time": "5:13:21", "throughput": 1616.09, "total_tokens": 41205760} +{"current_steps": 5040, "total_steps": 8739, "loss": 1.2545, "learning_rate": 2.327104927407634e-05, "epoch": 0.576725025746653, "percentage": 57.67, "elapsed_time": "7:05:50", "remaining_time": "5:12:32", "throughput": 1615.91, "total_tokens": 41287680} +{"current_steps": 5050, "total_steps": 8739, "loss": 1.0687, "learning_rate": 2.3169821040566387e-05, "epoch": 0.5778693214326582, "percentage": 57.79, "elapsed_time": "7:06:44", "remaining_time": "5:11:43", "throughput": 1615.72, "total_tokens": 41369600} +{"current_steps": 5060, "total_steps": 8739, "loss": 1.1071, "learning_rate": 2.306862296647841e-05, "epoch": 0.5790136171186635, "percentage": 57.9, "elapsed_time": "7:07:37", "remaining_time": "5:10:54", "throughput": 1615.57, "total_tokens": 41451520} +{"current_steps": 5070, "total_steps": 8739, "loss": 1.0824, "learning_rate": 2.2967456719450127e-05, "epoch": 0.5801579128046688, "percentage": 58.02, "elapsed_time": "7:08:30", "remaining_time": "5:10:06", "throughput": 1615.4, "total_tokens": 41533440} +{"current_steps": 5080, "total_steps": 8739, "loss": 1.451, "learning_rate": 2.2866323966594736e-05, "epoch": 0.581302208490674, "percentage": 58.13, "elapsed_time": "7:09:23", "remaining_time": "5:09:17", "throughput": 1615.27, "total_tokens": 41615360} +{"current_steps": 5090, "total_steps": 8739, "loss": 1.2207, "learning_rate": 2.2765226374473504e-05, "epoch": 0.5824465041766792, "percentage": 58.24, "elapsed_time": "7:10:17", "remaining_time": "5:08:28", "throughput": 1615.08, "total_tokens": 41697280} +{"current_steps": 5100, "total_steps": 8739, "loss": 1.1504, "learning_rate": 2.2664165609068304e-05, "epoch": 0.5835907998626845, "percentage": 58.36, "elapsed_time": "7:11:10", "remaining_time": "5:07:39", "throughput": 1614.92, "total_tokens": 41779200} +{"current_steps": 5110, "total_steps": 8739, "loss": 1.1436, "learning_rate": 2.2563143335754118e-05, "epoch": 0.5847350955486897, "percentage": 58.47, "elapsed_time": "7:12:04", "remaining_time": "5:06:50", "throughput": 1614.76, "total_tokens": 41861120} +{"current_steps": 5120, "total_steps": 8739, "loss": 1.5087, "learning_rate": 2.2462161219271622e-05, "epoch": 0.585879391234695, "percentage": 58.59, "elapsed_time": "7:12:57", "remaining_time": "5:06:01", "throughput": 1614.59, "total_tokens": 41943040} +{"current_steps": 5130, "total_steps": 8739, "loss": 1.2635, "learning_rate": 2.236122092369977e-05, "epoch": 0.5870236869207003, "percentage": 58.7, "elapsed_time": "7:13:50", "remaining_time": "5:05:12", "throughput": 1614.43, "total_tokens": 42024960} +{"current_steps": 5140, "total_steps": 8739, "loss": 1.4867, "learning_rate": 2.2260324112428336e-05, "epoch": 0.5881679826067056, "percentage": 58.82, "elapsed_time": "7:14:44", "remaining_time": "5:04:23", "throughput": 1614.27, "total_tokens": 42106880} +{"current_steps": 5150, "total_steps": 8739, "loss": 1.2188, "learning_rate": 2.2159472448130513e-05, "epoch": 0.5893122782927108, "percentage": 58.93, "elapsed_time": "7:15:37", "remaining_time": "5:03:34", "throughput": 1614.12, "total_tokens": 42188800} +{"current_steps": 5160, "total_steps": 8739, "loss": 1.3696, "learning_rate": 2.2058667592735532e-05, "epoch": 0.5904565739787161, "percentage": 59.05, "elapsed_time": "7:16:30", "remaining_time": "5:02:45", "throughput": 1613.96, "total_tokens": 42270720} +{"current_steps": 5170, "total_steps": 8739, "loss": 1.6279, "learning_rate": 2.1957911207401267e-05, "epoch": 0.5916008696647214, "percentage": 59.16, "elapsed_time": "7:17:24", "remaining_time": "5:01:57", "throughput": 1613.74, "total_tokens": 42352640} +{"current_steps": 5180, "total_steps": 8739, "loss": 1.521, "learning_rate": 2.1857204952486824e-05, "epoch": 0.5927451653507266, "percentage": 59.27, "elapsed_time": "7:18:17", "remaining_time": "5:01:08", "throughput": 1613.61, "total_tokens": 42434560} +{"current_steps": 5190, "total_steps": 8739, "loss": 1.3385, "learning_rate": 2.1756550487525247e-05, "epoch": 0.5938894610367319, "percentage": 59.39, "elapsed_time": "7:19:11", "remaining_time": "5:00:19", "throughput": 1613.44, "total_tokens": 42516480} +{"current_steps": 5200, "total_steps": 8739, "loss": 1.1232, "learning_rate": 2.165594947119613e-05, "epoch": 0.5950337567227372, "percentage": 59.5, "elapsed_time": "7:20:04", "remaining_time": "4:59:30", "throughput": 1613.29, "total_tokens": 42598400} +{"current_steps": 5210, "total_steps": 8739, "loss": 1.3692, "learning_rate": 2.1555403561298287e-05, "epoch": 0.5961780524087424, "percentage": 59.62, "elapsed_time": "7:20:58", "remaining_time": "4:58:41", "throughput": 1613.13, "total_tokens": 42680320} +{"current_steps": 5220, "total_steps": 8739, "loss": 1.2656, "learning_rate": 2.1454914414722417e-05, "epoch": 0.5973223480947477, "percentage": 59.73, "elapsed_time": "7:21:51", "remaining_time": "4:57:52", "throughput": 1612.98, "total_tokens": 42762240} +{"current_steps": 5230, "total_steps": 8739, "loss": 1.2838, "learning_rate": 2.135448368742385e-05, "epoch": 0.598466643780753, "percentage": 59.85, "elapsed_time": "7:22:45", "remaining_time": "4:57:03", "throughput": 1612.8, "total_tokens": 42844160} +{"current_steps": 5240, "total_steps": 8739, "loss": 1.2797, "learning_rate": 2.1254113034395212e-05, "epoch": 0.5996109394667583, "percentage": 59.96, "elapsed_time": "7:23:37", "remaining_time": "4:56:14", "throughput": 1612.67, "total_tokens": 42926080} +{"current_steps": 5250, "total_steps": 8739, "loss": 1.2836, "learning_rate": 2.1153804109639157e-05, "epoch": 0.6007552351527635, "percentage": 60.08, "elapsed_time": "7:24:30", "remaining_time": "4:55:24", "throughput": 1612.54, "total_tokens": 43008000} +{"current_steps": 5260, "total_steps": 8739, "loss": 1.1154, "learning_rate": 2.105355856614115e-05, "epoch": 0.6018995308387688, "percentage": 60.19, "elapsed_time": "7:25:23", "remaining_time": "4:54:35", "throughput": 1612.42, "total_tokens": 43089920} +{"current_steps": 5270, "total_steps": 8739, "loss": 1.3152, "learning_rate": 2.0953378055842183e-05, "epoch": 0.603043826524774, "percentage": 60.3, "elapsed_time": "7:26:16", "remaining_time": "4:53:45", "throughput": 1612.29, "total_tokens": 43171840} +{"current_steps": 5280, "total_steps": 8739, "loss": 0.9663, "learning_rate": 2.0853264229611557e-05, "epoch": 0.6041881222107792, "percentage": 60.42, "elapsed_time": "7:27:09", "remaining_time": "4:52:56", "throughput": 1612.15, "total_tokens": 43253760} +{"current_steps": 5290, "total_steps": 8739, "loss": 1.0387, "learning_rate": 2.075321873721972e-05, "epoch": 0.6053324178967845, "percentage": 60.53, "elapsed_time": "7:28:03", "remaining_time": "4:52:07", "throughput": 1612.0, "total_tokens": 43335680} +{"current_steps": 5300, "total_steps": 8739, "loss": 1.3762, "learning_rate": 2.0653243227311014e-05, "epoch": 0.6064767135827898, "percentage": 60.65, "elapsed_time": "7:28:56", "remaining_time": "4:51:18", "throughput": 1611.86, "total_tokens": 43417600} +{"current_steps": 5310, "total_steps": 8739, "loss": 1.187, "learning_rate": 2.0553339347376592e-05, "epoch": 0.607621009268795, "percentage": 60.76, "elapsed_time": "7:29:49", "remaining_time": "4:50:28", "throughput": 1611.73, "total_tokens": 43499520} +{"current_steps": 5320, "total_steps": 8739, "loss": 1.0539, "learning_rate": 2.045350874372717e-05, "epoch": 0.6087653049548003, "percentage": 60.88, "elapsed_time": "7:30:42", "remaining_time": "4:49:39", "throughput": 1611.57, "total_tokens": 43581440} +{"current_steps": 5330, "total_steps": 8739, "loss": 1.3189, "learning_rate": 2.0353753061465972e-05, "epoch": 0.6099096006408056, "percentage": 60.99, "elapsed_time": "7:31:35", "remaining_time": "4:48:50", "throughput": 1611.44, "total_tokens": 43663360} +{"current_steps": 5340, "total_steps": 8739, "loss": 1.2721, "learning_rate": 2.0254073944461603e-05, "epoch": 0.6110538963268108, "percentage": 61.11, "elapsed_time": "7:32:29", "remaining_time": "4:48:01", "throughput": 1611.27, "total_tokens": 43745280} +{"current_steps": 5350, "total_steps": 8739, "loss": 1.1475, "learning_rate": 2.0154473035320936e-05, "epoch": 0.6121981920128161, "percentage": 61.22, "elapsed_time": "7:33:23", "remaining_time": "4:47:12", "throughput": 1611.1, "total_tokens": 43827200} +{"current_steps": 5360, "total_steps": 8739, "loss": 1.2035, "learning_rate": 2.0054951975362067e-05, "epoch": 0.6133424876988214, "percentage": 61.33, "elapsed_time": "7:34:16", "remaining_time": "4:46:22", "throughput": 1610.96, "total_tokens": 43909120} +{"current_steps": 5370, "total_steps": 8739, "loss": 1.1699, "learning_rate": 1.995551240458728e-05, "epoch": 0.6144867833848267, "percentage": 61.45, "elapsed_time": "7:35:09", "remaining_time": "4:45:33", "throughput": 1610.83, "total_tokens": 43991040} +{"current_steps": 5380, "total_steps": 8739, "loss": 1.2418, "learning_rate": 1.985615596165597e-05, "epoch": 0.6156310790708319, "percentage": 61.56, "elapsed_time": "7:36:02", "remaining_time": "4:44:43", "throughput": 1610.71, "total_tokens": 44072960} +{"current_steps": 5390, "total_steps": 8739, "loss": 1.4331, "learning_rate": 1.9756884283857685e-05, "epoch": 0.6167753747568372, "percentage": 61.68, "elapsed_time": "7:36:55", "remaining_time": "4:43:54", "throughput": 1610.58, "total_tokens": 44154880} +{"current_steps": 5400, "total_steps": 8739, "loss": 1.3412, "learning_rate": 1.965769900708515e-05, "epoch": 0.6179196704428425, "percentage": 61.79, "elapsed_time": "7:37:48", "remaining_time": "4:43:04", "throughput": 1610.44, "total_tokens": 44236800} +{"current_steps": 5410, "total_steps": 8739, "loss": 1.1733, "learning_rate": 1.955860176580729e-05, "epoch": 0.6190639661288477, "percentage": 61.91, "elapsed_time": "7:38:41", "remaining_time": "4:42:15", "throughput": 1610.31, "total_tokens": 44318720} +{"current_steps": 5420, "total_steps": 8739, "loss": 1.2493, "learning_rate": 1.945959419304226e-05, "epoch": 0.620208261814853, "percentage": 62.02, "elapsed_time": "7:39:35", "remaining_time": "4:41:25", "throughput": 1610.17, "total_tokens": 44400640} +{"current_steps": 5430, "total_steps": 8739, "loss": 1.2361, "learning_rate": 1.936067792033061e-05, "epoch": 0.6213525575008583, "percentage": 62.14, "elapsed_time": "7:40:28", "remaining_time": "4:40:36", "throughput": 1610.05, "total_tokens": 44482560} +{"current_steps": 5440, "total_steps": 8739, "loss": 1.2999, "learning_rate": 1.9261854577708366e-05, "epoch": 0.6224968531868634, "percentage": 62.25, "elapsed_time": "7:41:21", "remaining_time": "4:39:47", "throughput": 1609.9, "total_tokens": 44564480} +{"current_steps": 5450, "total_steps": 8739, "loss": 1.4174, "learning_rate": 1.9163125793680125e-05, "epoch": 0.6236411488728687, "percentage": 62.36, "elapsed_time": "7:42:14", "remaining_time": "4:38:57", "throughput": 1609.77, "total_tokens": 44646400} +{"current_steps": 5460, "total_steps": 8739, "loss": 1.0868, "learning_rate": 1.9064493195192293e-05, "epoch": 0.624785444558874, "percentage": 62.48, "elapsed_time": "7:43:07", "remaining_time": "4:38:07", "throughput": 1609.66, "total_tokens": 44728320} +{"current_steps": 5470, "total_steps": 8739, "loss": 1.1703, "learning_rate": 1.8965958407606236e-05, "epoch": 0.6259297402448792, "percentage": 62.59, "elapsed_time": "7:43:59", "remaining_time": "4:37:17", "throughput": 1609.56, "total_tokens": 44810240} +{"current_steps": 5480, "total_steps": 8739, "loss": 1.2942, "learning_rate": 1.8867523054671475e-05, "epoch": 0.6270740359308845, "percentage": 62.71, "elapsed_time": "7:44:53", "remaining_time": "4:36:28", "throughput": 1609.43, "total_tokens": 44892160} +{"current_steps": 5490, "total_steps": 8739, "loss": 1.1778, "learning_rate": 1.8769188758498973e-05, "epoch": 0.6282183316168898, "percentage": 62.82, "elapsed_time": "7:45:46", "remaining_time": "4:35:39", "throughput": 1609.27, "total_tokens": 44974080} +{"current_steps": 5500, "total_steps": 8739, "loss": 1.2899, "learning_rate": 1.867095713953439e-05, "epoch": 0.629362627302895, "percentage": 62.94, "elapsed_time": "7:46:39", "remaining_time": "4:34:49", "throughput": 1609.15, "total_tokens": 45056000} +{"current_steps": 5510, "total_steps": 8739, "loss": 1.2486, "learning_rate": 1.8572829816531364e-05, "epoch": 0.6305069229889003, "percentage": 63.05, "elapsed_time": "7:47:33", "remaining_time": "4:34:00", "throughput": 1608.99, "total_tokens": 45137920} +{"current_steps": 5520, "total_steps": 8739, "loss": 1.2433, "learning_rate": 1.847480840652483e-05, "epoch": 0.6316512186749056, "percentage": 63.17, "elapsed_time": "7:48:26", "remaining_time": "4:33:10", "throughput": 1608.86, "total_tokens": 45219840} +{"current_steps": 5530, "total_steps": 8739, "loss": 1.2503, "learning_rate": 1.8376894524804416e-05, "epoch": 0.6327955143609109, "percentage": 63.28, "elapsed_time": "7:49:19", "remaining_time": "4:32:20", "throughput": 1608.75, "total_tokens": 45301760} +{"current_steps": 5540, "total_steps": 8739, "loss": 1.3593, "learning_rate": 1.827908978488779e-05, "epoch": 0.6339398100469161, "percentage": 63.39, "elapsed_time": "7:50:13", "remaining_time": "4:31:31", "throughput": 1608.61, "total_tokens": 45383680} +{"current_steps": 5550, "total_steps": 8739, "loss": 1.3471, "learning_rate": 1.8181395798494048e-05, "epoch": 0.6350841057329214, "percentage": 63.51, "elapsed_time": "7:51:06", "remaining_time": "4:30:41", "throughput": 1608.48, "total_tokens": 45465600} +{"current_steps": 5560, "total_steps": 8739, "loss": 1.3265, "learning_rate": 1.8083814175517234e-05, "epoch": 0.6362284014189267, "percentage": 63.62, "elapsed_time": "7:52:00", "remaining_time": "4:29:52", "throughput": 1608.31, "total_tokens": 45547520} +{"current_steps": 5570, "total_steps": 8739, "loss": 1.6024, "learning_rate": 1.798634652399972e-05, "epoch": 0.6373726971049319, "percentage": 63.74, "elapsed_time": "7:52:53", "remaining_time": "4:29:03", "throughput": 1608.15, "total_tokens": 45629440} +{"current_steps": 5580, "total_steps": 8739, "loss": 1.2416, "learning_rate": 1.7888994450105788e-05, "epoch": 0.6385169927909372, "percentage": 63.85, "elapsed_time": "7:53:46", "remaining_time": "4:28:13", "throughput": 1608.04, "total_tokens": 45711360} +{"current_steps": 5590, "total_steps": 8739, "loss": 1.3582, "learning_rate": 1.7791759558095077e-05, "epoch": 0.6396612884769425, "percentage": 63.97, "elapsed_time": "7:54:40", "remaining_time": "4:27:23", "throughput": 1607.91, "total_tokens": 45793280} +{"current_steps": 5600, "total_steps": 8739, "loss": 1.4037, "learning_rate": 1.7694643450296216e-05, "epoch": 0.6408055841629478, "percentage": 64.08, "elapsed_time": "7:55:33", "remaining_time": "4:26:33", "throughput": 1607.77, "total_tokens": 45875200} +{"current_steps": 5610, "total_steps": 8739, "loss": 1.3859, "learning_rate": 1.7597647727080408e-05, "epoch": 0.641949879848953, "percentage": 64.19, "elapsed_time": "7:56:26", "remaining_time": "4:25:44", "throughput": 1607.64, "total_tokens": 45957120} +{"current_steps": 5620, "total_steps": 8739, "loss": 1.0984, "learning_rate": 1.7500773986835013e-05, "epoch": 0.6430941755349582, "percentage": 64.31, "elapsed_time": "7:57:19", "remaining_time": "4:24:54", "throughput": 1607.52, "total_tokens": 46039040} +{"current_steps": 5630, "total_steps": 8739, "loss": 1.3061, "learning_rate": 1.740402382593727e-05, "epoch": 0.6442384712209634, "percentage": 64.42, "elapsed_time": "7:58:13", "remaining_time": "4:24:05", "throughput": 1607.37, "total_tokens": 46120960} +{"current_steps": 5640, "total_steps": 8739, "loss": 1.0178, "learning_rate": 1.730739883872795e-05, "epoch": 0.6453827669069687, "percentage": 64.54, "elapsed_time": "7:59:06", "remaining_time": "4:23:15", "throughput": 1607.25, "total_tokens": 46202880} +{"current_steps": 5650, "total_steps": 8739, "loss": 1.2927, "learning_rate": 1.7210900617485075e-05, "epoch": 0.646527062592974, "percentage": 64.65, "elapsed_time": "7:59:59", "remaining_time": "4:22:25", "throughput": 1607.13, "total_tokens": 46284800} +{"current_steps": 5660, "total_steps": 8739, "loss": 1.205, "learning_rate": 1.711453075239773e-05, "epoch": 0.6476713582789793, "percentage": 64.77, "elapsed_time": "8:00:52", "remaining_time": "4:21:35", "throughput": 1607.01, "total_tokens": 46366720} +{"current_steps": 5670, "total_steps": 8739, "loss": 1.378, "learning_rate": 1.7018290831539795e-05, "epoch": 0.6488156539649845, "percentage": 64.88, "elapsed_time": "8:01:46", "remaining_time": "4:20:45", "throughput": 1606.88, "total_tokens": 46448640} +{"current_steps": 5680, "total_steps": 8739, "loss": 1.0102, "learning_rate": 1.6922182440843843e-05, "epoch": 0.6499599496509898, "percentage": 65.0, "elapsed_time": "8:02:39", "remaining_time": "4:19:56", "throughput": 1606.76, "total_tokens": 46530560} +{"current_steps": 5690, "total_steps": 8739, "loss": 1.2101, "learning_rate": 1.6826207164074924e-05, "epoch": 0.6511042453369951, "percentage": 65.11, "elapsed_time": "8:03:32", "remaining_time": "4:19:06", "throughput": 1606.65, "total_tokens": 46612480} +{"current_steps": 5700, "total_steps": 8739, "loss": 1.1996, "learning_rate": 1.6730366582804535e-05, "epoch": 0.6522485410230003, "percentage": 65.22, "elapsed_time": "8:04:24", "remaining_time": "4:18:16", "throughput": 1606.56, "total_tokens": 46694400} +{"current_steps": 5710, "total_steps": 8739, "loss": 1.2356, "learning_rate": 1.6634662276384548e-05, "epoch": 0.6533928367090056, "percentage": 65.34, "elapsed_time": "8:05:18", "remaining_time": "4:17:26", "throughput": 1606.44, "total_tokens": 46776320} +{"current_steps": 5720, "total_steps": 8739, "loss": 1.2006, "learning_rate": 1.6539095821921136e-05, "epoch": 0.6545371323950109, "percentage": 65.45, "elapsed_time": "8:06:11", "remaining_time": "4:16:36", "throughput": 1606.31, "total_tokens": 46858240} +{"current_steps": 5730, "total_steps": 8739, "loss": 1.2621, "learning_rate": 1.6443668794248828e-05, "epoch": 0.6556814280810161, "percentage": 65.57, "elapsed_time": "8:07:04", "remaining_time": "4:15:46", "throughput": 1606.21, "total_tokens": 46940160} +{"current_steps": 5740, "total_steps": 8739, "loss": 1.0727, "learning_rate": 1.6348382765904567e-05, "epoch": 0.6568257237670214, "percentage": 65.68, "elapsed_time": "8:07:57", "remaining_time": "4:14:56", "throughput": 1606.09, "total_tokens": 47022080} +{"current_steps": 5750, "total_steps": 8739, "loss": 1.212, "learning_rate": 1.6253239307101748e-05, "epoch": 0.6579700194530267, "percentage": 65.8, "elapsed_time": "8:08:50", "remaining_time": "4:14:06", "throughput": 1605.97, "total_tokens": 47104000} +{"current_steps": 5760, "total_steps": 8739, "loss": 1.3306, "learning_rate": 1.6158239985704378e-05, "epoch": 0.659114315139032, "percentage": 65.91, "elapsed_time": "8:09:43", "remaining_time": "4:13:16", "throughput": 1605.84, "total_tokens": 47185920} +{"current_steps": 5770, "total_steps": 8739, "loss": 1.0573, "learning_rate": 1.606338636720125e-05, "epoch": 0.6602586108250372, "percentage": 66.03, "elapsed_time": "8:10:37", "remaining_time": "4:12:27", "throughput": 1605.73, "total_tokens": 47267840} +{"current_steps": 5780, "total_steps": 8739, "loss": 1.4235, "learning_rate": 1.5968680014680105e-05, "epoch": 0.6614029065110425, "percentage": 66.14, "elapsed_time": "8:11:30", "remaining_time": "4:11:37", "throughput": 1605.6, "total_tokens": 47349760} +{"current_steps": 5790, "total_steps": 8739, "loss": 1.1993, "learning_rate": 1.5874122488801888e-05, "epoch": 0.6625472021970478, "percentage": 66.25, "elapsed_time": "8:12:23", "remaining_time": "4:10:47", "throughput": 1605.48, "total_tokens": 47431680} +{"current_steps": 5800, "total_steps": 8739, "loss": 1.1437, "learning_rate": 1.577971534777507e-05, "epoch": 0.6636914978830529, "percentage": 66.37, "elapsed_time": "8:13:16", "remaining_time": "4:09:57", "throughput": 1605.36, "total_tokens": 47513600} +{"current_steps": 5810, "total_steps": 8739, "loss": 1.2579, "learning_rate": 1.5685460147329917e-05, "epoch": 0.6648357935690582, "percentage": 66.48, "elapsed_time": "8:14:10", "remaining_time": "4:09:07", "throughput": 1605.23, "total_tokens": 47595520} +{"current_steps": 5820, "total_steps": 8739, "loss": 1.2693, "learning_rate": 1.5591358440692865e-05, "epoch": 0.6659800892550635, "percentage": 66.6, "elapsed_time": "8:15:02", "remaining_time": "4:08:17", "throughput": 1605.14, "total_tokens": 47677440} +{"current_steps": 5830, "total_steps": 8739, "loss": 1.1159, "learning_rate": 1.5497411778560954e-05, "epoch": 0.6671243849410687, "percentage": 66.71, "elapsed_time": "8:15:56", "remaining_time": "4:07:27", "throughput": 1605.02, "total_tokens": 47759360} +{"current_steps": 5840, "total_steps": 8739, "loss": 1.1901, "learning_rate": 1.5403621709076247e-05, "epoch": 0.668268680627074, "percentage": 66.83, "elapsed_time": "8:16:49", "remaining_time": "4:06:37", "throughput": 1604.91, "total_tokens": 47841280} +{"current_steps": 5850, "total_steps": 8739, "loss": 1.4804, "learning_rate": 1.530998977780033e-05, "epoch": 0.6694129763130793, "percentage": 66.94, "elapsed_time": "8:17:43", "remaining_time": "4:05:47", "throughput": 1604.75, "total_tokens": 47923200} +{"current_steps": 5860, "total_steps": 8739, "loss": 1.1893, "learning_rate": 1.5216517527688818e-05, "epoch": 0.6705572719990845, "percentage": 67.06, "elapsed_time": "8:18:36", "remaining_time": "4:04:58", "throughput": 1604.62, "total_tokens": 48005120} +{"current_steps": 5870, "total_steps": 8739, "loss": 1.085, "learning_rate": 1.5123206499065967e-05, "epoch": 0.6717015676850898, "percentage": 67.17, "elapsed_time": "8:19:30", "remaining_time": "4:04:08", "throughput": 1604.5, "total_tokens": 48087040} +{"current_steps": 5880, "total_steps": 8739, "loss": 1.0382, "learning_rate": 1.5030058229599275e-05, "epoch": 0.6728458633710951, "percentage": 67.28, "elapsed_time": "8:20:23", "remaining_time": "4:03:18", "throughput": 1604.38, "total_tokens": 48168960} +{"current_steps": 5890, "total_steps": 8739, "loss": 1.3036, "learning_rate": 1.4937074254274117e-05, "epoch": 0.6739901590571004, "percentage": 67.4, "elapsed_time": "8:21:16", "remaining_time": "4:02:28", "throughput": 1604.25, "total_tokens": 48250880} +{"current_steps": 5900, "total_steps": 8739, "loss": 1.3465, "learning_rate": 1.4844256105368504e-05, "epoch": 0.6751344547431056, "percentage": 67.51, "elapsed_time": "8:22:09", "remaining_time": "4:01:38", "throughput": 1604.14, "total_tokens": 48332800} +{"current_steps": 5910, "total_steps": 8739, "loss": 1.4707, "learning_rate": 1.4751605312427786e-05, "epoch": 0.6762787504291109, "percentage": 67.63, "elapsed_time": "8:23:02", "remaining_time": "4:00:47", "throughput": 1604.04, "total_tokens": 48414720} +{"current_steps": 5920, "total_steps": 8739, "loss": 1.1061, "learning_rate": 1.4659123402239454e-05, "epoch": 0.6774230461151162, "percentage": 67.74, "elapsed_time": "8:23:56", "remaining_time": "3:59:57", "throughput": 1603.93, "total_tokens": 48496640} +{"current_steps": 5930, "total_steps": 8739, "loss": 1.2819, "learning_rate": 1.4566811898808013e-05, "epoch": 0.6785673418011214, "percentage": 67.86, "elapsed_time": "8:24:49", "remaining_time": "3:59:07", "throughput": 1603.82, "total_tokens": 48578560} +{"current_steps": 5940, "total_steps": 8739, "loss": 1.4707, "learning_rate": 1.4474672323329819e-05, "epoch": 0.6797116374871267, "percentage": 67.97, "elapsed_time": "8:25:42", "remaining_time": "3:58:17", "throughput": 1603.7, "total_tokens": 48660480} +{"current_steps": 5950, "total_steps": 8739, "loss": 1.4235, "learning_rate": 1.4382706194168066e-05, "epoch": 0.680855933173132, "percentage": 68.09, "elapsed_time": "8:26:35", "remaining_time": "3:57:27", "throughput": 1603.59, "total_tokens": 48742400} +{"current_steps": 5960, "total_steps": 8739, "loss": 1.2991, "learning_rate": 1.42909150268277e-05, "epoch": 0.6820002288591372, "percentage": 68.2, "elapsed_time": "8:27:29", "remaining_time": "3:56:37", "throughput": 1603.46, "total_tokens": 48824320} +{"current_steps": 5970, "total_steps": 8739, "loss": 1.0258, "learning_rate": 1.4199300333930515e-05, "epoch": 0.6831445245451425, "percentage": 68.31, "elapsed_time": "8:28:22", "remaining_time": "3:55:47", "throughput": 1603.34, "total_tokens": 48906240} +{"current_steps": 5980, "total_steps": 8739, "loss": 1.2446, "learning_rate": 1.4107863625190163e-05, "epoch": 0.6842888202311477, "percentage": 68.43, "elapsed_time": "8:29:16", "remaining_time": "3:54:57", "throughput": 1603.22, "total_tokens": 48988160} +{"current_steps": 5990, "total_steps": 8739, "loss": 1.2735, "learning_rate": 1.4016606407387312e-05, "epoch": 0.685433115917153, "percentage": 68.54, "elapsed_time": "8:30:09", "remaining_time": "3:54:07", "throughput": 1603.09, "total_tokens": 49070080} +{"current_steps": 6000, "total_steps": 8739, "loss": 1.3767, "learning_rate": 1.3925530184344818e-05, "epoch": 0.6865774116031582, "percentage": 68.66, "elapsed_time": "8:31:02", "remaining_time": "3:53:17", "throughput": 1603.0, "total_tokens": 49152000} +{"current_steps": 6010, "total_steps": 8739, "loss": 1.4241, "learning_rate": 1.3834636456902944e-05, "epoch": 0.6877217072891635, "percentage": 68.77, "elapsed_time": "8:32:01", "remaining_time": "3:52:30", "throughput": 1602.57, "total_tokens": 49233920} +{"current_steps": 6020, "total_steps": 8739, "loss": 1.1986, "learning_rate": 1.3743926722894579e-05, "epoch": 0.6888660029751688, "percentage": 68.89, "elapsed_time": "8:32:54", "remaining_time": "3:51:39", "throughput": 1602.48, "total_tokens": 49315840} +{"current_steps": 6030, "total_steps": 8739, "loss": 0.9731, "learning_rate": 1.365340247712064e-05, "epoch": 0.690010298661174, "percentage": 69.0, "elapsed_time": "8:33:47", "remaining_time": "3:50:49", "throughput": 1602.38, "total_tokens": 49397760} +{"current_steps": 6040, "total_steps": 8739, "loss": 1.2101, "learning_rate": 1.3563065211325349e-05, "epoch": 0.6911545943471793, "percentage": 69.12, "elapsed_time": "8:34:41", "remaining_time": "3:49:59", "throughput": 1602.27, "total_tokens": 49479680} +{"current_steps": 6050, "total_steps": 8739, "loss": 1.0661, "learning_rate": 1.3472916414171738e-05, "epoch": 0.6922988900331846, "percentage": 69.23, "elapsed_time": "8:35:34", "remaining_time": "3:49:09", "throughput": 1602.16, "total_tokens": 49561600} +{"current_steps": 6060, "total_steps": 8739, "loss": 1.2239, "learning_rate": 1.338295757121703e-05, "epoch": 0.6934431857191898, "percentage": 69.34, "elapsed_time": "8:36:27", "remaining_time": "3:48:18", "throughput": 1602.07, "total_tokens": 49643520} +{"current_steps": 6070, "total_steps": 8739, "loss": 1.3588, "learning_rate": 1.3293190164888242e-05, "epoch": 0.6945874814051951, "percentage": 69.46, "elapsed_time": "8:37:20", "remaining_time": "3:47:28", "throughput": 1601.96, "total_tokens": 49725440} +{"current_steps": 6080, "total_steps": 8739, "loss": 1.1447, "learning_rate": 1.3203615674457709e-05, "epoch": 0.6957317770912004, "percentage": 69.57, "elapsed_time": "8:38:14", "remaining_time": "3:46:38", "throughput": 1601.83, "total_tokens": 49807360} +{"current_steps": 6090, "total_steps": 8739, "loss": 1.3927, "learning_rate": 1.3114235576018686e-05, "epoch": 0.6968760727772056, "percentage": 69.69, "elapsed_time": "8:39:07", "remaining_time": "3:45:48", "throughput": 1601.72, "total_tokens": 49889280} +{"current_steps": 6100, "total_steps": 8739, "loss": 1.2068, "learning_rate": 1.3025051342461087e-05, "epoch": 0.6980203684632109, "percentage": 69.8, "elapsed_time": "8:40:00", "remaining_time": "3:44:57", "throughput": 1601.64, "total_tokens": 49971200} +{"current_steps": 6110, "total_steps": 8739, "loss": 1.5996, "learning_rate": 1.2936064443447157e-05, "epoch": 0.6991646641492162, "percentage": 69.92, "elapsed_time": "8:40:53", "remaining_time": "3:44:07", "throughput": 1601.54, "total_tokens": 50053120} +{"current_steps": 6120, "total_steps": 8739, "loss": 1.0368, "learning_rate": 1.2847276345387299e-05, "epoch": 0.7003089598352215, "percentage": 70.03, "elapsed_time": "8:41:46", "remaining_time": "3:43:17", "throughput": 1601.44, "total_tokens": 50135040} +{"current_steps": 6130, "total_steps": 8739, "loss": 1.3925, "learning_rate": 1.2758688511415848e-05, "epoch": 0.7014532555212267, "percentage": 70.15, "elapsed_time": "8:42:39", "remaining_time": "3:42:26", "throughput": 1601.35, "total_tokens": 50216960} +{"current_steps": 6140, "total_steps": 8739, "loss": 1.1923, "learning_rate": 1.2670302401367035e-05, "epoch": 0.702597551207232, "percentage": 70.26, "elapsed_time": "8:43:32", "remaining_time": "3:41:36", "throughput": 1601.25, "total_tokens": 50298880} +{"current_steps": 6150, "total_steps": 8739, "loss": 1.3158, "learning_rate": 1.2582119471750888e-05, "epoch": 0.7037418468932373, "percentage": 70.37, "elapsed_time": "8:44:25", "remaining_time": "3:40:46", "throughput": 1601.12, "total_tokens": 50380800} +{"current_steps": 6160, "total_steps": 8739, "loss": 1.1663, "learning_rate": 1.2494141175729216e-05, "epoch": 0.7048861425792424, "percentage": 70.49, "elapsed_time": "8:45:18", "remaining_time": "3:39:55", "throughput": 1601.04, "total_tokens": 50462720} +{"current_steps": 6170, "total_steps": 8739, "loss": 1.1836, "learning_rate": 1.240636896309168e-05, "epoch": 0.7060304382652477, "percentage": 70.6, "elapsed_time": "8:46:11", "remaining_time": "3:39:05", "throughput": 1600.93, "total_tokens": 50544640} +{"current_steps": 6180, "total_steps": 8739, "loss": 1.3311, "learning_rate": 1.2318804280231939e-05, "epoch": 0.707174733951253, "percentage": 70.72, "elapsed_time": "8:47:05", "remaining_time": "3:38:15", "throughput": 1600.83, "total_tokens": 50626560} +{"current_steps": 6190, "total_steps": 8739, "loss": 1.1546, "learning_rate": 1.2231448570123732e-05, "epoch": 0.7083190296372582, "percentage": 70.83, "elapsed_time": "8:47:58", "remaining_time": "3:37:24", "throughput": 1600.73, "total_tokens": 50708480} +{"current_steps": 6200, "total_steps": 8739, "loss": 1.1482, "learning_rate": 1.2144303272297186e-05, "epoch": 0.7094633253232635, "percentage": 70.95, "elapsed_time": "8:48:51", "remaining_time": "3:36:34", "throughput": 1600.64, "total_tokens": 50790400} +{"current_steps": 6210, "total_steps": 8739, "loss": 1.2103, "learning_rate": 1.2057369822815051e-05, "epoch": 0.7106076210092688, "percentage": 71.06, "elapsed_time": "8:49:44", "remaining_time": "3:35:44", "throughput": 1600.53, "total_tokens": 50872320} +{"current_steps": 6220, "total_steps": 8739, "loss": 1.5064, "learning_rate": 1.1970649654249017e-05, "epoch": 0.711751916695274, "percentage": 71.18, "elapsed_time": "8:50:38", "remaining_time": "3:34:53", "throughput": 1600.41, "total_tokens": 50954240} +{"current_steps": 6230, "total_steps": 8739, "loss": 1.3582, "learning_rate": 1.1884144195656133e-05, "epoch": 0.7128962123812793, "percentage": 71.29, "elapsed_time": "8:51:31", "remaining_time": "3:34:03", "throughput": 1600.32, "total_tokens": 51036160} +{"current_steps": 6240, "total_steps": 8739, "loss": 1.3876, "learning_rate": 1.1797854872555272e-05, "epoch": 0.7140405080672846, "percentage": 71.4, "elapsed_time": "8:52:24", "remaining_time": "3:33:13", "throughput": 1600.22, "total_tokens": 51118080} +{"current_steps": 6250, "total_steps": 8739, "loss": 1.07, "learning_rate": 1.171178310690362e-05, "epoch": 0.7151848037532899, "percentage": 71.52, "elapsed_time": "8:53:17", "remaining_time": "3:32:22", "throughput": 1600.11, "total_tokens": 51200000} +{"current_steps": 6260, "total_steps": 8739, "loss": 1.2047, "learning_rate": 1.1625930317073221e-05, "epoch": 0.7163290994392951, "percentage": 71.63, "elapsed_time": "8:54:11", "remaining_time": "3:31:32", "throughput": 1600.01, "total_tokens": 51281920} +{"current_steps": 6270, "total_steps": 8739, "loss": 1.2819, "learning_rate": 1.154029791782765e-05, "epoch": 0.7174733951253004, "percentage": 71.75, "elapsed_time": "8:55:04", "remaining_time": "3:30:41", "throughput": 1599.92, "total_tokens": 51363840} +{"current_steps": 6280, "total_steps": 8739, "loss": 1.2803, "learning_rate": 1.1454887320298686e-05, "epoch": 0.7186176908113057, "percentage": 71.86, "elapsed_time": "8:55:56", "remaining_time": "3:29:51", "throughput": 1599.83, "total_tokens": 51445760} +{"current_steps": 6290, "total_steps": 8739, "loss": 1.1276, "learning_rate": 1.1369699931963018e-05, "epoch": 0.7197619864973109, "percentage": 71.98, "elapsed_time": "8:56:49", "remaining_time": "3:29:00", "throughput": 1599.75, "total_tokens": 51527680} +{"current_steps": 6300, "total_steps": 8739, "loss": 1.1392, "learning_rate": 1.1284737156619096e-05, "epoch": 0.7209062821833162, "percentage": 72.09, "elapsed_time": "8:57:43", "remaining_time": "3:28:10", "throughput": 1599.64, "total_tokens": 51609600} +{"current_steps": 6310, "total_steps": 8739, "loss": 1.1951, "learning_rate": 1.1200000394363996e-05, "epoch": 0.7220505778693215, "percentage": 72.21, "elapsed_time": "8:58:36", "remaining_time": "3:27:20", "throughput": 1599.54, "total_tokens": 51691520} +{"current_steps": 6320, "total_steps": 8739, "loss": 1.0797, "learning_rate": 1.1115491041570337e-05, "epoch": 0.7231948735553267, "percentage": 72.32, "elapsed_time": "8:59:29", "remaining_time": "3:26:29", "throughput": 1599.45, "total_tokens": 51773440} +{"current_steps": 6330, "total_steps": 8739, "loss": 1.3091, "learning_rate": 1.103121049086324e-05, "epoch": 0.724339169241332, "percentage": 72.43, "elapsed_time": "9:00:22", "remaining_time": "3:25:39", "throughput": 1599.34, "total_tokens": 51855360} +{"current_steps": 6340, "total_steps": 8739, "loss": 1.1386, "learning_rate": 1.094716013109745e-05, "epoch": 0.7254834649273372, "percentage": 72.55, "elapsed_time": "9:01:15", "remaining_time": "3:24:48", "throughput": 1599.26, "total_tokens": 51937280} +{"current_steps": 6350, "total_steps": 8739, "loss": 1.2296, "learning_rate": 1.0863341347334376e-05, "epoch": 0.7266277606133424, "percentage": 72.66, "elapsed_time": "9:02:08", "remaining_time": "3:23:58", "throughput": 1599.17, "total_tokens": 52019200} +{"current_steps": 6360, "total_steps": 8739, "loss": 1.2027, "learning_rate": 1.0779755520819302e-05, "epoch": 0.7277720562993477, "percentage": 72.78, "elapsed_time": "9:03:01", "remaining_time": "3:23:07", "throughput": 1599.09, "total_tokens": 52101120} +{"current_steps": 6370, "total_steps": 8739, "loss": 1.1153, "learning_rate": 1.0696404028958634e-05, "epoch": 0.728916351985353, "percentage": 72.89, "elapsed_time": "9:03:54", "remaining_time": "3:22:16", "throughput": 1599.0, "total_tokens": 52183040} +{"current_steps": 6380, "total_steps": 8739, "loss": 1.097, "learning_rate": 1.0613288245297193e-05, "epoch": 0.7300606476713583, "percentage": 73.01, "elapsed_time": "9:04:47", "remaining_time": "3:21:26", "throughput": 1598.91, "total_tokens": 52264960} +{"current_steps": 6390, "total_steps": 8739, "loss": 1.2608, "learning_rate": 1.053040953949557e-05, "epoch": 0.7312049433573635, "percentage": 73.12, "elapsed_time": "9:05:40", "remaining_time": "3:20:35", "throughput": 1598.82, "total_tokens": 52346880} +{"current_steps": 6400, "total_steps": 8739, "loss": 1.0397, "learning_rate": 1.0447769277307554e-05, "epoch": 0.7323492390433688, "percentage": 73.23, "elapsed_time": "9:06:34", "remaining_time": "3:19:45", "throughput": 1598.72, "total_tokens": 52428800} +{"current_steps": 6410, "total_steps": 8739, "loss": 1.0589, "learning_rate": 1.0365368820557633e-05, "epoch": 0.7334935347293741, "percentage": 73.35, "elapsed_time": "9:07:27", "remaining_time": "3:18:54", "throughput": 1598.62, "total_tokens": 52510720} +{"current_steps": 6420, "total_steps": 8739, "loss": 1.0307, "learning_rate": 1.0283209527118584e-05, "epoch": 0.7346378304153793, "percentage": 73.46, "elapsed_time": "9:08:20", "remaining_time": "3:18:04", "throughput": 1598.54, "total_tokens": 52592640} +{"current_steps": 6430, "total_steps": 8739, "loss": 1.3241, "learning_rate": 1.0201292750889022e-05, "epoch": 0.7357821261013846, "percentage": 73.58, "elapsed_time": "9:09:13", "remaining_time": "3:17:13", "throughput": 1598.44, "total_tokens": 52674560} +{"current_steps": 6440, "total_steps": 8739, "loss": 1.1761, "learning_rate": 1.011961984177117e-05, "epoch": 0.7369264217873899, "percentage": 73.69, "elapsed_time": "9:10:06", "remaining_time": "3:16:23", "throughput": 1598.35, "total_tokens": 52756480} +{"current_steps": 6450, "total_steps": 8739, "loss": 1.0847, "learning_rate": 1.0038192145648567e-05, "epoch": 0.7380707174733951, "percentage": 73.81, "elapsed_time": "9:10:59", "remaining_time": "3:15:32", "throughput": 1598.27, "total_tokens": 52838400} +{"current_steps": 6460, "total_steps": 8739, "loss": 1.1278, "learning_rate": 9.95701100436389e-06, "epoch": 0.7392150131594004, "percentage": 73.92, "elapsed_time": "9:11:52", "remaining_time": "3:14:41", "throughput": 1598.19, "total_tokens": 52920320} +{"current_steps": 6470, "total_steps": 8739, "loss": 1.2579, "learning_rate": 9.876077755696868e-06, "epoch": 0.7403593088454057, "percentage": 74.04, "elapsed_time": "9:12:45", "remaining_time": "3:13:51", "throughput": 1598.1, "total_tokens": 53002240} +{"current_steps": 6480, "total_steps": 8739, "loss": 1.3319, "learning_rate": 9.795393733342203e-06, "epoch": 0.741503604531411, "percentage": 74.15, "elapsed_time": "9:13:39", "remaining_time": "3:13:00", "throughput": 1598.0, "total_tokens": 53084160} +{"current_steps": 6490, "total_steps": 8739, "loss": 1.4099, "learning_rate": 9.71496026688763e-06, "epoch": 0.7426479002174162, "percentage": 74.26, "elapsed_time": "9:14:32", "remaining_time": "3:12:10", "throughput": 1597.9, "total_tokens": 53166080} +{"current_steps": 6500, "total_steps": 8739, "loss": 1.2894, "learning_rate": 9.634778681791962e-06, "epoch": 0.7437921959034215, "percentage": 74.38, "elapsed_time": "9:15:25", "remaining_time": "3:11:19", "throughput": 1597.8, "total_tokens": 53248000} +{"current_steps": 6510, "total_steps": 8739, "loss": 1.4331, "learning_rate": 9.554850299363294e-06, "epoch": 0.7449364915894267, "percentage": 74.49, "elapsed_time": "9:16:19", "remaining_time": "3:10:29", "throughput": 1597.68, "total_tokens": 53329920} +{"current_steps": 6520, "total_steps": 8739, "loss": 1.1623, "learning_rate": 9.47517643673721e-06, "epoch": 0.7460807872754319, "percentage": 74.61, "elapsed_time": "9:17:12", "remaining_time": "3:09:38", "throughput": 1597.58, "total_tokens": 53411840} +{"current_steps": 6530, "total_steps": 8739, "loss": 1.195, "learning_rate": 9.395758406855053e-06, "epoch": 0.7472250829614372, "percentage": 74.72, "elapsed_time": "9:18:06", "remaining_time": "3:08:47", "throughput": 1597.49, "total_tokens": 53493760} +{"current_steps": 6540, "total_steps": 8739, "loss": 1.2136, "learning_rate": 9.31659751844232e-06, "epoch": 0.7483693786474425, "percentage": 74.84, "elapsed_time": "9:18:59", "remaining_time": "3:07:57", "throughput": 1597.4, "total_tokens": 53575680} +{"current_steps": 6550, "total_steps": 8739, "loss": 1.476, "learning_rate": 9.237695075987106e-06, "epoch": 0.7495136743334477, "percentage": 74.95, "elapsed_time": "9:19:52", "remaining_time": "3:07:06", "throughput": 1597.29, "total_tokens": 53657600} +{"current_steps": 6560, "total_steps": 8739, "loss": 1.3678, "learning_rate": 9.15905237971856e-06, "epoch": 0.750657970019453, "percentage": 75.07, "elapsed_time": "9:20:45", "remaining_time": "3:06:15", "throughput": 1597.21, "total_tokens": 53739520} +{"current_steps": 6570, "total_steps": 8739, "loss": 1.4367, "learning_rate": 9.080670725585511e-06, "epoch": 0.7518022657054583, "percentage": 75.18, "elapsed_time": "9:21:39", "remaining_time": "3:05:25", "throughput": 1597.08, "total_tokens": 53821440} +{"current_steps": 6580, "total_steps": 8739, "loss": 1.2801, "learning_rate": 9.002551405235082e-06, "epoch": 0.7529465613914635, "percentage": 75.29, "elapsed_time": "9:22:32", "remaining_time": "3:04:34", "throughput": 1597.0, "total_tokens": 53903360} +{"current_steps": 6590, "total_steps": 8739, "loss": 1.4574, "learning_rate": 8.924695705991407e-06, "epoch": 0.7540908570774688, "percentage": 75.41, "elapsed_time": "9:23:26", "remaining_time": "3:03:44", "throughput": 1596.9, "total_tokens": 53985280} +{"current_steps": 6600, "total_steps": 8739, "loss": 1.4978, "learning_rate": 8.847104910834414e-06, "epoch": 0.7552351527634741, "percentage": 75.52, "elapsed_time": "9:24:19", "remaining_time": "3:02:53", "throughput": 1596.81, "total_tokens": 54067200} +{"current_steps": 6610, "total_steps": 8739, "loss": 1.277, "learning_rate": 8.769780298378705e-06, "epoch": 0.7563794484494794, "percentage": 75.64, "elapsed_time": "9:25:12", "remaining_time": "3:02:02", "throughput": 1596.72, "total_tokens": 54149120} +{"current_steps": 6620, "total_steps": 8739, "loss": 1.0243, "learning_rate": 8.69272314285248e-06, "epoch": 0.7575237441354846, "percentage": 75.75, "elapsed_time": "9:26:06", "remaining_time": "3:01:12", "throughput": 1596.62, "total_tokens": 54231040} +{"current_steps": 6630, "total_steps": 8739, "loss": 1.2217, "learning_rate": 8.6159347140765e-06, "epoch": 0.7586680398214899, "percentage": 75.87, "elapsed_time": "9:26:59", "remaining_time": "3:00:21", "throughput": 1596.53, "total_tokens": 54312960} +{"current_steps": 6640, "total_steps": 8739, "loss": 1.2161, "learning_rate": 8.539416277443218e-06, "epoch": 0.7598123355074952, "percentage": 75.98, "elapsed_time": "9:27:52", "remaining_time": "2:59:30", "throughput": 1596.44, "total_tokens": 54394880} +{"current_steps": 6650, "total_steps": 8739, "loss": 1.069, "learning_rate": 8.463169093895887e-06, "epoch": 0.7609566311935004, "percentage": 76.1, "elapsed_time": "9:28:46", "remaining_time": "2:58:40", "throughput": 1596.34, "total_tokens": 54476800} +{"current_steps": 6660, "total_steps": 8739, "loss": 1.5262, "learning_rate": 8.38719441990781e-06, "epoch": 0.7621009268795057, "percentage": 76.21, "elapsed_time": "9:29:39", "remaining_time": "2:57:49", "throughput": 1596.25, "total_tokens": 54558720} +{"current_steps": 6670, "total_steps": 8739, "loss": 1.3362, "learning_rate": 8.311493507461593e-06, "epoch": 0.763245222565511, "percentage": 76.32, "elapsed_time": "9:30:32", "remaining_time": "2:56:58", "throughput": 1596.18, "total_tokens": 54640640} +{"current_steps": 6680, "total_steps": 8739, "loss": 1.2781, "learning_rate": 8.236067604028563e-06, "epoch": 0.7643895182515162, "percentage": 76.44, "elapsed_time": "9:31:25", "remaining_time": "2:56:07", "throughput": 1596.09, "total_tokens": 54722560} +{"current_steps": 6690, "total_steps": 8739, "loss": 1.4282, "learning_rate": 8.160917952548197e-06, "epoch": 0.7655338139375214, "percentage": 76.55, "elapsed_time": "9:32:18", "remaining_time": "2:55:17", "throughput": 1596.02, "total_tokens": 54804480} +{"current_steps": 6700, "total_steps": 8739, "loss": 1.2766, "learning_rate": 8.08604579140759e-06, "epoch": 0.7666781096235267, "percentage": 76.67, "elapsed_time": "9:33:11", "remaining_time": "2:54:26", "throughput": 1595.92, "total_tokens": 54886400} +{"current_steps": 6710, "total_steps": 8739, "loss": 1.4154, "learning_rate": 8.011452354421136e-06, "epoch": 0.7678224053095319, "percentage": 76.78, "elapsed_time": "9:34:05", "remaining_time": "2:53:35", "throughput": 1595.82, "total_tokens": 54968320} +{"current_steps": 6720, "total_steps": 8739, "loss": 0.9568, "learning_rate": 7.937138870810115e-06, "epoch": 0.7689667009955372, "percentage": 76.9, "elapsed_time": "9:34:58", "remaining_time": "2:52:45", "throughput": 1595.71, "total_tokens": 55050240} +{"current_steps": 6730, "total_steps": 8739, "loss": 1.4689, "learning_rate": 7.863106565182474e-06, "epoch": 0.7701109966815425, "percentage": 77.01, "elapsed_time": "9:35:52", "remaining_time": "2:51:54", "throughput": 1595.6, "total_tokens": 55132160} +{"current_steps": 6740, "total_steps": 8739, "loss": 1.3219, "learning_rate": 7.78935665751266e-06, "epoch": 0.7712552923675478, "percentage": 77.13, "elapsed_time": "9:36:45", "remaining_time": "2:51:03", "throughput": 1595.51, "total_tokens": 55214080} +{"current_steps": 6750, "total_steps": 8739, "loss": 1.1528, "learning_rate": 7.715890363121484e-06, "epoch": 0.772399588053553, "percentage": 77.24, "elapsed_time": "9:37:38", "remaining_time": "2:50:12", "throughput": 1595.45, "total_tokens": 55296000} +{"current_steps": 6760, "total_steps": 8739, "loss": 1.129, "learning_rate": 7.642708892656125e-06, "epoch": 0.7735438837395583, "percentage": 77.35, "elapsed_time": "9:38:31", "remaining_time": "2:49:21", "throughput": 1595.36, "total_tokens": 55377920} +{"current_steps": 6770, "total_steps": 8739, "loss": 1.0879, "learning_rate": 7.569813452070146e-06, "epoch": 0.7746881794255636, "percentage": 77.47, "elapsed_time": "9:39:25", "remaining_time": "2:48:31", "throughput": 1595.28, "total_tokens": 55459840} +{"current_steps": 6780, "total_steps": 8739, "loss": 1.2824, "learning_rate": 7.497205242603636e-06, "epoch": 0.7758324751115688, "percentage": 77.58, "elapsed_time": "9:40:18", "remaining_time": "2:47:40", "throughput": 1595.18, "total_tokens": 55541760} +{"current_steps": 6790, "total_steps": 8739, "loss": 1.2056, "learning_rate": 7.424885460763442e-06, "epoch": 0.7769767707975741, "percentage": 77.7, "elapsed_time": "9:41:11", "remaining_time": "2:46:49", "throughput": 1595.09, "total_tokens": 55623680} +{"current_steps": 6800, "total_steps": 8739, "loss": 1.2665, "learning_rate": 7.3528552983033985e-06, "epoch": 0.7781210664835794, "percentage": 77.81, "elapsed_time": "9:42:05", "remaining_time": "2:45:58", "throughput": 1595.0, "total_tokens": 55705600} +{"current_steps": 6810, "total_steps": 8739, "loss": 1.0662, "learning_rate": 7.281115942204739e-06, "epoch": 0.7792653621695846, "percentage": 77.93, "elapsed_time": "9:42:58", "remaining_time": "2:45:08", "throughput": 1594.9, "total_tokens": 55787520} +{"current_steps": 6820, "total_steps": 8739, "loss": 1.1699, "learning_rate": 7.209668574656514e-06, "epoch": 0.7804096578555899, "percentage": 78.04, "elapsed_time": "9:43:51", "remaining_time": "2:44:17", "throughput": 1594.83, "total_tokens": 55869440} +{"current_steps": 6830, "total_steps": 8739, "loss": 1.3507, "learning_rate": 7.138514373036098e-06, "epoch": 0.7815539535415952, "percentage": 78.16, "elapsed_time": "9:44:44", "remaining_time": "2:43:26", "throughput": 1594.74, "total_tokens": 55951360} +{"current_steps": 6840, "total_steps": 8739, "loss": 1.3175, "learning_rate": 7.0676545098897956e-06, "epoch": 0.7826982492276005, "percentage": 78.27, "elapsed_time": "9:45:38", "remaining_time": "2:42:35", "throughput": 1594.65, "total_tokens": 56033280} +{"current_steps": 6850, "total_steps": 8739, "loss": 1.1614, "learning_rate": 6.997090152913535e-06, "epoch": 0.7838425449136057, "percentage": 78.38, "elapsed_time": "9:46:31", "remaining_time": "2:41:44", "throughput": 1594.59, "total_tokens": 56115200} +{"current_steps": 6860, "total_steps": 8739, "loss": 1.0802, "learning_rate": 6.92682246493363e-06, "epoch": 0.784986840599611, "percentage": 78.5, "elapsed_time": "9:47:23", "remaining_time": "2:40:53", "throughput": 1594.53, "total_tokens": 56197120} +{"current_steps": 6870, "total_steps": 8739, "loss": 1.2859, "learning_rate": 6.856852603887556e-06, "epoch": 0.7861311362856161, "percentage": 78.61, "elapsed_time": "9:48:16", "remaining_time": "2:40:02", "throughput": 1594.44, "total_tokens": 56279040} +{"current_steps": 6880, "total_steps": 8739, "loss": 1.0909, "learning_rate": 6.787181722804959e-06, "epoch": 0.7872754319716214, "percentage": 78.73, "elapsed_time": "9:49:10", "remaining_time": "2:39:11", "throughput": 1594.34, "total_tokens": 56360960} +{"current_steps": 6890, "total_steps": 8739, "loss": 1.2816, "learning_rate": 6.717810969788596e-06, "epoch": 0.7884197276576267, "percentage": 78.84, "elapsed_time": "9:50:03", "remaining_time": "2:38:20", "throughput": 1594.27, "total_tokens": 56442880} +{"current_steps": 6900, "total_steps": 8739, "loss": 1.036, "learning_rate": 6.648741487995416e-06, "epoch": 0.789564023343632, "percentage": 78.96, "elapsed_time": "9:50:56", "remaining_time": "2:37:29", "throughput": 1594.19, "total_tokens": 56524800} +{"current_steps": 6910, "total_steps": 8739, "loss": 0.9993, "learning_rate": 6.57997441561774e-06, "epoch": 0.7907083190296372, "percentage": 79.07, "elapsed_time": "9:51:49", "remaining_time": "2:36:39", "throughput": 1594.11, "total_tokens": 56606720} +{"current_steps": 6920, "total_steps": 8739, "loss": 1.1192, "learning_rate": 6.511510885864516e-06, "epoch": 0.7918526147156425, "percentage": 79.19, "elapsed_time": "9:52:43", "remaining_time": "2:35:48", "throughput": 1594.02, "total_tokens": 56688640} +{"current_steps": 6930, "total_steps": 8739, "loss": 1.3028, "learning_rate": 6.44335202694262e-06, "epoch": 0.7929969104016478, "percentage": 79.3, "elapsed_time": "9:53:36", "remaining_time": "2:34:57", "throughput": 1593.93, "total_tokens": 56770560} +{"current_steps": 6940, "total_steps": 8739, "loss": 1.4295, "learning_rate": 6.375498962038265e-06, "epoch": 0.794141206087653, "percentage": 79.41, "elapsed_time": "9:54:30", "remaining_time": "2:34:06", "throughput": 1593.84, "total_tokens": 56852480} +{"current_steps": 6950, "total_steps": 8739, "loss": 1.503, "learning_rate": 6.307952809298517e-06, "epoch": 0.7952855017736583, "percentage": 79.53, "elapsed_time": "9:55:23", "remaining_time": "2:33:15", "throughput": 1593.75, "total_tokens": 56934400} +{"current_steps": 6960, "total_steps": 8739, "loss": 1.1341, "learning_rate": 6.240714681812837e-06, "epoch": 0.7964297974596636, "percentage": 79.64, "elapsed_time": "9:56:16", "remaining_time": "2:32:24", "throughput": 1593.67, "total_tokens": 57016320} +{"current_steps": 6970, "total_steps": 8739, "loss": 1.14, "learning_rate": 6.173785687594761e-06, "epoch": 0.7975740931456688, "percentage": 79.76, "elapsed_time": "9:57:10", "remaining_time": "2:31:33", "throughput": 1593.58, "total_tokens": 57098240} +{"current_steps": 6980, "total_steps": 8739, "loss": 1.2954, "learning_rate": 6.107166929563629e-06, "epoch": 0.7987183888316741, "percentage": 79.87, "elapsed_time": "9:58:03", "remaining_time": "2:30:42", "throughput": 1593.52, "total_tokens": 57180160} +{"current_steps": 6990, "total_steps": 8739, "loss": 1.3446, "learning_rate": 6.040859505526439e-06, "epoch": 0.7998626845176794, "percentage": 79.99, "elapsed_time": "9:58:56", "remaining_time": "2:29:51", "throughput": 1593.44, "total_tokens": 57262080} +{"current_steps": 7000, "total_steps": 8739, "loss": 1.0721, "learning_rate": 5.974864508159692e-06, "epoch": 0.8010069802036847, "percentage": 80.1, "elapsed_time": "9:59:49", "remaining_time": "2:29:00", "throughput": 1593.36, "total_tokens": 57344000} +{"current_steps": 7010, "total_steps": 8739, "loss": 1.3073, "learning_rate": 5.9091830249914685e-06, "epoch": 0.8021512758896899, "percentage": 80.22, "elapsed_time": "10:00:53", "remaining_time": "2:28:12", "throughput": 1592.79, "total_tokens": 57425920} +{"current_steps": 7020, "total_steps": 8739, "loss": 1.3409, "learning_rate": 5.843816138383429e-06, "epoch": 0.8032955715756952, "percentage": 80.33, "elapsed_time": "10:01:47", "remaining_time": "2:27:21", "throughput": 1592.69, "total_tokens": 57507840} +{"current_steps": 7030, "total_steps": 8739, "loss": 1.3687, "learning_rate": 5.778764925513045e-06, "epoch": 0.8044398672617005, "percentage": 80.44, "elapsed_time": "10:02:40", "remaining_time": "2:26:30", "throughput": 1592.61, "total_tokens": 57589760} +{"current_steps": 7040, "total_steps": 8739, "loss": 1.099, "learning_rate": 5.714030458355784e-06, "epoch": 0.8055841629477057, "percentage": 80.56, "elapsed_time": "10:03:33", "remaining_time": "2:25:39", "throughput": 1592.54, "total_tokens": 57671680} +{"current_steps": 7050, "total_steps": 8739, "loss": 1.3109, "learning_rate": 5.649613803667511e-06, "epoch": 0.8067284586337109, "percentage": 80.67, "elapsed_time": "10:04:27", "remaining_time": "2:24:48", "throughput": 1592.44, "total_tokens": 57753600} +{"current_steps": 7060, "total_steps": 8739, "loss": 1.2747, "learning_rate": 5.5855160229668636e-06, "epoch": 0.8078727543197162, "percentage": 80.79, "elapsed_time": "10:05:20", "remaining_time": "2:23:57", "throughput": 1592.38, "total_tokens": 57835520} +{"current_steps": 7070, "total_steps": 8739, "loss": 1.2696, "learning_rate": 5.5217381725177624e-06, "epoch": 0.8090170500057214, "percentage": 80.9, "elapsed_time": "10:06:13", "remaining_time": "2:23:06", "throughput": 1592.3, "total_tokens": 57917440} +{"current_steps": 7080, "total_steps": 8739, "loss": 1.1509, "learning_rate": 5.458281303312016e-06, "epoch": 0.8101613456917267, "percentage": 81.02, "elapsed_time": "10:07:07", "remaining_time": "2:22:15", "throughput": 1592.2, "total_tokens": 57999360} +{"current_steps": 7090, "total_steps": 8739, "loss": 1.2708, "learning_rate": 5.39514646105202e-06, "epoch": 0.811305641377732, "percentage": 81.13, "elapsed_time": "10:08:00", "remaining_time": "2:21:24", "throughput": 1592.12, "total_tokens": 58081280} +{"current_steps": 7100, "total_steps": 8739, "loss": 1.4797, "learning_rate": 5.332334686133475e-06, "epoch": 0.8124499370637372, "percentage": 81.24, "elapsed_time": "10:08:54", "remaining_time": "2:20:33", "throughput": 1592.01, "total_tokens": 58163200} +{"current_steps": 7110, "total_steps": 8739, "loss": 1.192, "learning_rate": 5.269847013628299e-06, "epoch": 0.8135942327497425, "percentage": 81.36, "elapsed_time": "10:09:47", "remaining_time": "2:19:42", "throughput": 1591.93, "total_tokens": 58245120} +{"current_steps": 7120, "total_steps": 8739, "loss": 1.5395, "learning_rate": 5.207684473267527e-06, "epoch": 0.8147385284357478, "percentage": 81.47, "elapsed_time": "10:10:40", "remaining_time": "2:18:51", "throughput": 1591.87, "total_tokens": 58327040} +{"current_steps": 7130, "total_steps": 8739, "loss": 1.2233, "learning_rate": 5.145848089424374e-06, "epoch": 0.8158828241217531, "percentage": 81.59, "elapsed_time": "10:11:33", "remaining_time": "2:18:00", "throughput": 1591.79, "total_tokens": 58408960} +{"current_steps": 7140, "total_steps": 8739, "loss": 1.4877, "learning_rate": 5.0843388810973195e-06, "epoch": 0.8170271198077583, "percentage": 81.7, "elapsed_time": "10:12:26", "remaining_time": "2:17:09", "throughput": 1591.74, "total_tokens": 58490880} +{"current_steps": 7150, "total_steps": 8739, "loss": 1.1406, "learning_rate": 5.02315786189334e-06, "epoch": 0.8181714154937636, "percentage": 81.82, "elapsed_time": "10:13:20", "remaining_time": "2:16:18", "throughput": 1591.65, "total_tokens": 58572800} +{"current_steps": 7160, "total_steps": 8739, "loss": 1.1193, "learning_rate": 4.962306040011222e-06, "epoch": 0.8193157111797689, "percentage": 81.93, "elapsed_time": "10:14:13", "remaining_time": "2:15:27", "throughput": 1591.57, "total_tokens": 58654720} +{"current_steps": 7170, "total_steps": 8739, "loss": 1.0802, "learning_rate": 4.901784418224892e-06, "epoch": 0.8204600068657741, "percentage": 82.05, "elapsed_time": "10:15:06", "remaining_time": "2:14:36", "throughput": 1591.49, "total_tokens": 58736640} +{"current_steps": 7180, "total_steps": 8739, "loss": 1.0499, "learning_rate": 4.841593993866949e-06, "epoch": 0.8216043025517794, "percentage": 82.16, "elapsed_time": "10:15:59", "remaining_time": "2:13:45", "throughput": 1591.42, "total_tokens": 58818560} +{"current_steps": 7190, "total_steps": 8739, "loss": 1.2981, "learning_rate": 4.781735758812217e-06, "epoch": 0.8227485982377847, "percentage": 82.27, "elapsed_time": "10:16:52", "remaining_time": "2:12:53", "throughput": 1591.35, "total_tokens": 58900480} +{"current_steps": 7200, "total_steps": 8739, "loss": 1.1535, "learning_rate": 4.7222106994613655e-06, "epoch": 0.82389289392379, "percentage": 82.39, "elapsed_time": "10:17:46", "remaining_time": "2:12:02", "throughput": 1591.27, "total_tokens": 58982400} +{"current_steps": 7210, "total_steps": 8739, "loss": 1.2276, "learning_rate": 4.663019796724685e-06, "epoch": 0.8250371896097952, "percentage": 82.5, "elapsed_time": "10:18:39", "remaining_time": "2:11:11", "throughput": 1591.21, "total_tokens": 59064320} +{"current_steps": 7220, "total_steps": 8739, "loss": 1.3646, "learning_rate": 4.604164026005925e-06, "epoch": 0.8261814852958005, "percentage": 82.62, "elapsed_time": "10:19:32", "remaining_time": "2:10:20", "throughput": 1591.13, "total_tokens": 59146240} +{"current_steps": 7230, "total_steps": 8739, "loss": 1.3941, "learning_rate": 4.5456443571862185e-06, "epoch": 0.8273257809818056, "percentage": 82.73, "elapsed_time": "10:20:25", "remaining_time": "2:09:29", "throughput": 1591.05, "total_tokens": 59228160} +{"current_steps": 7240, "total_steps": 8739, "loss": 1.102, "learning_rate": 4.487461754608066e-06, "epoch": 0.8284700766678109, "percentage": 82.85, "elapsed_time": "10:21:18", "remaining_time": "2:08:38", "throughput": 1591.0, "total_tokens": 59310080} +{"current_steps": 7250, "total_steps": 8739, "loss": 1.167, "learning_rate": 4.429617177059508e-06, "epoch": 0.8296143723538162, "percentage": 82.96, "elapsed_time": "10:22:12", "remaining_time": "2:07:47", "throughput": 1590.91, "total_tokens": 59392000} +{"current_steps": 7260, "total_steps": 8739, "loss": 1.0619, "learning_rate": 4.372111577758261e-06, "epoch": 0.8307586680398215, "percentage": 83.08, "elapsed_time": "10:23:05", "remaining_time": "2:06:56", "throughput": 1590.84, "total_tokens": 59473920} +{"current_steps": 7270, "total_steps": 8739, "loss": 1.2679, "learning_rate": 4.314945904336037e-06, "epoch": 0.8319029637258267, "percentage": 83.19, "elapsed_time": "10:23:58", "remaining_time": "2:06:04", "throughput": 1590.78, "total_tokens": 59555840} +{"current_steps": 7280, "total_steps": 8739, "loss": 1.2982, "learning_rate": 4.258121098822945e-06, "epoch": 0.833047259411832, "percentage": 83.3, "elapsed_time": "10:24:51", "remaining_time": "2:05:13", "throughput": 1590.71, "total_tokens": 59637760} +{"current_steps": 7290, "total_steps": 8739, "loss": 1.2368, "learning_rate": 4.201638097631938e-06, "epoch": 0.8341915550978373, "percentage": 83.42, "elapsed_time": "10:25:44", "remaining_time": "2:04:22", "throughput": 1590.64, "total_tokens": 59719680} +{"current_steps": 7300, "total_steps": 8739, "loss": 0.9904, "learning_rate": 4.145497831543402e-06, "epoch": 0.8353358507838425, "percentage": 83.53, "elapsed_time": "10:26:37", "remaining_time": "2:03:31", "throughput": 1590.57, "total_tokens": 59801600} +{"current_steps": 7310, "total_steps": 8739, "loss": 1.186, "learning_rate": 4.089701225689793e-06, "epoch": 0.8364801464698478, "percentage": 83.65, "elapsed_time": "10:27:30", "remaining_time": "2:02:40", "throughput": 1590.5, "total_tokens": 59883520} +{"current_steps": 7320, "total_steps": 8739, "loss": 1.359, "learning_rate": 4.034249199540432e-06, "epoch": 0.8376244421558531, "percentage": 83.76, "elapsed_time": "10:28:23", "remaining_time": "2:01:48", "throughput": 1590.43, "total_tokens": 59965440} +{"current_steps": 7330, "total_steps": 8739, "loss": 1.1773, "learning_rate": 3.97914266688631e-06, "epoch": 0.8387687378418583, "percentage": 83.88, "elapsed_time": "10:29:17", "remaining_time": "2:00:57", "throughput": 1590.36, "total_tokens": 60047360} +{"current_steps": 7340, "total_steps": 8739, "loss": 1.2996, "learning_rate": 3.924382535825047e-06, "epoch": 0.8399130335278636, "percentage": 83.99, "elapsed_time": "10:30:10", "remaining_time": "2:00:06", "throughput": 1590.27, "total_tokens": 60129280} +{"current_steps": 7350, "total_steps": 8739, "loss": 1.1155, "learning_rate": 3.869969708745946e-06, "epoch": 0.8410573292138689, "percentage": 84.11, "elapsed_time": "10:31:03", "remaining_time": "1:59:15", "throughput": 1590.2, "total_tokens": 60211200} +{"current_steps": 7360, "total_steps": 8739, "loss": 1.058, "learning_rate": 3.815905082315102e-06, "epoch": 0.8422016248998742, "percentage": 84.22, "elapsed_time": "10:31:57", "remaining_time": "1:58:24", "throughput": 1590.13, "total_tokens": 60293120} +{"current_steps": 7370, "total_steps": 8739, "loss": 1.2502, "learning_rate": 3.762189547460615e-06, "epoch": 0.8433459205858794, "percentage": 84.33, "elapsed_time": "10:32:50", "remaining_time": "1:57:33", "throughput": 1590.07, "total_tokens": 60375040} +{"current_steps": 7380, "total_steps": 8739, "loss": 1.2315, "learning_rate": 3.7088239893579456e-06, "epoch": 0.8444902162718847, "percentage": 84.45, "elapsed_time": "10:33:43", "remaining_time": "1:56:41", "throughput": 1590.0, "total_tokens": 60456960} +{"current_steps": 7390, "total_steps": 8739, "loss": 1.46, "learning_rate": 3.655809287415285e-06, "epoch": 0.84563451195789, "percentage": 84.56, "elapsed_time": "10:34:37", "remaining_time": "1:55:50", "throughput": 1589.89, "total_tokens": 60538880} +{"current_steps": 7400, "total_steps": 8739, "loss": 1.2398, "learning_rate": 3.603146315259104e-06, "epoch": 0.8467788076438952, "percentage": 84.68, "elapsed_time": "10:35:36", "remaining_time": "1:55:00", "throughput": 1589.56, "total_tokens": 60620800} +{"current_steps": 7410, "total_steps": 8739, "loss": 1.2431, "learning_rate": 3.5508359407197157e-06, "epoch": 0.8479231033299004, "percentage": 84.79, "elapsed_time": "10:36:31", "remaining_time": "1:54:09", "throughput": 1589.42, "total_tokens": 60702720} +{"current_steps": 7420, "total_steps": 8739, "loss": 0.9851, "learning_rate": 3.4988790258170146e-06, "epoch": 0.8490673990159057, "percentage": 84.91, "elapsed_time": "10:37:24", "remaining_time": "1:53:18", "throughput": 1589.36, "total_tokens": 60784640} +{"current_steps": 7430, "total_steps": 8739, "loss": 1.1814, "learning_rate": 3.4472764267462486e-06, "epoch": 0.8502116947019109, "percentage": 85.02, "elapsed_time": "10:38:17", "remaining_time": "1:52:27", "throughput": 1589.33, "total_tokens": 60866560} +{"current_steps": 7440, "total_steps": 8739, "loss": 1.0398, "learning_rate": 3.396028993863906e-06, "epoch": 0.8513559903879162, "percentage": 85.14, "elapsed_time": "10:39:07", "remaining_time": "1:51:35", "throughput": 1589.39, "total_tokens": 60948480} +{"current_steps": 7450, "total_steps": 8739, "loss": 1.1797, "learning_rate": 3.3451375716737067e-06, "epoch": 0.8525002860739215, "percentage": 85.25, "elapsed_time": "10:39:51", "remaining_time": "1:50:42", "throughput": 1589.7, "total_tokens": 61030400} +{"current_steps": 7460, "total_steps": 8739, "loss": 1.3581, "learning_rate": 3.2946029988127068e-06, "epoch": 0.8536445817599267, "percentage": 85.36, "elapsed_time": "10:40:36", "remaining_time": "1:49:49", "throughput": 1589.94, "total_tokens": 61112320} +{"current_steps": 7470, "total_steps": 8739, "loss": 1.1539, "learning_rate": 3.2444261080374546e-06, "epoch": 0.854788877445932, "percentage": 85.48, "elapsed_time": "10:41:22", "remaining_time": "1:48:57", "throughput": 1590.17, "total_tokens": 61194240} +{"current_steps": 7480, "total_steps": 8739, "loss": 1.0741, "learning_rate": 3.194607726210261e-06, "epoch": 0.8559331731319373, "percentage": 85.59, "elapsed_time": "10:42:09", "remaining_time": "1:48:05", "throughput": 1590.38, "total_tokens": 61276160} +{"current_steps": 7490, "total_steps": 8739, "loss": 1.2566, "learning_rate": 3.1451486742856055e-06, "epoch": 0.8570774688179426, "percentage": 85.71, "elapsed_time": "10:42:57", "remaining_time": "1:47:13", "throughput": 1590.5, "total_tokens": 61358080} +{"current_steps": 7500, "total_steps": 8739, "loss": 1.2257, "learning_rate": 3.0960497672965825e-06, "epoch": 0.8582217645039478, "percentage": 85.82, "elapsed_time": "10:43:47", "remaining_time": "1:46:21", "throughput": 1590.59, "total_tokens": 61440000} +{"current_steps": 7510, "total_steps": 8739, "loss": 1.4217, "learning_rate": 3.0473118143414634e-06, "epoch": 0.8593660601899531, "percentage": 85.94, "elapsed_time": "10:44:33", "remaining_time": "1:45:28", "throughput": 1590.79, "total_tokens": 61521920} +{"current_steps": 7520, "total_steps": 8739, "loss": 1.4657, "learning_rate": 2.9989356185703975e-06, "epoch": 0.8605103558759584, "percentage": 86.05, "elapsed_time": "10:45:27", "remaining_time": "1:44:37", "throughput": 1590.68, "total_tokens": 61603840} +{"current_steps": 7530, "total_steps": 8739, "loss": 1.0984, "learning_rate": 2.950921977172155e-06, "epoch": 0.8616546515619636, "percentage": 86.17, "elapsed_time": "10:46:41", "remaining_time": "1:43:49", "throughput": 1589.79, "total_tokens": 61685760} +{"current_steps": 7540, "total_steps": 8739, "loss": 1.1865, "learning_rate": 2.9032716813609723e-06, "epoch": 0.8627989472479689, "percentage": 86.28, "elapsed_time": "10:47:36", "remaining_time": "1:42:58", "throughput": 1589.64, "total_tokens": 61767680} +{"current_steps": 7550, "total_steps": 8739, "loss": 1.1777, "learning_rate": 2.8559855163635544e-06, "epoch": 0.8639432429339742, "percentage": 86.39, "elapsed_time": "10:48:37", "remaining_time": "1:42:08", "throughput": 1589.25, "total_tokens": 61849600} +{"current_steps": 7560, "total_steps": 8739, "loss": 1.5473, "learning_rate": 2.809064261406111e-06, "epoch": 0.8650875386199794, "percentage": 86.51, "elapsed_time": "10:49:25", "remaining_time": "1:41:16", "throughput": 1589.39, "total_tokens": 61931520} +{"current_steps": 7570, "total_steps": 8739, "loss": 1.1929, "learning_rate": 2.762508689701504e-06, "epoch": 0.8662318343059847, "percentage": 86.62, "elapsed_time": "10:50:16", "remaining_time": "1:40:25", "throughput": 1589.41, "total_tokens": 62013440} +{"current_steps": 7580, "total_steps": 8739, "loss": 1.0352, "learning_rate": 2.716319568436529e-06, "epoch": 0.8673761299919899, "percentage": 86.74, "elapsed_time": "10:51:03", "remaining_time": "1:39:32", "throughput": 1589.61, "total_tokens": 62095360} +{"current_steps": 7590, "total_steps": 8739, "loss": 1.0181, "learning_rate": 2.6704976587592688e-06, "epoch": 0.8685204256779951, "percentage": 86.85, "elapsed_time": "10:51:50", "remaining_time": "1:38:40", "throughput": 1589.77, "total_tokens": 62177280} +{"current_steps": 7600, "total_steps": 8739, "loss": 1.2663, "learning_rate": 2.6250437157665455e-06, "epoch": 0.8696647213640004, "percentage": 86.97, "elapsed_time": "10:52:39", "remaining_time": "1:37:48", "throughput": 1589.89, "total_tokens": 62259200} +{"current_steps": 7610, "total_steps": 8739, "loss": 1.0863, "learning_rate": 2.5799584884914685e-06, "epoch": 0.8708090170500057, "percentage": 87.08, "elapsed_time": "10:53:27", "remaining_time": "1:36:56", "throughput": 1590.01, "total_tokens": 62341120} +{"current_steps": 7620, "total_steps": 8739, "loss": 1.1277, "learning_rate": 2.535242719891112e-06, "epoch": 0.871953312736011, "percentage": 87.2, "elapsed_time": "10:54:14", "remaining_time": "1:36:04", "throughput": 1590.2, "total_tokens": 62423040} +{"current_steps": 7630, "total_steps": 8739, "loss": 1.067, "learning_rate": 2.4908971468342535e-06, "epoch": 0.8730976084220162, "percentage": 87.31, "elapsed_time": "10:55:03", "remaining_time": "1:35:12", "throughput": 1590.34, "total_tokens": 62504960} +{"current_steps": 7640, "total_steps": 8739, "loss": 1.2818, "learning_rate": 2.44692250008923e-06, "epoch": 0.8742419041080215, "percentage": 87.42, "elapsed_time": "10:55:50", "remaining_time": "1:34:20", "throughput": 1590.51, "total_tokens": 62586880} +{"current_steps": 7650, "total_steps": 8739, "loss": 1.1506, "learning_rate": 2.403319504311921e-06, "epoch": 0.8753861997940268, "percentage": 87.54, "elapsed_time": "10:56:37", "remaining_time": "1:33:28", "throughput": 1590.69, "total_tokens": 62668800} +{"current_steps": 7660, "total_steps": 8739, "loss": 1.5572, "learning_rate": 2.360088878033778e-06, "epoch": 0.876530495480032, "percentage": 87.65, "elapsed_time": "10:57:25", "remaining_time": "1:32:36", "throughput": 1590.82, "total_tokens": 62750720} +{"current_steps": 7670, "total_steps": 8739, "loss": 1.2879, "learning_rate": 2.317231333650005e-06, "epoch": 0.8776747911660373, "percentage": 87.77, "elapsed_time": "10:58:13", "remaining_time": "1:31:44", "throughput": 1590.94, "total_tokens": 62832640} +{"current_steps": 7680, "total_steps": 8739, "loss": 1.1017, "learning_rate": 2.2747475774077986e-06, "epoch": 0.8788190868520426, "percentage": 87.88, "elapsed_time": "10:59:01", "remaining_time": "1:30:52", "throughput": 1591.11, "total_tokens": 62914560} +{"current_steps": 7690, "total_steps": 8739, "loss": 1.2244, "learning_rate": 2.2326383093947135e-06, "epoch": 0.8799633825380478, "percentage": 88.0, "elapsed_time": "10:59:50", "remaining_time": "1:30:00", "throughput": 1591.19, "total_tokens": 62996480} +{"current_steps": 7700, "total_steps": 8739, "loss": 1.3507, "learning_rate": 2.1909042235271597e-06, "epoch": 0.8811076782240531, "percentage": 88.11, "elapsed_time": "11:00:43", "remaining_time": "1:29:09", "throughput": 1591.13, "total_tokens": 63078400} +{"current_steps": 7710, "total_steps": 8739, "loss": 1.0351, "learning_rate": 2.1495460075389133e-06, "epoch": 0.8822519739100584, "percentage": 88.23, "elapsed_time": "11:01:31", "remaining_time": "1:28:17", "throughput": 1591.26, "total_tokens": 63160320} +{"current_steps": 7720, "total_steps": 8739, "loss": 1.1214, "learning_rate": 2.1085643429698236e-06, "epoch": 0.8833962695960637, "percentage": 88.34, "elapsed_time": "11:02:23", "remaining_time": "1:27:25", "throughput": 1591.25, "total_tokens": 63242240} +{"current_steps": 7730, "total_steps": 8739, "loss": 1.1543, "learning_rate": 2.067959905154568e-06, "epoch": 0.8845405652820689, "percentage": 88.45, "elapsed_time": "11:03:13", "remaining_time": "1:26:34", "throughput": 1591.33, "total_tokens": 63324160} +{"current_steps": 7740, "total_steps": 8739, "loss": 0.9881, "learning_rate": 2.0277333632115288e-06, "epoch": 0.8856848609680742, "percentage": 88.57, "elapsed_time": "11:04:04", "remaining_time": "1:25:42", "throughput": 1591.33, "total_tokens": 63406080} +{"current_steps": 7750, "total_steps": 8739, "loss": 1.4237, "learning_rate": 1.9878853800317535e-06, "epoch": 0.8868291566540795, "percentage": 88.68, "elapsed_time": "11:04:55", "remaining_time": "1:24:51", "throughput": 1591.37, "total_tokens": 63488000} +{"current_steps": 7760, "total_steps": 8739, "loss": 1.1573, "learning_rate": 1.948416612268034e-06, "epoch": 0.8879734523400846, "percentage": 88.8, "elapsed_time": "11:05:53", "remaining_time": "1:24:00", "throughput": 1591.09, "total_tokens": 63569920} +{"current_steps": 7770, "total_steps": 8739, "loss": 1.303, "learning_rate": 1.909327710324116e-06, "epoch": 0.8891177480260899, "percentage": 88.91, "elapsed_time": "11:06:56", "remaining_time": "1:23:10", "throughput": 1590.64, "total_tokens": 63651840} +{"current_steps": 7780, "total_steps": 8739, "loss": 1.2495, "learning_rate": 1.8706193183439247e-06, "epoch": 0.8902620437120952, "percentage": 89.03, "elapsed_time": "11:07:51", "remaining_time": "1:22:19", "throughput": 1590.49, "total_tokens": 63733760} +{"current_steps": 7790, "total_steps": 8739, "loss": 1.1877, "learning_rate": 1.8322920742010086e-06, "epoch": 0.8914063393981004, "percentage": 89.14, "elapsed_time": "11:08:48", "remaining_time": "1:21:28", "throughput": 1590.27, "total_tokens": 63815680} +{"current_steps": 7800, "total_steps": 8739, "loss": 1.1676, "learning_rate": 1.7943466094879902e-06, "epoch": 0.8925506350841057, "percentage": 89.26, "elapsed_time": "11:09:44", "remaining_time": "1:20:37", "throughput": 1590.12, "total_tokens": 63897600} +{"current_steps": 7810, "total_steps": 8739, "loss": 1.1575, "learning_rate": 1.7567835495061718e-06, "epoch": 0.893694930770111, "percentage": 89.37, "elapsed_time": "11:11:19", "remaining_time": "1:19:51", "throughput": 1588.4, "total_tokens": 63979520} +{"current_steps": 7820, "total_steps": 8739, "loss": 1.0517, "learning_rate": 1.7196035132552135e-06, "epoch": 0.8948392264561162, "percentage": 89.48, "elapsed_time": "11:12:24", "remaining_time": "1:19:01", "throughput": 1587.86, "total_tokens": 64061440} +{"current_steps": 7830, "total_steps": 8739, "loss": 1.4192, "learning_rate": 1.682807113422971e-06, "epoch": 0.8959835221421215, "percentage": 89.6, "elapsed_time": "11:13:24", "remaining_time": "1:18:10", "throughput": 1587.52, "total_tokens": 64143360} +{"current_steps": 7840, "total_steps": 8739, "loss": 1.5286, "learning_rate": 1.646394956375369e-06, "epoch": 0.8971278178281268, "percentage": 89.71, "elapsed_time": "11:14:15", "remaining_time": "1:17:18", "throughput": 1587.57, "total_tokens": 64225280} +{"current_steps": 7850, "total_steps": 8739, "loss": 0.9688, "learning_rate": 1.6103676421463986e-06, "epoch": 0.898272113514132, "percentage": 89.83, "elapsed_time": "11:15:17", "remaining_time": "1:16:28", "throughput": 1587.16, "total_tokens": 64307200} +{"current_steps": 7860, "total_steps": 8739, "loss": 1.1801, "learning_rate": 1.5747257644282726e-06, "epoch": 0.8994164092001373, "percentage": 89.94, "elapsed_time": "11:16:16", "remaining_time": "1:15:37", "throughput": 1586.85, "total_tokens": 64389120} +{"current_steps": 7870, "total_steps": 8739, "loss": 1.0305, "learning_rate": 1.5394699105616002e-06, "epoch": 0.9005607048861426, "percentage": 90.06, "elapsed_time": "11:17:05", "remaining_time": "1:14:45", "throughput": 1586.96, "total_tokens": 64471040} +{"current_steps": 7880, "total_steps": 8739, "loss": 1.1399, "learning_rate": 1.504600661525718e-06, "epoch": 0.9017050005721479, "percentage": 90.17, "elapsed_time": "11:17:55", "remaining_time": "1:13:54", "throughput": 1587.01, "total_tokens": 64552960} +{"current_steps": 7890, "total_steps": 8739, "loss": 1.4673, "learning_rate": 1.4701185919291372e-06, "epoch": 0.9028492962581531, "percentage": 90.28, "elapsed_time": "11:18:44", "remaining_time": "1:13:02", "throughput": 1587.12, "total_tokens": 64634880} +{"current_steps": 7900, "total_steps": 8739, "loss": 1.0752, "learning_rate": 1.436024270000058e-06, "epoch": 0.9039935919441584, "percentage": 90.4, "elapsed_time": "11:19:33", "remaining_time": "1:12:10", "throughput": 1587.22, "total_tokens": 64716800} +{"current_steps": 7910, "total_steps": 8739, "loss": 1.1824, "learning_rate": 1.4023182575769956e-06, "epoch": 0.9051378876301637, "percentage": 90.51, "elapsed_time": "11:20:24", "remaining_time": "1:11:18", "throughput": 1587.23, "total_tokens": 64798720} +{"current_steps": 7920, "total_steps": 8739, "loss": 1.0409, "learning_rate": 1.3690011100995437e-06, "epoch": 0.9062821833161689, "percentage": 90.63, "elapsed_time": "11:21:22", "remaining_time": "1:10:27", "throughput": 1586.99, "total_tokens": 64880640} +{"current_steps": 7930, "total_steps": 8739, "loss": 1.2628, "learning_rate": 1.3360733765992116e-06, "epoch": 0.9074264790021742, "percentage": 90.74, "elapsed_time": "11:22:15", "remaining_time": "1:09:36", "throughput": 1586.95, "total_tokens": 64962560} +{"current_steps": 7940, "total_steps": 8739, "loss": 1.307, "learning_rate": 1.3035355996903697e-06, "epoch": 0.9085707746881794, "percentage": 90.86, "elapsed_time": "11:23:10", "remaining_time": "1:08:44", "throughput": 1586.82, "total_tokens": 65044480} +{"current_steps": 7950, "total_steps": 8739, "loss": 1.061, "learning_rate": 1.2713883155613144e-06, "epoch": 0.9097150703741846, "percentage": 90.97, "elapsed_time": "11:24:02", "remaining_time": "1:07:53", "throughput": 1586.81, "total_tokens": 65126400} +{"current_steps": 7960, "total_steps": 8739, "loss": 1.178, "learning_rate": 1.2396320539654366e-06, "epoch": 0.9108593660601899, "percentage": 91.09, "elapsed_time": "11:24:50", "remaining_time": "1:07:01", "throughput": 1586.94, "total_tokens": 65208320} +{"current_steps": 7970, "total_steps": 8739, "loss": 1.3368, "learning_rate": 1.208267338212493e-06, "epoch": 0.9120036617461952, "percentage": 91.2, "elapsed_time": "11:25:42", "remaining_time": "1:06:09", "throughput": 1586.94, "total_tokens": 65290240} +{"current_steps": 7980, "total_steps": 8739, "loss": 1.3091, "learning_rate": 1.177294685159963e-06, "epoch": 0.9131479574322005, "percentage": 91.31, "elapsed_time": "11:26:33", "remaining_time": "1:05:18", "throughput": 1586.94, "total_tokens": 65372160} +{"current_steps": 7990, "total_steps": 8739, "loss": 1.2932, "learning_rate": 1.1467146052045603e-06, "epoch": 0.9142922531182057, "percentage": 91.43, "elapsed_time": "11:27:22", "remaining_time": "1:04:26", "throughput": 1587.05, "total_tokens": 65454080} +{"current_steps": 8000, "total_steps": 8739, "loss": 1.1777, "learning_rate": 1.1165276022737926e-06, "epoch": 0.915436548804211, "percentage": 91.54, "elapsed_time": "11:28:19", "remaining_time": "1:03:35", "throughput": 1586.85, "total_tokens": 65536000} +{"current_steps": 8010, "total_steps": 8739, "loss": 1.3184, "learning_rate": 1.0867341738176857e-06, "epoch": 0.9165808444902163, "percentage": 91.66, "elapsed_time": "11:29:20", "remaining_time": "1:02:44", "throughput": 1586.47, "total_tokens": 65617920} +{"current_steps": 8020, "total_steps": 8739, "loss": 1.2283, "learning_rate": 1.0573348108005614e-06, "epoch": 0.9177251401762215, "percentage": 91.77, "elapsed_time": "11:30:09", "remaining_time": "1:01:52", "throughput": 1586.57, "total_tokens": 65699840} +{"current_steps": 8030, "total_steps": 8739, "loss": 1.4513, "learning_rate": 1.0283299976929672e-06, "epoch": 0.9188694358622268, "percentage": 91.89, "elapsed_time": "11:30:59", "remaining_time": "1:01:00", "throughput": 1586.65, "total_tokens": 65781760} +{"current_steps": 8040, "total_steps": 8739, "loss": 1.2401, "learning_rate": 9.997202124636785e-07, "epoch": 0.9200137315482321, "percentage": 92.0, "elapsed_time": "11:31:48", "remaining_time": "1:00:08", "throughput": 1586.74, "total_tokens": 65863680} +{"current_steps": 8050, "total_steps": 8739, "loss": 1.0646, "learning_rate": 9.715059265718335e-07, "epoch": 0.9211580272342373, "percentage": 92.12, "elapsed_time": "11:32:37", "remaining_time": "0:59:16", "throughput": 1586.83, "total_tokens": 65945600} +{"current_steps": 8060, "total_steps": 8739, "loss": 1.4221, "learning_rate": 9.436876049591398e-07, "epoch": 0.9223023229202426, "percentage": 92.23, "elapsed_time": "11:33:27", "remaining_time": "0:58:25", "throughput": 1586.92, "total_tokens": 66027520} +{"current_steps": 8070, "total_steps": 8739, "loss": 1.2108, "learning_rate": 9.162657060422574e-07, "epoch": 0.9234466186062479, "percentage": 92.34, "elapsed_time": "11:34:16", "remaining_time": "0:57:33", "throughput": 1587.02, "total_tokens": 66109440} +{"current_steps": 8080, "total_steps": 8739, "loss": 1.4522, "learning_rate": 8.892406817051946e-07, "epoch": 0.9245909142922532, "percentage": 92.46, "elapsed_time": "11:35:05", "remaining_time": "0:56:41", "throughput": 1587.11, "total_tokens": 66191360} +{"current_steps": 8090, "total_steps": 8739, "loss": 1.2966, "learning_rate": 8.626129772918962e-07, "epoch": 0.9257352099782584, "percentage": 92.57, "elapsed_time": "11:35:54", "remaining_time": "0:55:49", "throughput": 1587.21, "total_tokens": 66273280} +{"current_steps": 8100, "total_steps": 8739, "loss": 1.2018, "learning_rate": 8.363830315988947e-07, "epoch": 0.9268795056642637, "percentage": 92.69, "elapsed_time": "11:36:44", "remaining_time": "0:54:57", "throughput": 1587.29, "total_tokens": 66355200} +{"current_steps": 8110, "total_steps": 8739, "loss": 1.1427, "learning_rate": 8.105512768680712e-07, "epoch": 0.928023801350269, "percentage": 92.8, "elapsed_time": "11:37:34", "remaining_time": "0:54:06", "throughput": 1587.35, "total_tokens": 66437120} +{"current_steps": 8120, "total_steps": 8739, "loss": 1.1591, "learning_rate": 7.851181387795392e-07, "epoch": 0.9291680970362741, "percentage": 92.92, "elapsed_time": "11:38:22", "remaining_time": "0:53:14", "throughput": 1587.45, "total_tokens": 66519040} +{"current_steps": 8130, "total_steps": 8739, "loss": 1.4109, "learning_rate": 7.600840364446333e-07, "epoch": 0.9303123927222794, "percentage": 93.03, "elapsed_time": "11:39:12", "remaining_time": "0:52:22", "throughput": 1587.55, "total_tokens": 66600960} +{"current_steps": 8140, "total_steps": 8739, "loss": 1.4194, "learning_rate": 7.354493823990006e-07, "epoch": 0.9314566884082847, "percentage": 93.15, "elapsed_time": "11:40:01", "remaining_time": "0:51:30", "throughput": 1587.64, "total_tokens": 66682880} +{"current_steps": 8150, "total_steps": 8739, "loss": 1.1635, "learning_rate": 7.112145825957927e-07, "epoch": 0.9326009840942899, "percentage": 93.26, "elapsed_time": "11:40:50", "remaining_time": "0:50:38", "throughput": 1587.73, "total_tokens": 66764800} +{"current_steps": 8160, "total_steps": 8739, "loss": 1.2245, "learning_rate": 6.873800363989935e-07, "epoch": 0.9337452797802952, "percentage": 93.37, "elapsed_time": "11:41:39", "remaining_time": "0:49:47", "throughput": 1587.82, "total_tokens": 66846720} +{"current_steps": 8170, "total_steps": 8739, "loss": 1.4055, "learning_rate": 6.63946136576829e-07, "epoch": 0.9348895754663005, "percentage": 93.49, "elapsed_time": "11:42:29", "remaining_time": "0:48:55", "throughput": 1587.9, "total_tokens": 66928640} +{"current_steps": 8180, "total_steps": 8739, "loss": 1.134, "learning_rate": 6.409132692952874e-07, "epoch": 0.9360338711523057, "percentage": 93.6, "elapsed_time": "11:43:18", "remaining_time": "0:48:03", "throughput": 1588.0, "total_tokens": 67010560} +{"current_steps": 8190, "total_steps": 8739, "loss": 1.1915, "learning_rate": 6.182818141117625e-07, "epoch": 0.937178166838311, "percentage": 93.72, "elapsed_time": "11:44:05", "remaining_time": "0:47:11", "throughput": 1588.17, "total_tokens": 67092480} +{"current_steps": 8200, "total_steps": 8739, "loss": 1.0641, "learning_rate": 5.960521439688088e-07, "epoch": 0.9383224625243163, "percentage": 93.83, "elapsed_time": "11:44:52", "remaining_time": "0:46:19", "throughput": 1588.33, "total_tokens": 67174400} +{"current_steps": 8210, "total_steps": 8739, "loss": 1.1629, "learning_rate": 5.742246251879829e-07, "epoch": 0.9394667582103216, "percentage": 93.95, "elapsed_time": "11:45:38", "remaining_time": "0:45:28", "throughput": 1588.53, "total_tokens": 67256320} +{"current_steps": 8220, "total_steps": 8739, "loss": 1.1297, "learning_rate": 5.527996174638061e-07, "epoch": 0.9406110538963268, "percentage": 94.06, "elapsed_time": "11:46:24", "remaining_time": "0:44:36", "throughput": 1588.75, "total_tokens": 67338240} +{"current_steps": 8230, "total_steps": 8739, "loss": 1.269, "learning_rate": 5.317774738578446e-07, "epoch": 0.9417553495823321, "percentage": 94.18, "elapsed_time": "11:47:12", "remaining_time": "0:43:44", "throughput": 1588.88, "total_tokens": 67420160} +{"current_steps": 8240, "total_steps": 8739, "loss": 1.0976, "learning_rate": 5.111585407928887e-07, "epoch": 0.9428996452683374, "percentage": 94.29, "elapsed_time": "11:48:09", "remaining_time": "0:42:53", "throughput": 1588.68, "total_tokens": 67502080} +{"current_steps": 8250, "total_steps": 8739, "loss": 1.2052, "learning_rate": 4.909431580472385e-07, "epoch": 0.9440439409543426, "percentage": 94.4, "elapsed_time": "11:48:57", "remaining_time": "0:42:01", "throughput": 1588.82, "total_tokens": 67584000} +{"current_steps": 8260, "total_steps": 8739, "loss": 1.1078, "learning_rate": 4.711316587491188e-07, "epoch": 0.9451882366403479, "percentage": 94.52, "elapsed_time": "11:49:45", "remaining_time": "0:41:09", "throughput": 1588.93, "total_tokens": 67665920} +{"current_steps": 8270, "total_steps": 8739, "loss": 1.2543, "learning_rate": 4.5172436937117036e-07, "epoch": 0.9463325323263532, "percentage": 94.63, "elapsed_time": "11:50:33", "remaining_time": "0:40:17", "throughput": 1589.08, "total_tokens": 67747840} +{"current_steps": 8280, "total_steps": 8739, "loss": 1.1164, "learning_rate": 4.3272160972509524e-07, "epoch": 0.9474768280123584, "percentage": 94.75, "elapsed_time": "11:51:22", "remaining_time": "0:39:26", "throughput": 1589.18, "total_tokens": 67829760} +{"current_steps": 8290, "total_steps": 8739, "loss": 1.1804, "learning_rate": 4.1412369295635023e-07, "epoch": 0.9486211236983637, "percentage": 94.86, "elapsed_time": "11:52:13", "remaining_time": "0:38:34", "throughput": 1589.19, "total_tokens": 67911680} +{"current_steps": 8300, "total_steps": 8739, "loss": 1.1059, "learning_rate": 3.9593092553902587e-07, "epoch": 0.9497654193843689, "percentage": 94.98, "elapsed_time": "11:53:05", "remaining_time": "0:37:42", "throughput": 1589.17, "total_tokens": 67993600} +{"current_steps": 8310, "total_steps": 8739, "loss": 1.1965, "learning_rate": 3.7814360727076724e-07, "epoch": 0.9509097150703741, "percentage": 95.09, "elapsed_time": "11:53:58", "remaining_time": "0:36:51", "throughput": 1589.14, "total_tokens": 68075520} +{"current_steps": 8320, "total_steps": 8739, "loss": 1.3606, "learning_rate": 3.607620312678528e-07, "epoch": 0.9520540107563794, "percentage": 95.21, "elapsed_time": "11:55:09", "remaining_time": "0:36:00", "throughput": 1588.42, "total_tokens": 68157440} +{"current_steps": 8330, "total_steps": 8739, "loss": 1.0969, "learning_rate": 3.437864839603455e-07, "epoch": 0.9531983064423847, "percentage": 95.32, "elapsed_time": "11:56:26", "remaining_time": "0:35:10", "throughput": 1587.45, "total_tokens": 68239360} +{"current_steps": 8340, "total_steps": 8739, "loss": 1.6294, "learning_rate": 3.272172450873967e-07, "epoch": 0.95434260212839, "percentage": 95.43, "elapsed_time": "11:57:17", "remaining_time": "0:34:18", "throughput": 1587.48, "total_tokens": 68321280} +{"current_steps": 8350, "total_steps": 8739, "loss": 1.0976, "learning_rate": 3.11054587692608e-07, "epoch": 0.9554868978143952, "percentage": 95.55, "elapsed_time": "11:58:08", "remaining_time": "0:33:27", "throughput": 1587.5, "total_tokens": 68403200} +{"current_steps": 8360, "total_steps": 8739, "loss": 1.1881, "learning_rate": 2.952987781195599e-07, "epoch": 0.9566311935004005, "percentage": 95.66, "elapsed_time": "11:58:57", "remaining_time": "0:32:35", "throughput": 1587.61, "total_tokens": 68485120} +{"current_steps": 8370, "total_steps": 8739, "loss": 1.1826, "learning_rate": 2.799500760073931e-07, "epoch": 0.9577754891864058, "percentage": 95.78, "elapsed_time": "11:59:45", "remaining_time": "0:31:43", "throughput": 1587.74, "total_tokens": 68567040} +{"current_steps": 8380, "total_steps": 8739, "loss": 1.1567, "learning_rate": 2.6500873428656483e-07, "epoch": 0.958919784872411, "percentage": 95.89, "elapsed_time": "12:00:33", "remaining_time": "0:30:52", "throughput": 1587.86, "total_tokens": 68648960} +{"current_steps": 8390, "total_steps": 8739, "loss": 0.9999, "learning_rate": 2.5047499917464636e-07, "epoch": 0.9600640805584163, "percentage": 96.01, "elapsed_time": "12:01:22", "remaining_time": "0:30:00", "throughput": 1587.97, "total_tokens": 68730880} +{"current_steps": 8400, "total_steps": 8739, "loss": 1.347, "learning_rate": 2.3634911017229034e-07, "epoch": 0.9612083762444216, "percentage": 96.12, "elapsed_time": "12:02:11", "remaining_time": "0:29:08", "throughput": 1588.07, "total_tokens": 68812800} +{"current_steps": 8410, "total_steps": 8739, "loss": 1.0357, "learning_rate": 2.2263130005927558e-07, "epoch": 0.9623526719304268, "percentage": 96.24, "elapsed_time": "12:03:00", "remaining_time": "0:28:17", "throughput": 1588.16, "total_tokens": 68894720} +{"current_steps": 8420, "total_steps": 8739, "loss": 1.3101, "learning_rate": 2.0932179489066006e-07, "epoch": 0.9634969676164321, "percentage": 96.35, "elapsed_time": "12:03:49", "remaining_time": "0:27:25", "throughput": 1588.24, "total_tokens": 68976640} +{"current_steps": 8430, "total_steps": 8739, "loss": 1.4347, "learning_rate": 1.9642081399307844e-07, "epoch": 0.9646412633024374, "percentage": 96.46, "elapsed_time": "12:04:37", "remaining_time": "0:26:33", "throughput": 1588.36, "total_tokens": 69058560} +{"current_steps": 8440, "total_steps": 8739, "loss": 0.9711, "learning_rate": 1.8392856996110875e-07, "epoch": 0.9657855589884426, "percentage": 96.58, "elapsed_time": "12:05:25", "remaining_time": "0:25:41", "throughput": 1588.5, "total_tokens": 69140480} +{"current_steps": 8450, "total_steps": 8739, "loss": 1.1246, "learning_rate": 1.7184526865377805e-07, "epoch": 0.9669298546744479, "percentage": 96.69, "elapsed_time": "12:06:14", "remaining_time": "0:24:50", "throughput": 1588.62, "total_tokens": 69222400} +{"current_steps": 8460, "total_steps": 8739, "loss": 1.182, "learning_rate": 1.6017110919116786e-07, "epoch": 0.9680741503604532, "percentage": 96.81, "elapsed_time": "12:07:01", "remaining_time": "0:23:58", "throughput": 1588.76, "total_tokens": 69304320} +{"current_steps": 8470, "total_steps": 8739, "loss": 1.2913, "learning_rate": 1.4890628395113072e-07, "epoch": 0.9692184460464585, "percentage": 96.92, "elapsed_time": "12:07:49", "remaining_time": "0:23:06", "throughput": 1588.9, "total_tokens": 69386240} +{"current_steps": 8480, "total_steps": 8739, "loss": 1.1669, "learning_rate": 1.380509785661288e-07, "epoch": 0.9703627417324636, "percentage": 97.04, "elapsed_time": "12:08:37", "remaining_time": "0:22:15", "throughput": 1589.02, "total_tokens": 69468160} +{"current_steps": 8490, "total_steps": 8739, "loss": 1.2136, "learning_rate": 1.2760537192015866e-07, "epoch": 0.9715070374184689, "percentage": 97.15, "elapsed_time": "12:09:26", "remaining_time": "0:21:23", "throughput": 1589.13, "total_tokens": 69550080} +{"current_steps": 8500, "total_steps": 8739, "loss": 1.4041, "learning_rate": 1.1756963614582006e-07, "epoch": 0.9726513331044742, "percentage": 97.27, "elapsed_time": "12:10:14", "remaining_time": "0:20:31", "throughput": 1589.23, "total_tokens": 69632000} +{"current_steps": 8510, "total_steps": 8739, "loss": 1.4145, "learning_rate": 1.0794393662147129e-07, "epoch": 0.9737956287904794, "percentage": 97.38, "elapsed_time": "12:11:02", "remaining_time": "0:19:40", "throughput": 1589.36, "total_tokens": 69713920} +{"current_steps": 8520, "total_steps": 8739, "loss": 1.1534, "learning_rate": 9.872843196850057e-08, "epoch": 0.9749399244764847, "percentage": 97.49, "elapsed_time": "12:11:49", "remaining_time": "0:18:48", "throughput": 1589.53, "total_tokens": 69795840} +{"current_steps": 8530, "total_steps": 8739, "loss": 1.1406, "learning_rate": 8.992327404872825e-08, "epoch": 0.97608422016249, "percentage": 97.61, "elapsed_time": "12:12:35", "remaining_time": "0:17:56", "throughput": 1589.72, "total_tokens": 69877760} +{"current_steps": 8540, "total_steps": 8739, "loss": 1.4171, "learning_rate": 8.152860796187545e-08, "epoch": 0.9772285158484952, "percentage": 97.72, "elapsed_time": "12:13:22", "remaining_time": "0:17:05", "throughput": 1589.91, "total_tokens": 69959680} +{"current_steps": 8550, "total_steps": 8739, "loss": 1.2596, "learning_rate": 7.354457204320486e-08, "epoch": 0.9783728115345005, "percentage": 97.84, "elapsed_time": "12:14:09", "remaining_time": "0:16:13", "throughput": 1590.06, "total_tokens": 70041600} +{"current_steps": 8560, "total_steps": 8739, "loss": 1.4422, "learning_rate": 6.59712978612198e-08, "epoch": 0.9795171072205058, "percentage": 97.95, "elapsed_time": "12:14:56", "remaining_time": "0:15:22", "throughput": 1590.21, "total_tokens": 70123520} +{"current_steps": 8570, "total_steps": 8739, "loss": 1.1456, "learning_rate": 5.880891021549928e-08, "epoch": 0.980661402906511, "percentage": 98.07, "elapsed_time": "12:15:44", "remaining_time": "0:14:30", "throughput": 1590.37, "total_tokens": 70205440} +{"current_steps": 8580, "total_steps": 8739, "loss": 1.235, "learning_rate": 5.205752713465794e-08, "epoch": 0.9818056985925163, "percentage": 98.18, "elapsed_time": "12:16:33", "remaining_time": "0:13:38", "throughput": 1590.43, "total_tokens": 70287360} +{"current_steps": 8590, "total_steps": 8739, "loss": 1.2076, "learning_rate": 4.57172598743727e-08, "epoch": 0.9829499942785216, "percentage": 98.29, "elapsed_time": "12:17:25", "remaining_time": "0:12:47", "throughput": 1590.44, "total_tokens": 70369280} +{"current_steps": 8600, "total_steps": 8739, "loss": 1.1558, "learning_rate": 3.9788212915573e-08, "epoch": 0.9840942899645269, "percentage": 98.41, "elapsed_time": "12:18:13", "remaining_time": "0:11:55", "throughput": 1590.54, "total_tokens": 70451200} +{"current_steps": 8610, "total_steps": 8739, "loss": 1.2666, "learning_rate": 3.427048396271171e-08, "epoch": 0.9852385856505321, "percentage": 98.52, "elapsed_time": "12:19:02", "remaining_time": "0:11:04", "throughput": 1590.64, "total_tokens": 70533120} +{"current_steps": 8620, "total_steps": 8739, "loss": 1.4532, "learning_rate": 2.9164163942146937e-08, "epoch": 0.9863828813365374, "percentage": 98.64, "elapsed_time": "12:19:54", "remaining_time": "0:10:12", "throughput": 1590.61, "total_tokens": 70615040} +{"current_steps": 8630, "total_steps": 8739, "loss": 1.4154, "learning_rate": 2.44693370006599e-08, "epoch": 0.9875271770225427, "percentage": 98.75, "elapsed_time": "12:20:45", "remaining_time": "0:09:21", "throughput": 1590.66, "total_tokens": 70696960} +{"current_steps": 8640, "total_steps": 8739, "loss": 1.062, "learning_rate": 2.0186080504050466e-08, "epoch": 0.9886714727085479, "percentage": 98.87, "elapsed_time": "12:21:33", "remaining_time": "0:08:29", "throughput": 1590.76, "total_tokens": 70778880} +{"current_steps": 8650, "total_steps": 8739, "loss": 1.0299, "learning_rate": 1.6314465035879855e-08, "epoch": 0.9898157683945531, "percentage": 98.98, "elapsed_time": "12:22:20", "remaining_time": "0:07:38", "throughput": 1590.92, "total_tokens": 70860800} +{"current_steps": 8660, "total_steps": 8739, "loss": 1.1402, "learning_rate": 1.2854554396291018e-08, "epoch": 0.9909600640805584, "percentage": 99.1, "elapsed_time": "12:23:12", "remaining_time": "0:06:46", "throughput": 1590.91, "total_tokens": 70942720} +{"current_steps": 8670, "total_steps": 8739, "loss": 1.3485, "learning_rate": 9.806405600967794e-09, "epoch": 0.9921043597665636, "percentage": 99.21, "elapsed_time": "12:24:02", "remaining_time": "0:05:55", "throughput": 1590.96, "total_tokens": 71024640} +{"current_steps": 8680, "total_steps": 8739, "loss": 1.26, "learning_rate": 7.1700688801940034e-09, "epoch": 0.9932486554525689, "percentage": 99.32, "elapsed_time": "12:24:53", "remaining_time": "0:05:03", "throughput": 1590.97, "total_tokens": 71106560} +{"current_steps": 8690, "total_steps": 8739, "loss": 1.1129, "learning_rate": 4.94558767802078e-09, "epoch": 0.9943929511385742, "percentage": 99.44, "elapsed_time": "12:25:41", "remaining_time": "0:04:12", "throughput": 1591.1, "total_tokens": 71188480} +{"current_steps": 8700, "total_steps": 8739, "loss": 1.2407, "learning_rate": 3.1329986515560295e-09, "epoch": 0.9955372468245794, "percentage": 99.55, "elapsed_time": "12:26:28", "remaining_time": "0:03:20", "throughput": 1591.28, "total_tokens": 71270400} +{"current_steps": 8710, "total_steps": 8739, "loss": 1.2159, "learning_rate": 1.7323316703621305e-09, "epoch": 0.9966815425105847, "percentage": 99.67, "elapsed_time": "12:27:13", "remaining_time": "0:02:29", "throughput": 1591.49, "total_tokens": 71352320} +{"current_steps": 8720, "total_steps": 8739, "loss": 1.0369, "learning_rate": 7.436098159480099e-10, "epoch": 0.99782583819659, "percentage": 99.78, "elapsed_time": "12:28:06", "remaining_time": "0:01:37", "throughput": 1591.45, "total_tokens": 71434240} +{"current_steps": 8730, "total_steps": 8739, "loss": 1.1446, "learning_rate": 1.6684938141664498e-10, "epoch": 0.9989701338825953, "percentage": 99.9, "elapsed_time": "12:28:56", "remaining_time": "0:00:46", "throughput": 1591.49, "total_tokens": 71516160} +{"current_steps": 8739, "total_steps": 8739, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "12:29:47", "remaining_time": "0:00:00", "throughput": 1591.34, "total_tokens": 71589888}