diff --git "a/Luminia-8B-RP/trainer_log.jsonl" "b/Luminia-8B-RP/trainer_log.jsonl" --- "a/Luminia-8B-RP/trainer_log.jsonl" +++ "b/Luminia-8B-RP/trainer_log.jsonl" @@ -1,2083 +1,2144 @@ -{"current_steps": 10, "total_steps": 20825, "loss": 1.3448, "learning_rate": 5.000000000000001e-07, "epoch": 0.0004801920768307323, "percentage": 0.05, "elapsed_time": "0:00:52", "remaining_time": "1 day, 6:24:33", "throughput": 1557.6, "total_tokens": 81920} -{"current_steps": 20, "total_steps": 20825, "loss": 1.3391, "learning_rate": 1.0000000000000002e-06, "epoch": 0.0009603841536614646, "percentage": 0.1, "elapsed_time": "0:01:39", "remaining_time": "1 day, 4:39:49", "throughput": 1651.66, "total_tokens": 163840} -{"current_steps": 30, "total_steps": 20825, "loss": 1.3258, "learning_rate": 1.5e-06, "epoch": 0.0014405762304921968, "percentage": 0.14, "elapsed_time": "0:02:25", "remaining_time": "1 day, 4:00:58", "throughput": 1689.03, "total_tokens": 245760} -{"current_steps": 40, "total_steps": 20825, "loss": 1.4027, "learning_rate": 2.0000000000000003e-06, "epoch": 0.0019207683073229293, "percentage": 0.19, "elapsed_time": "0:03:12", "remaining_time": "1 day, 3:44:40", "throughput": 1704.75, "total_tokens": 327680} -{"current_steps": 50, "total_steps": 20825, "loss": 1.1825, "learning_rate": 2.5e-06, "epoch": 0.0024009603841536613, "percentage": 0.24, "elapsed_time": "0:03:58", "remaining_time": "1 day, 3:34:20", "throughput": 1714.56, "total_tokens": 409600} -{"current_steps": 60, "total_steps": 20825, "loss": 1.0617, "learning_rate": 3e-06, "epoch": 0.0028811524609843936, "percentage": 0.29, "elapsed_time": "0:04:45", "remaining_time": "1 day, 3:29:10", "throughput": 1719.11, "total_tokens": 491520} -{"current_steps": 70, "total_steps": 20825, "loss": 1.2087, "learning_rate": 3.5000000000000004e-06, "epoch": 0.0033613445378151263, "percentage": 0.34, "elapsed_time": "0:05:33", "remaining_time": "1 day, 3:26:51", "throughput": 1720.7, "total_tokens": 573440} -{"current_steps": 80, "total_steps": 20825, "loss": 1.2009, "learning_rate": 4.000000000000001e-06, "epoch": 0.0038415366146458585, "percentage": 0.38, "elapsed_time": "0:06:20", "remaining_time": "1 day, 3:23:36", "throughput": 1723.27, "total_tokens": 655360} -{"current_steps": 90, "total_steps": 20825, "loss": 1.2692, "learning_rate": 4.5e-06, "epoch": 0.004321728691476591, "percentage": 0.43, "elapsed_time": "0:07:07", "remaining_time": "1 day, 3:20:35", "throughput": 1725.61, "total_tokens": 737280} -{"current_steps": 100, "total_steps": 20825, "loss": 1.187, "learning_rate": 5e-06, "epoch": 0.004801920768307323, "percentage": 0.48, "elapsed_time": "0:07:54", "remaining_time": "1 day, 3:18:56", "throughput": 1726.52, "total_tokens": 819200} -{"current_steps": 110, "total_steps": 20825, "loss": 1.21, "learning_rate": 5.500000000000001e-06, "epoch": 0.005282112845138055, "percentage": 0.53, "elapsed_time": "0:08:41", "remaining_time": "1 day, 3:16:51", "throughput": 1727.88, "total_tokens": 901120} -{"current_steps": 120, "total_steps": 20825, "loss": 1.4533, "learning_rate": 6e-06, "epoch": 0.005762304921968787, "percentage": 0.58, "elapsed_time": "0:09:28", "remaining_time": "1 day, 3:14:49", "throughput": 1729.18, "total_tokens": 983040} -{"current_steps": 130, "total_steps": 20825, "loss": 1.3365, "learning_rate": 6.5000000000000004e-06, "epoch": 0.00624249699879952, "percentage": 0.62, "elapsed_time": "0:10:15", "remaining_time": "1 day, 3:12:31", "throughput": 1730.79, "total_tokens": 1064960} -{"current_steps": 140, "total_steps": 20825, "loss": 1.0839, "learning_rate": 7.000000000000001e-06, "epoch": 0.0067226890756302525, "percentage": 0.67, "elapsed_time": "0:11:02", "remaining_time": "1 day, 3:10:46", "throughput": 1731.8, "total_tokens": 1146880} -{"current_steps": 150, "total_steps": 20825, "loss": 1.0646, "learning_rate": 7.5e-06, "epoch": 0.007202881152460984, "percentage": 0.72, "elapsed_time": "0:11:49", "remaining_time": "1 day, 3:09:26", "throughput": 1732.39, "total_tokens": 1228800} -{"current_steps": 160, "total_steps": 20825, "loss": 1.366, "learning_rate": 8.000000000000001e-06, "epoch": 0.007683073229291717, "percentage": 0.77, "elapsed_time": "0:12:36", "remaining_time": "1 day, 3:07:45", "throughput": 1733.34, "total_tokens": 1310720} -{"current_steps": 170, "total_steps": 20825, "loss": 1.2509, "learning_rate": 8.500000000000002e-06, "epoch": 0.00816326530612245, "percentage": 0.82, "elapsed_time": "0:13:23", "remaining_time": "1 day, 3:06:22", "throughput": 1733.98, "total_tokens": 1392640} -{"current_steps": 180, "total_steps": 20825, "loss": 1.0235, "learning_rate": 9e-06, "epoch": 0.008643457382953182, "percentage": 0.86, "elapsed_time": "0:14:10", "remaining_time": "1 day, 3:05:21", "throughput": 1734.23, "total_tokens": 1474560} -{"current_steps": 190, "total_steps": 20825, "loss": 0.9992, "learning_rate": 9.5e-06, "epoch": 0.009123649459783913, "percentage": 0.91, "elapsed_time": "0:14:57", "remaining_time": "1 day, 3:03:49", "throughput": 1735.02, "total_tokens": 1556480} -{"current_steps": 200, "total_steps": 20825, "loss": 0.8424, "learning_rate": 1e-05, "epoch": 0.009603841536614645, "percentage": 0.96, "elapsed_time": "0:15:44", "remaining_time": "1 day, 3:03:04", "throughput": 1734.97, "total_tokens": 1638400} -{"current_steps": 210, "total_steps": 20825, "loss": 1.0181, "learning_rate": 1.05e-05, "epoch": 0.010084033613445379, "percentage": 1.01, "elapsed_time": "0:16:31", "remaining_time": "1 day, 3:02:44", "throughput": 1734.49, "total_tokens": 1720320} -{"current_steps": 220, "total_steps": 20825, "loss": 0.8846, "learning_rate": 1.1000000000000001e-05, "epoch": 0.01056422569027611, "percentage": 1.06, "elapsed_time": "0:17:18", "remaining_time": "1 day, 3:01:51", "throughput": 1734.6, "total_tokens": 1802240} -{"current_steps": 230, "total_steps": 20825, "loss": 1.1465, "learning_rate": 1.1500000000000002e-05, "epoch": 0.011044417767106842, "percentage": 1.1, "elapsed_time": "0:18:05", "remaining_time": "1 day, 3:00:39", "throughput": 1735.04, "total_tokens": 1884160} -{"current_steps": 240, "total_steps": 20825, "loss": 1.0085, "learning_rate": 1.2e-05, "epoch": 0.011524609843937574, "percentage": 1.15, "elapsed_time": "0:18:52", "remaining_time": "1 day, 2:59:15", "throughput": 1735.69, "total_tokens": 1966080} -{"current_steps": 250, "total_steps": 20825, "loss": 1.0097, "learning_rate": 1.25e-05, "epoch": 0.012004801920768308, "percentage": 1.2, "elapsed_time": "0:19:39", "remaining_time": "1 day, 2:57:57", "throughput": 1736.24, "total_tokens": 2048000} -{"current_steps": 260, "total_steps": 20825, "loss": 0.968, "learning_rate": 1.3000000000000001e-05, "epoch": 0.01248499399759904, "percentage": 1.25, "elapsed_time": "0:20:26", "remaining_time": "1 day, 2:56:49", "throughput": 1736.62, "total_tokens": 2129920} -{"current_steps": 270, "total_steps": 20825, "loss": 1.1094, "learning_rate": 1.3500000000000001e-05, "epoch": 0.012965186074429771, "percentage": 1.3, "elapsed_time": "0:21:13", "remaining_time": "1 day, 2:55:37", "throughput": 1737.06, "total_tokens": 2211840} -{"current_steps": 280, "total_steps": 20825, "loss": 1.0791, "learning_rate": 1.4000000000000001e-05, "epoch": 0.013445378151260505, "percentage": 1.34, "elapsed_time": "0:22:00", "remaining_time": "1 day, 2:54:37", "throughput": 1737.3, "total_tokens": 2293760} -{"current_steps": 290, "total_steps": 20825, "loss": 1.0844, "learning_rate": 1.45e-05, "epoch": 0.013925570228091237, "percentage": 1.39, "elapsed_time": "0:22:47", "remaining_time": "1 day, 2:53:28", "throughput": 1737.69, "total_tokens": 2375680} -{"current_steps": 300, "total_steps": 20825, "loss": 1.0286, "learning_rate": 1.5e-05, "epoch": 0.014405762304921969, "percentage": 1.44, "elapsed_time": "0:23:33", "remaining_time": "1 day, 2:52:12", "throughput": 1738.2, "total_tokens": 2457600} -{"current_steps": 310, "total_steps": 20825, "loss": 1.1747, "learning_rate": 1.55e-05, "epoch": 0.0148859543817527, "percentage": 1.49, "elapsed_time": "0:24:20", "remaining_time": "1 day, 2:51:23", "throughput": 1738.24, "total_tokens": 2539520} -{"current_steps": 320, "total_steps": 20825, "loss": 1.1556, "learning_rate": 1.6000000000000003e-05, "epoch": 0.015366146458583434, "percentage": 1.54, "elapsed_time": "0:25:08", "remaining_time": "1 day, 2:50:38", "throughput": 1738.2, "total_tokens": 2621440} -{"current_steps": 330, "total_steps": 20825, "loss": 1.0936, "learning_rate": 1.65e-05, "epoch": 0.015846338535414166, "percentage": 1.58, "elapsed_time": "0:25:54", "remaining_time": "1 day, 2:49:27", "throughput": 1738.63, "total_tokens": 2703360} -{"current_steps": 340, "total_steps": 20825, "loss": 1.0638, "learning_rate": 1.7000000000000003e-05, "epoch": 0.0163265306122449, "percentage": 1.63, "elapsed_time": "0:26:42", "remaining_time": "1 day, 2:48:57", "throughput": 1738.33, "total_tokens": 2785280} -{"current_steps": 350, "total_steps": 20825, "loss": 1.171, "learning_rate": 1.75e-05, "epoch": 0.01680672268907563, "percentage": 1.68, "elapsed_time": "0:27:29", "remaining_time": "1 day, 2:48:08", "throughput": 1738.36, "total_tokens": 2867200} -{"current_steps": 360, "total_steps": 20825, "loss": 0.9427, "learning_rate": 1.8e-05, "epoch": 0.017286914765906363, "percentage": 1.73, "elapsed_time": "0:28:16", "remaining_time": "1 day, 2:47:07", "throughput": 1738.61, "total_tokens": 2949120} -{"current_steps": 370, "total_steps": 20825, "loss": 0.9715, "learning_rate": 1.85e-05, "epoch": 0.017767106842737093, "percentage": 1.78, "elapsed_time": "0:29:02", "remaining_time": "1 day, 2:45:57", "throughput": 1739.02, "total_tokens": 3031040} -{"current_steps": 380, "total_steps": 20825, "loss": 1.0749, "learning_rate": 1.9e-05, "epoch": 0.018247298919567827, "percentage": 1.82, "elapsed_time": "0:29:50", "remaining_time": "1 day, 2:45:13", "throughput": 1738.96, "total_tokens": 3112960} -{"current_steps": 390, "total_steps": 20825, "loss": 0.9876, "learning_rate": 1.9500000000000003e-05, "epoch": 0.01872749099639856, "percentage": 1.87, "elapsed_time": "0:30:37", "remaining_time": "1 day, 2:44:35", "throughput": 1738.8, "total_tokens": 3194880} -{"current_steps": 400, "total_steps": 20825, "loss": 1.105, "learning_rate": 2e-05, "epoch": 0.01920768307322929, "percentage": 1.92, "elapsed_time": "0:31:24", "remaining_time": "1 day, 2:43:49", "throughput": 1738.77, "total_tokens": 3276800} -{"current_steps": 410, "total_steps": 20825, "loss": 1.1199, "learning_rate": 2.05e-05, "epoch": 0.019687875150060024, "percentage": 1.97, "elapsed_time": "0:32:12", "remaining_time": "1 day, 2:43:23", "throughput": 1738.4, "total_tokens": 3358720} -{"current_steps": 420, "total_steps": 20825, "loss": 1.0458, "learning_rate": 2.1e-05, "epoch": 0.020168067226890758, "percentage": 2.02, "elapsed_time": "0:32:58", "remaining_time": "1 day, 2:42:15", "throughput": 1738.78, "total_tokens": 3440640} -{"current_steps": 430, "total_steps": 20825, "loss": 1.023, "learning_rate": 2.15e-05, "epoch": 0.020648259303721488, "percentage": 2.06, "elapsed_time": "0:33:46", "remaining_time": "1 day, 2:41:38", "throughput": 1738.59, "total_tokens": 3522560} -{"current_steps": 440, "total_steps": 20825, "loss": 1.1381, "learning_rate": 2.2000000000000003e-05, "epoch": 0.02112845138055222, "percentage": 2.11, "elapsed_time": "0:34:33", "remaining_time": "1 day, 2:41:08", "throughput": 1738.28, "total_tokens": 3604480} -{"current_steps": 450, "total_steps": 20825, "loss": 0.9443, "learning_rate": 2.25e-05, "epoch": 0.021608643457382955, "percentage": 2.16, "elapsed_time": "0:35:20", "remaining_time": "1 day, 2:40:26", "throughput": 1738.19, "total_tokens": 3686400} -{"current_steps": 460, "total_steps": 20825, "loss": 0.9857, "learning_rate": 2.3000000000000003e-05, "epoch": 0.022088835534213685, "percentage": 2.21, "elapsed_time": "0:36:07", "remaining_time": "1 day, 2:39:29", "throughput": 1738.37, "total_tokens": 3768320} -{"current_steps": 470, "total_steps": 20825, "loss": 1.2423, "learning_rate": 2.35e-05, "epoch": 0.02256902761104442, "percentage": 2.26, "elapsed_time": "0:36:54", "remaining_time": "1 day, 2:38:41", "throughput": 1738.38, "total_tokens": 3850240} -{"current_steps": 480, "total_steps": 20825, "loss": 1.0458, "learning_rate": 2.4e-05, "epoch": 0.02304921968787515, "percentage": 2.3, "elapsed_time": "0:37:41", "remaining_time": "1 day, 2:37:41", "throughput": 1738.62, "total_tokens": 3932160} -{"current_steps": 490, "total_steps": 20825, "loss": 1.0759, "learning_rate": 2.45e-05, "epoch": 0.023529411764705882, "percentage": 2.35, "elapsed_time": "0:38:28", "remaining_time": "1 day, 2:36:27", "throughput": 1739.1, "total_tokens": 4014080} -{"current_steps": 500, "total_steps": 20825, "loss": 1.0799, "learning_rate": 2.5e-05, "epoch": 0.024009603841536616, "percentage": 2.4, "elapsed_time": "0:39:15", "remaining_time": "1 day, 2:35:45", "throughput": 1739.01, "total_tokens": 4096000} -{"current_steps": 510, "total_steps": 20825, "loss": 1.0056, "learning_rate": 2.5500000000000003e-05, "epoch": 0.024489795918367346, "percentage": 2.45, "elapsed_time": "0:40:02", "remaining_time": "1 day, 2:34:44", "throughput": 1739.27, "total_tokens": 4177920} -{"current_steps": 520, "total_steps": 20825, "loss": 0.9158, "learning_rate": 2.6000000000000002e-05, "epoch": 0.02496998799519808, "percentage": 2.5, "elapsed_time": "0:40:49", "remaining_time": "1 day, 2:33:57", "throughput": 1739.26, "total_tokens": 4259840} -{"current_steps": 530, "total_steps": 20825, "loss": 1.0108, "learning_rate": 2.6500000000000004e-05, "epoch": 0.025450180072028813, "percentage": 2.55, "elapsed_time": "0:41:36", "remaining_time": "1 day, 2:33:09", "throughput": 1739.29, "total_tokens": 4341760} -{"current_steps": 540, "total_steps": 20825, "loss": 0.9604, "learning_rate": 2.7000000000000002e-05, "epoch": 0.025930372148859543, "percentage": 2.59, "elapsed_time": "0:42:23", "remaining_time": "1 day, 2:32:08", "throughput": 1739.53, "total_tokens": 4423680} -{"current_steps": 550, "total_steps": 20825, "loss": 1.0828, "learning_rate": 2.7500000000000004e-05, "epoch": 0.026410564225690276, "percentage": 2.64, "elapsed_time": "0:43:10", "remaining_time": "1 day, 2:31:33", "throughput": 1739.31, "total_tokens": 4505600} -{"current_steps": 560, "total_steps": 20825, "loss": 1.2004, "learning_rate": 2.8000000000000003e-05, "epoch": 0.02689075630252101, "percentage": 2.69, "elapsed_time": "0:43:57", "remaining_time": "1 day, 2:30:33", "throughput": 1739.54, "total_tokens": 4587520} -{"current_steps": 570, "total_steps": 20825, "loss": 1.0362, "learning_rate": 2.8499999999999998e-05, "epoch": 0.02737094837935174, "percentage": 2.74, "elapsed_time": "0:44:44", "remaining_time": "1 day, 2:29:43", "throughput": 1739.6, "total_tokens": 4669440} -{"current_steps": 580, "total_steps": 20825, "loss": 1.1366, "learning_rate": 2.9e-05, "epoch": 0.027851140456182474, "percentage": 2.79, "elapsed_time": "0:45:31", "remaining_time": "1 day, 2:28:51", "throughput": 1739.69, "total_tokens": 4751360} -{"current_steps": 590, "total_steps": 20825, "loss": 1.1366, "learning_rate": 2.95e-05, "epoch": 0.028331332533013204, "percentage": 2.83, "elapsed_time": "0:46:17", "remaining_time": "1 day, 2:27:55", "throughput": 1739.85, "total_tokens": 4833280} -{"current_steps": 600, "total_steps": 20825, "loss": 0.8576, "learning_rate": 3e-05, "epoch": 0.028811524609843937, "percentage": 2.88, "elapsed_time": "0:47:04", "remaining_time": "1 day, 2:27:03", "throughput": 1739.95, "total_tokens": 4915200} -{"current_steps": 610, "total_steps": 20825, "loss": 1.2392, "learning_rate": 3.05e-05, "epoch": 0.02929171668667467, "percentage": 2.93, "elapsed_time": "0:47:52", "remaining_time": "1 day, 2:26:26", "throughput": 1739.76, "total_tokens": 4997120} -{"current_steps": 620, "total_steps": 20825, "loss": 0.9339, "learning_rate": 3.1e-05, "epoch": 0.0297719087635054, "percentage": 2.98, "elapsed_time": "0:48:39", "remaining_time": "1 day, 2:25:28", "throughput": 1739.95, "total_tokens": 5079040} -{"current_steps": 630, "total_steps": 20825, "loss": 0.9704, "learning_rate": 3.15e-05, "epoch": 0.030252100840336135, "percentage": 3.03, "elapsed_time": "0:49:25", "remaining_time": "1 day, 2:24:31", "throughput": 1740.14, "total_tokens": 5160960} -{"current_steps": 640, "total_steps": 20825, "loss": 0.9718, "learning_rate": 3.2000000000000005e-05, "epoch": 0.030732292917166868, "percentage": 3.07, "elapsed_time": "0:50:12", "remaining_time": "1 day, 2:23:34", "throughput": 1740.32, "total_tokens": 5242880} -{"current_steps": 650, "total_steps": 20825, "loss": 0.9997, "learning_rate": 3.2500000000000004e-05, "epoch": 0.031212484993997598, "percentage": 3.12, "elapsed_time": "0:50:59", "remaining_time": "1 day, 2:22:42", "throughput": 1740.4, "total_tokens": 5324800} -{"current_steps": 660, "total_steps": 20825, "loss": 0.8748, "learning_rate": 3.3e-05, "epoch": 0.03169267707082833, "percentage": 3.17, "elapsed_time": "0:51:59", "remaining_time": "1 day, 2:28:25", "throughput": 1733.29, "total_tokens": 5406720} -{"current_steps": 670, "total_steps": 20825, "loss": 0.8658, "learning_rate": 3.35e-05, "epoch": 0.032172869147659065, "percentage": 3.22, "elapsed_time": "0:53:11", "remaining_time": "1 day, 2:39:54", "throughput": 1719.99, "total_tokens": 5488640} -{"current_steps": 680, "total_steps": 20825, "loss": 0.8799, "learning_rate": 3.4000000000000007e-05, "epoch": 0.0326530612244898, "percentage": 3.27, "elapsed_time": "0:54:04", "remaining_time": "1 day, 2:41:44", "throughput": 1717.17, "total_tokens": 5570560} -{"current_steps": 690, "total_steps": 20825, "loss": 1.0723, "learning_rate": 3.45e-05, "epoch": 0.033133253301320525, "percentage": 3.31, "elapsed_time": "0:54:52", "remaining_time": "1 day, 2:41:10", "throughput": 1716.93, "total_tokens": 5652480} -{"current_steps": 700, "total_steps": 20825, "loss": 1.0756, "learning_rate": 3.5e-05, "epoch": 0.03361344537815126, "percentage": 3.36, "elapsed_time": "0:55:38", "remaining_time": "1 day, 2:39:39", "throughput": 1717.69, "total_tokens": 5734400} -{"current_steps": 710, "total_steps": 20825, "loss": 0.967, "learning_rate": 3.55e-05, "epoch": 0.03409363745498199, "percentage": 3.41, "elapsed_time": "0:56:23", "remaining_time": "1 day, 2:37:47", "throughput": 1718.86, "total_tokens": 5816320} -{"current_steps": 720, "total_steps": 20825, "loss": 0.9767, "learning_rate": 3.6e-05, "epoch": 0.034573829531812726, "percentage": 3.46, "elapsed_time": "0:57:08", "remaining_time": "1 day, 2:35:30", "throughput": 1720.45, "total_tokens": 5898240} -{"current_steps": 730, "total_steps": 20825, "loss": 0.9352, "learning_rate": 3.65e-05, "epoch": 0.03505402160864346, "percentage": 3.51, "elapsed_time": "0:57:53", "remaining_time": "1 day, 2:33:23", "throughput": 1721.88, "total_tokens": 5980160} -{"current_steps": 740, "total_steps": 20825, "loss": 0.9214, "learning_rate": 3.7e-05, "epoch": 0.035534213685474186, "percentage": 3.55, "elapsed_time": "0:58:37", "remaining_time": "1 day, 2:31:19", "throughput": 1723.26, "total_tokens": 6062080} -{"current_steps": 750, "total_steps": 20825, "loss": 1.0334, "learning_rate": 3.7500000000000003e-05, "epoch": 0.03601440576230492, "percentage": 3.6, "elapsed_time": "0:59:22", "remaining_time": "1 day, 2:29:15", "throughput": 1724.65, "total_tokens": 6144000} -{"current_steps": 760, "total_steps": 20825, "loss": 1.0507, "learning_rate": 3.8e-05, "epoch": 0.036494597839135653, "percentage": 3.65, "elapsed_time": "1:00:07", "remaining_time": "1 day, 2:27:10", "throughput": 1726.05, "total_tokens": 6225920} -{"current_steps": 770, "total_steps": 20825, "loss": 1.0, "learning_rate": 3.85e-05, "epoch": 0.03697478991596639, "percentage": 3.7, "elapsed_time": "1:00:51", "remaining_time": "1 day, 2:25:15", "throughput": 1727.28, "total_tokens": 6307840} -{"current_steps": 780, "total_steps": 20825, "loss": 1.0441, "learning_rate": 3.9000000000000006e-05, "epoch": 0.03745498199279712, "percentage": 3.75, "elapsed_time": "1:01:36", "remaining_time": "1 day, 2:23:14", "throughput": 1728.61, "total_tokens": 6389760} -{"current_steps": 790, "total_steps": 20825, "loss": 1.0698, "learning_rate": 3.9500000000000005e-05, "epoch": 0.037935174069627854, "percentage": 3.79, "elapsed_time": "1:02:21", "remaining_time": "1 day, 2:21:17", "throughput": 1729.88, "total_tokens": 6471680} -{"current_steps": 800, "total_steps": 20825, "loss": 0.9719, "learning_rate": 4e-05, "epoch": 0.03841536614645858, "percentage": 3.84, "elapsed_time": "1:03:05", "remaining_time": "1 day, 2:19:22", "throughput": 1731.12, "total_tokens": 6553600} -{"current_steps": 810, "total_steps": 20825, "loss": 1.1387, "learning_rate": 4.05e-05, "epoch": 0.038895558223289314, "percentage": 3.89, "elapsed_time": "1:03:50", "remaining_time": "1 day, 2:17:26", "throughput": 1732.37, "total_tokens": 6635520} -{"current_steps": 820, "total_steps": 20825, "loss": 1.0304, "learning_rate": 4.1e-05, "epoch": 0.03937575030012005, "percentage": 3.94, "elapsed_time": "1:04:34", "remaining_time": "1 day, 2:15:33", "throughput": 1733.57, "total_tokens": 6717440} -{"current_steps": 830, "total_steps": 20825, "loss": 0.9735, "learning_rate": 4.15e-05, "epoch": 0.03985594237695078, "percentage": 3.99, "elapsed_time": "1:05:19", "remaining_time": "1 day, 2:13:42", "throughput": 1734.74, "total_tokens": 6799360} -{"current_steps": 840, "total_steps": 20825, "loss": 0.9434, "learning_rate": 4.2e-05, "epoch": 0.040336134453781515, "percentage": 4.03, "elapsed_time": "1:06:04", "remaining_time": "1 day, 2:11:58", "throughput": 1735.79, "total_tokens": 6881280} -{"current_steps": 850, "total_steps": 20825, "loss": 0.9919, "learning_rate": 4.25e-05, "epoch": 0.04081632653061224, "percentage": 4.08, "elapsed_time": "1:06:49", "remaining_time": "1 day, 2:10:13", "throughput": 1736.85, "total_tokens": 6963200} -{"current_steps": 860, "total_steps": 20825, "loss": 0.9973, "learning_rate": 4.3e-05, "epoch": 0.041296518607442975, "percentage": 4.13, "elapsed_time": "1:07:33", "remaining_time": "1 day, 2:08:27", "throughput": 1737.94, "total_tokens": 7045120} -{"current_steps": 870, "total_steps": 20825, "loss": 1.0275, "learning_rate": 4.35e-05, "epoch": 0.04177671068427371, "percentage": 4.18, "elapsed_time": "1:08:18", "remaining_time": "1 day, 2:06:42", "throughput": 1739.01, "total_tokens": 7127040} -{"current_steps": 880, "total_steps": 20825, "loss": 0.8301, "learning_rate": 4.4000000000000006e-05, "epoch": 0.04225690276110444, "percentage": 4.23, "elapsed_time": "1:09:02", "remaining_time": "1 day, 2:04:57", "throughput": 1740.09, "total_tokens": 7208960} -{"current_steps": 890, "total_steps": 20825, "loss": 1.3488, "learning_rate": 4.4500000000000004e-05, "epoch": 0.042737094837935176, "percentage": 4.27, "elapsed_time": "1:09:47", "remaining_time": "1 day, 2:03:15", "throughput": 1741.1, "total_tokens": 7290880} -{"current_steps": 900, "total_steps": 20825, "loss": 1.1191, "learning_rate": 4.5e-05, "epoch": 0.04321728691476591, "percentage": 4.32, "elapsed_time": "1:10:32", "remaining_time": "1 day, 2:01:34", "throughput": 1742.11, "total_tokens": 7372800} -{"current_steps": 910, "total_steps": 20825, "loss": 1.179, "learning_rate": 4.55e-05, "epoch": 0.043697478991596636, "percentage": 4.37, "elapsed_time": "1:11:17", "remaining_time": "1 day, 2:00:05", "throughput": 1742.88, "total_tokens": 7454720} -{"current_steps": 920, "total_steps": 20825, "loss": 1.0239, "learning_rate": 4.600000000000001e-05, "epoch": 0.04417767106842737, "percentage": 4.42, "elapsed_time": "1:12:01", "remaining_time": "1 day, 1:58:27", "throughput": 1743.84, "total_tokens": 7536640} -{"current_steps": 930, "total_steps": 20825, "loss": 1.0599, "learning_rate": 4.6500000000000005e-05, "epoch": 0.0446578631452581, "percentage": 4.47, "elapsed_time": "1:12:46", "remaining_time": "1 day, 1:56:52", "throughput": 1744.73, "total_tokens": 7618560} -{"current_steps": 940, "total_steps": 20825, "loss": 0.9898, "learning_rate": 4.7e-05, "epoch": 0.04513805522208884, "percentage": 4.51, "elapsed_time": "1:13:31", "remaining_time": "1 day, 1:55:15", "throughput": 1745.68, "total_tokens": 7700480} -{"current_steps": 950, "total_steps": 20825, "loss": 0.9133, "learning_rate": 4.75e-05, "epoch": 0.04561824729891957, "percentage": 4.56, "elapsed_time": "1:14:15", "remaining_time": "1 day, 1:53:40", "throughput": 1746.57, "total_tokens": 7782400} -{"current_steps": 960, "total_steps": 20825, "loss": 0.8747, "learning_rate": 4.8e-05, "epoch": 0.0460984393757503, "percentage": 4.61, "elapsed_time": "1:15:00", "remaining_time": "1 day, 1:52:08", "throughput": 1747.41, "total_tokens": 7864320} -{"current_steps": 970, "total_steps": 20825, "loss": 1.0154, "learning_rate": 4.85e-05, "epoch": 0.04657863145258103, "percentage": 4.66, "elapsed_time": "1:15:45", "remaining_time": "1 day, 1:50:36", "throughput": 1748.26, "total_tokens": 7946240} -{"current_steps": 980, "total_steps": 20825, "loss": 0.8588, "learning_rate": 4.9e-05, "epoch": 0.047058823529411764, "percentage": 4.71, "elapsed_time": "1:16:29", "remaining_time": "1 day, 1:49:03", "throughput": 1749.12, "total_tokens": 8028160} -{"current_steps": 990, "total_steps": 20825, "loss": 0.8407, "learning_rate": 4.9500000000000004e-05, "epoch": 0.0475390156062425, "percentage": 4.75, "elapsed_time": "1:17:14", "remaining_time": "1 day, 1:47:39", "throughput": 1749.83, "total_tokens": 8110080} -{"current_steps": 1000, "total_steps": 20825, "loss": 0.8889, "learning_rate": 5e-05, "epoch": 0.04801920768307323, "percentage": 4.8, "elapsed_time": "1:17:59", "remaining_time": "1 day, 1:46:09", "throughput": 1750.65, "total_tokens": 8192000} -{"current_steps": 1010, "total_steps": 20825, "loss": 1.0226, "learning_rate": 4.9999968610581127e-05, "epoch": 0.048499399759903965, "percentage": 4.85, "elapsed_time": "1:19:18", "remaining_time": "1 day, 1:55:58", "throughput": 1738.73, "total_tokens": 8273920} -{"current_steps": 1020, "total_steps": 20825, "loss": 1.0976, "learning_rate": 4.9999874442403314e-05, "epoch": 0.04897959183673469, "percentage": 4.9, "elapsed_time": "1:20:03", "remaining_time": "1 day, 1:54:34", "throughput": 1739.41, "total_tokens": 8355840} -{"current_steps": 1030, "total_steps": 20825, "loss": 1.1658, "learning_rate": 4.999971749570305e-05, "epoch": 0.049459783913565425, "percentage": 4.95, "elapsed_time": "1:20:48", "remaining_time": "1 day, 1:53:09", "throughput": 1740.11, "total_tokens": 8437760} -{"current_steps": 1040, "total_steps": 20825, "loss": 0.9763, "learning_rate": 4.999949777087444e-05, "epoch": 0.04993997599039616, "percentage": 4.99, "elapsed_time": "1:21:33", "remaining_time": "1 day, 1:51:42", "throughput": 1740.86, "total_tokens": 8519680} -{"current_steps": 1050, "total_steps": 20825, "loss": 0.8407, "learning_rate": 4.999921526846925e-05, "epoch": 0.05042016806722689, "percentage": 5.04, "elapsed_time": "1:22:18", "remaining_time": "1 day, 1:50:14", "throughput": 1741.63, "total_tokens": 8601600} -{"current_steps": 1060, "total_steps": 20825, "loss": 0.9688, "learning_rate": 4.9998869989196885e-05, "epoch": 0.050900360144057626, "percentage": 5.09, "elapsed_time": "1:23:03", "remaining_time": "1 day, 1:48:47", "throughput": 1742.38, "total_tokens": 8683520} -{"current_steps": 1070, "total_steps": 20825, "loss": 0.9459, "learning_rate": 4.99984619339244e-05, "epoch": 0.05138055222088835, "percentage": 5.14, "elapsed_time": "1:23:48", "remaining_time": "1 day, 1:47:16", "throughput": 1743.2, "total_tokens": 8765440} -{"current_steps": 1080, "total_steps": 20825, "loss": 1.0055, "learning_rate": 4.999799110367648e-05, "epoch": 0.051860744297719086, "percentage": 5.19, "elapsed_time": "1:24:33", "remaining_time": "1 day, 1:45:54", "throughput": 1743.86, "total_tokens": 8847360} -{"current_steps": 1090, "total_steps": 20825, "loss": 1.0218, "learning_rate": 4.999745749963545e-05, "epoch": 0.05234093637454982, "percentage": 5.23, "elapsed_time": "1:25:18", "remaining_time": "1 day, 1:44:29", "throughput": 1744.57, "total_tokens": 8929280} -{"current_steps": 1100, "total_steps": 20825, "loss": 0.8797, "learning_rate": 4.999686112314127e-05, "epoch": 0.05282112845138055, "percentage": 5.28, "elapsed_time": "1:26:02", "remaining_time": "1 day, 1:43:01", "throughput": 1745.35, "total_tokens": 9011200} -{"current_steps": 1110, "total_steps": 20825, "loss": 1.1579, "learning_rate": 4.999620197569155e-05, "epoch": 0.053301320528211286, "percentage": 5.33, "elapsed_time": "1:26:47", "remaining_time": "1 day, 1:41:38", "throughput": 1746.03, "total_tokens": 9093120} -{"current_steps": 1120, "total_steps": 20825, "loss": 0.8893, "learning_rate": 4.9995480058941483e-05, "epoch": 0.05378151260504202, "percentage": 5.38, "elapsed_time": "1:27:32", "remaining_time": "1 day, 1:40:14", "throughput": 1746.73, "total_tokens": 9175040} -{"current_steps": 1130, "total_steps": 20825, "loss": 0.987, "learning_rate": 4.9994695374703934e-05, "epoch": 0.05426170468187275, "percentage": 5.43, "elapsed_time": "1:28:17", "remaining_time": "1 day, 1:38:49", "throughput": 1747.46, "total_tokens": 9256960} -{"current_steps": 1140, "total_steps": 20825, "loss": 0.8846, "learning_rate": 4.9993847924949364e-05, "epoch": 0.05474189675870348, "percentage": 5.47, "elapsed_time": "1:29:02", "remaining_time": "1 day, 1:37:26", "throughput": 1748.13, "total_tokens": 9338880} -{"current_steps": 1150, "total_steps": 20825, "loss": 0.9093, "learning_rate": 4.999293771180584e-05, "epoch": 0.055222088835534214, "percentage": 5.52, "elapsed_time": "1:29:46", "remaining_time": "1 day, 1:36:03", "throughput": 1748.81, "total_tokens": 9420800} -{"current_steps": 1160, "total_steps": 20825, "loss": 1.0216, "learning_rate": 4.999196473755905e-05, "epoch": 0.05570228091236495, "percentage": 5.57, "elapsed_time": "1:30:31", "remaining_time": "1 day, 1:34:41", "throughput": 1749.49, "total_tokens": 9502720} -{"current_steps": 1170, "total_steps": 20825, "loss": 1.0765, "learning_rate": 4.9990929004652287e-05, "epoch": 0.05618247298919568, "percentage": 5.62, "elapsed_time": "1:31:16", "remaining_time": "1 day, 1:33:17", "throughput": 1750.2, "total_tokens": 9584640} -{"current_steps": 1180, "total_steps": 20825, "loss": 0.9421, "learning_rate": 4.9989830515686434e-05, "epoch": 0.05666266506602641, "percentage": 5.67, "elapsed_time": "1:32:01", "remaining_time": "1 day, 1:31:57", "throughput": 1750.83, "total_tokens": 9666560} -{"current_steps": 1190, "total_steps": 20825, "loss": 1.0168, "learning_rate": 4.998866927341995e-05, "epoch": 0.05714285714285714, "percentage": 5.71, "elapsed_time": "1:32:45", "remaining_time": "1 day, 1:30:34", "throughput": 1751.52, "total_tokens": 9748480} -{"current_steps": 1200, "total_steps": 20825, "loss": 0.9398, "learning_rate": 4.9987445280768916e-05, "epoch": 0.057623049219687875, "percentage": 5.76, "elapsed_time": "1:33:30", "remaining_time": "1 day, 1:29:21", "throughput": 1752.03, "total_tokens": 9830400} -{"current_steps": 1210, "total_steps": 20825, "loss": 1.0907, "learning_rate": 4.998615854080695e-05, "epoch": 0.05810324129651861, "percentage": 5.81, "elapsed_time": "1:34:15", "remaining_time": "1 day, 1:28:03", "throughput": 1752.62, "total_tokens": 9912320} -{"current_steps": 1220, "total_steps": 20825, "loss": 0.9021, "learning_rate": 4.998480905676527e-05, "epoch": 0.05858343337334934, "percentage": 5.86, "elapsed_time": "1:35:00", "remaining_time": "1 day, 1:26:45", "throughput": 1753.21, "total_tokens": 9994240} -{"current_steps": 1230, "total_steps": 20825, "loss": 1.2031, "learning_rate": 4.998339683203261e-05, "epoch": 0.059063625450180075, "percentage": 5.91, "elapsed_time": "1:35:45", "remaining_time": "1 day, 1:25:26", "throughput": 1753.83, "total_tokens": 10076160} -{"current_steps": 1240, "total_steps": 20825, "loss": 1.0543, "learning_rate": 4.9981921870155314e-05, "epoch": 0.0595438175270108, "percentage": 5.95, "elapsed_time": "1:36:29", "remaining_time": "1 day, 1:24:05", "throughput": 1754.48, "total_tokens": 10158080} -{"current_steps": 1250, "total_steps": 20825, "loss": 1.0474, "learning_rate": 4.998038417483721e-05, "epoch": 0.060024009603841535, "percentage": 6.0, "elapsed_time": "1:37:15", "remaining_time": "1 day, 1:22:57", "throughput": 1754.9, "total_tokens": 10240000} -{"current_steps": 1260, "total_steps": 20825, "loss": 1.0161, "learning_rate": 4.9978783749939705e-05, "epoch": 0.06050420168067227, "percentage": 6.05, "elapsed_time": "1:37:59", "remaining_time": "1 day, 1:21:41", "throughput": 1755.46, "total_tokens": 10321920} -{"current_steps": 1270, "total_steps": 20825, "loss": 0.9022, "learning_rate": 4.997712059948171e-05, "epoch": 0.060984393757503, "percentage": 6.1, "elapsed_time": "1:38:44", "remaining_time": "1 day, 1:20:28", "throughput": 1755.97, "total_tokens": 10403840} -{"current_steps": 1280, "total_steps": 20825, "loss": 0.8682, "learning_rate": 4.997539472763964e-05, "epoch": 0.061464585834333736, "percentage": 6.15, "elapsed_time": "1:39:29", "remaining_time": "1 day, 1:19:13", "throughput": 1756.52, "total_tokens": 10485760} -{"current_steps": 1290, "total_steps": 20825, "loss": 1.147, "learning_rate": 4.9973606138747434e-05, "epoch": 0.06194477791116446, "percentage": 6.19, "elapsed_time": "1:40:14", "remaining_time": "1 day, 1:18:01", "throughput": 1757.01, "total_tokens": 10567680} -{"current_steps": 1300, "total_steps": 20825, "loss": 0.8778, "learning_rate": 4.9971754837296516e-05, "epoch": 0.062424969987995196, "percentage": 6.24, "elapsed_time": "1:40:59", "remaining_time": "1 day, 1:16:45", "throughput": 1757.57, "total_tokens": 10649600} -{"current_steps": 1310, "total_steps": 20825, "loss": 1.249, "learning_rate": 4.9969840827935776e-05, "epoch": 0.06290516206482594, "percentage": 6.29, "elapsed_time": "1:41:44", "remaining_time": "1 day, 1:15:41", "throughput": 1757.9, "total_tokens": 10731520} -{"current_steps": 1320, "total_steps": 20825, "loss": 0.6743, "learning_rate": 4.99678641154716e-05, "epoch": 0.06338535414165666, "percentage": 6.34, "elapsed_time": "1:42:30", "remaining_time": "1 day, 1:14:37", "throughput": 1758.25, "total_tokens": 10813440} -{"current_steps": 1330, "total_steps": 20825, "loss": 1.0631, "learning_rate": 4.9965824704867806e-05, "epoch": 0.06386554621848739, "percentage": 6.39, "elapsed_time": "1:43:15", "remaining_time": "1 day, 1:13:26", "throughput": 1758.73, "total_tokens": 10895360} -{"current_steps": 1340, "total_steps": 20825, "loss": 0.8721, "learning_rate": 4.996372260124567e-05, "epoch": 0.06434573829531813, "percentage": 6.43, "elapsed_time": "1:44:00", "remaining_time": "1 day, 1:12:19", "throughput": 1759.1, "total_tokens": 10977280} -{"current_steps": 1350, "total_steps": 20825, "loss": 0.7503, "learning_rate": 4.996155780988389e-05, "epoch": 0.06482593037214886, "percentage": 6.48, "elapsed_time": "1:44:45", "remaining_time": "1 day, 1:11:13", "throughput": 1759.48, "total_tokens": 11059200} -{"current_steps": 1360, "total_steps": 20825, "loss": 0.8589, "learning_rate": 4.9959330336218605e-05, "epoch": 0.0653061224489796, "percentage": 6.53, "elapsed_time": "1:45:30", "remaining_time": "1 day, 1:09:59", "throughput": 1760.01, "total_tokens": 11141120} -{"current_steps": 1370, "total_steps": 20825, "loss": 0.9261, "learning_rate": 4.995704018584334e-05, "epoch": 0.06578631452581032, "percentage": 6.58, "elapsed_time": "1:46:15", "remaining_time": "1 day, 1:08:50", "throughput": 1760.46, "total_tokens": 11223040} -{"current_steps": 1380, "total_steps": 20825, "loss": 0.7139, "learning_rate": 4.9954687364508996e-05, "epoch": 0.06626650660264105, "percentage": 6.63, "elapsed_time": "1:47:00", "remaining_time": "1 day, 1:07:43", "throughput": 1760.86, "total_tokens": 11304960} -{"current_steps": 1390, "total_steps": 20825, "loss": 0.8474, "learning_rate": 4.995227187812389e-05, "epoch": 0.06674669867947179, "percentage": 6.67, "elapsed_time": "1:47:44", "remaining_time": "1 day, 1:06:31", "throughput": 1761.35, "total_tokens": 11386880} -{"current_steps": 1400, "total_steps": 20825, "loss": 1.0527, "learning_rate": 4.9949793732753656e-05, "epoch": 0.06722689075630252, "percentage": 6.72, "elapsed_time": "1:48:29", "remaining_time": "1 day, 1:05:18", "throughput": 1761.87, "total_tokens": 11468800} -{"current_steps": 1410, "total_steps": 20825, "loss": 0.9405, "learning_rate": 4.994725293462132e-05, "epoch": 0.06770708283313326, "percentage": 6.77, "elapsed_time": "1:49:14", "remaining_time": "1 day, 1:04:06", "throughput": 1762.37, "total_tokens": 11550720} -{"current_steps": 1420, "total_steps": 20825, "loss": 0.9588, "learning_rate": 4.994464949010722e-05, "epoch": 0.06818727490996399, "percentage": 6.82, "elapsed_time": "1:49:58", "remaining_time": "1 day, 1:02:53", "throughput": 1762.88, "total_tokens": 11632640} -{"current_steps": 1430, "total_steps": 20825, "loss": 0.9032, "learning_rate": 4.994198340574898e-05, "epoch": 0.06866746698679471, "percentage": 6.87, "elapsed_time": "1:50:43", "remaining_time": "1 day, 1:01:44", "throughput": 1763.33, "total_tokens": 11714560} -{"current_steps": 1440, "total_steps": 20825, "loss": 0.8397, "learning_rate": 4.993925468824156e-05, "epoch": 0.06914765906362545, "percentage": 6.91, "elapsed_time": "1:51:28", "remaining_time": "1 day, 1:00:34", "throughput": 1763.79, "total_tokens": 11796480} -{"current_steps": 1450, "total_steps": 20825, "loss": 0.9019, "learning_rate": 4.99364633444372e-05, "epoch": 0.06962785114045618, "percentage": 6.96, "elapsed_time": "1:52:13", "remaining_time": "1 day, 0:59:28", "throughput": 1764.18, "total_tokens": 11878400} -{"current_steps": 1460, "total_steps": 20825, "loss": 0.999, "learning_rate": 4.993360938134537e-05, "epoch": 0.07010804321728692, "percentage": 7.01, "elapsed_time": "1:52:58", "remaining_time": "1 day, 0:58:21", "throughput": 1764.57, "total_tokens": 11960320} -{"current_steps": 1470, "total_steps": 20825, "loss": 1.0207, "learning_rate": 4.993069280613282e-05, "epoch": 0.07058823529411765, "percentage": 7.06, "elapsed_time": "1:53:42", "remaining_time": "1 day, 0:57:15", "throughput": 1764.96, "total_tokens": 12042240} -{"current_steps": 1480, "total_steps": 20825, "loss": 0.9636, "learning_rate": 4.9927713626123524e-05, "epoch": 0.07106842737094837, "percentage": 7.11, "elapsed_time": "1:54:27", "remaining_time": "1 day, 0:56:05", "throughput": 1765.43, "total_tokens": 12124160} -{"current_steps": 1490, "total_steps": 20825, "loss": 0.9386, "learning_rate": 4.992467184879865e-05, "epoch": 0.07154861944777911, "percentage": 7.15, "elapsed_time": "1:55:12", "remaining_time": "1 day, 0:55:03", "throughput": 1765.73, "total_tokens": 12206080} -{"current_steps": 1500, "total_steps": 20825, "loss": 1.0065, "learning_rate": 4.9921567481796585e-05, "epoch": 0.07202881152460984, "percentage": 7.2, "elapsed_time": "1:55:57", "remaining_time": "1 day, 0:53:55", "throughput": 1766.15, "total_tokens": 12288000} -{"current_steps": 1510, "total_steps": 20825, "loss": 0.9552, "learning_rate": 4.9918400532912845e-05, "epoch": 0.07250900360144058, "percentage": 7.25, "elapsed_time": "1:56:45", "remaining_time": "1 day, 0:53:27", "throughput": 1765.8, "total_tokens": 12369920} -{"current_steps": 1520, "total_steps": 20825, "loss": 0.9035, "learning_rate": 4.991517101010015e-05, "epoch": 0.07298919567827131, "percentage": 7.3, "elapsed_time": "1:57:30", "remaining_time": "1 day, 0:52:30", "throughput": 1766.01, "total_tokens": 12451840} -{"current_steps": 1530, "total_steps": 20825, "loss": 1.0423, "learning_rate": 4.9911878921468304e-05, "epoch": 0.07346938775510205, "percentage": 7.35, "elapsed_time": "1:58:15", "remaining_time": "1 day, 0:51:24", "throughput": 1766.4, "total_tokens": 12533760} -{"current_steps": 1540, "total_steps": 20825, "loss": 0.9216, "learning_rate": 4.990852427528427e-05, "epoch": 0.07394957983193277, "percentage": 7.39, "elapsed_time": "1:59:00", "remaining_time": "1 day, 0:50:16", "throughput": 1766.81, "total_tokens": 12615680} -{"current_steps": 1550, "total_steps": 20825, "loss": 0.9563, "learning_rate": 4.9905107079972064e-05, "epoch": 0.0744297719087635, "percentage": 7.44, "elapsed_time": "1:59:45", "remaining_time": "1 day, 0:49:13", "throughput": 1767.15, "total_tokens": 12697600} -{"current_steps": 1560, "total_steps": 20825, "loss": 0.9665, "learning_rate": 4.990162734411279e-05, "epoch": 0.07490996398559424, "percentage": 7.49, "elapsed_time": "2:00:30", "remaining_time": "1 day, 0:48:08", "throughput": 1767.52, "total_tokens": 12779520} -{"current_steps": 1570, "total_steps": 20825, "loss": 1.0059, "learning_rate": 4.989808507644461e-05, "epoch": 0.07539015606242497, "percentage": 7.54, "elapsed_time": "2:01:14", "remaining_time": "1 day, 0:46:59", "throughput": 1767.96, "total_tokens": 12861440} -{"current_steps": 1580, "total_steps": 20825, "loss": 0.9245, "learning_rate": 4.989448028586269e-05, "epoch": 0.07587034813925571, "percentage": 7.59, "elapsed_time": "2:01:59", "remaining_time": "1 day, 0:45:51", "throughput": 1768.39, "total_tokens": 12943360} -{"current_steps": 1590, "total_steps": 20825, "loss": 0.8285, "learning_rate": 4.989081298141921e-05, "epoch": 0.07635054021608643, "percentage": 7.64, "elapsed_time": "2:02:44", "remaining_time": "1 day, 0:44:49", "throughput": 1768.71, "total_tokens": 13025280} -{"current_steps": 1600, "total_steps": 20825, "loss": 0.8067, "learning_rate": 4.988708317232334e-05, "epoch": 0.07683073229291716, "percentage": 7.68, "elapsed_time": "2:03:29", "remaining_time": "1 day, 0:43:44", "throughput": 1769.09, "total_tokens": 13107200} -{"current_steps": 1610, "total_steps": 20825, "loss": 0.8029, "learning_rate": 4.988329086794122e-05, "epoch": 0.0773109243697479, "percentage": 7.73, "elapsed_time": "2:04:14", "remaining_time": "1 day, 0:42:42", "throughput": 1769.39, "total_tokens": 13189120} -{"current_steps": 1620, "total_steps": 20825, "loss": 1.1687, "learning_rate": 4.9879436077795884e-05, "epoch": 0.07779111644657863, "percentage": 7.78, "elapsed_time": "2:04:59", "remaining_time": "1 day, 0:41:41", "throughput": 1769.68, "total_tokens": 13271040} -{"current_steps": 1630, "total_steps": 20825, "loss": 0.9474, "learning_rate": 4.98755188115673e-05, "epoch": 0.07827130852340937, "percentage": 7.83, "elapsed_time": "2:05:44", "remaining_time": "1 day, 0:40:39", "throughput": 1770.0, "total_tokens": 13352960} -{"current_steps": 1640, "total_steps": 20825, "loss": 0.9421, "learning_rate": 4.9871539079092344e-05, "epoch": 0.0787515006002401, "percentage": 7.88, "elapsed_time": "2:06:28", "remaining_time": "1 day, 0:39:32", "throughput": 1770.4, "total_tokens": 13434880} -{"current_steps": 1650, "total_steps": 20825, "loss": 1.0174, "learning_rate": 4.9867496890364726e-05, "epoch": 0.07923169267707082, "percentage": 7.92, "elapsed_time": "2:07:13", "remaining_time": "1 day, 0:38:27", "throughput": 1770.79, "total_tokens": 13516800} -{"current_steps": 1660, "total_steps": 20825, "loss": 1.1363, "learning_rate": 4.9863392255535e-05, "epoch": 0.07971188475390156, "percentage": 7.97, "elapsed_time": "2:07:58", "remaining_time": "1 day, 0:37:31", "throughput": 1770.97, "total_tokens": 13598720} -{"current_steps": 1670, "total_steps": 20825, "loss": 0.9505, "learning_rate": 4.985922518491054e-05, "epoch": 0.08019207683073229, "percentage": 8.02, "elapsed_time": "2:08:43", "remaining_time": "1 day, 0:36:31", "throughput": 1771.25, "total_tokens": 13680640} -{"current_steps": 1680, "total_steps": 20825, "loss": 1.0416, "learning_rate": 4.9854995688955494e-05, "epoch": 0.08067226890756303, "percentage": 8.07, "elapsed_time": "2:09:28", "remaining_time": "1 day, 0:35:27", "throughput": 1771.61, "total_tokens": 13762560} -{"current_steps": 1690, "total_steps": 20825, "loss": 1.164, "learning_rate": 4.9850703778290784e-05, "epoch": 0.08115246098439376, "percentage": 8.12, "elapsed_time": "2:10:13", "remaining_time": "1 day, 0:34:23", "throughput": 1771.96, "total_tokens": 13844480} -{"current_steps": 1700, "total_steps": 20825, "loss": 1.0884, "learning_rate": 4.984634946369404e-05, "epoch": 0.08163265306122448, "percentage": 8.16, "elapsed_time": "2:10:58", "remaining_time": "1 day, 0:33:24", "throughput": 1772.21, "total_tokens": 13926400} -{"current_steps": 1710, "total_steps": 20825, "loss": 1.2702, "learning_rate": 4.984193275609964e-05, "epoch": 0.08211284513805522, "percentage": 8.21, "elapsed_time": "2:11:42", "remaining_time": "1 day, 0:32:21", "throughput": 1772.56, "total_tokens": 14008320} -{"current_steps": 1720, "total_steps": 20825, "loss": 0.9906, "learning_rate": 4.983745366659859e-05, "epoch": 0.08259303721488595, "percentage": 8.26, "elapsed_time": "2:12:27", "remaining_time": "1 day, 0:31:18", "throughput": 1772.89, "total_tokens": 14090240} -{"current_steps": 1730, "total_steps": 20825, "loss": 0.9924, "learning_rate": 4.983291220643858e-05, "epoch": 0.08307322929171669, "percentage": 8.31, "elapsed_time": "2:13:12", "remaining_time": "1 day, 0:30:14", "throughput": 1773.24, "total_tokens": 14172160} -{"current_steps": 1740, "total_steps": 20825, "loss": 1.0358, "learning_rate": 4.982830838702392e-05, "epoch": 0.08355342136854742, "percentage": 8.36, "elapsed_time": "2:13:56", "remaining_time": "1 day, 0:29:12", "throughput": 1773.56, "total_tokens": 14254080} -{"current_steps": 1750, "total_steps": 20825, "loss": 0.9054, "learning_rate": 4.98236422199155e-05, "epoch": 0.08403361344537816, "percentage": 8.4, "elapsed_time": "2:14:41", "remaining_time": "1 day, 0:28:10", "throughput": 1773.89, "total_tokens": 14336000} -{"current_steps": 1760, "total_steps": 20825, "loss": 0.985, "learning_rate": 4.9818913716830784e-05, "epoch": 0.08451380552220888, "percentage": 8.45, "elapsed_time": "2:15:26", "remaining_time": "1 day, 0:27:11", "throughput": 1774.13, "total_tokens": 14417920} -{"current_steps": 1770, "total_steps": 20825, "loss": 1.0279, "learning_rate": 4.981412288964377e-05, "epoch": 0.08499399759903961, "percentage": 8.5, "elapsed_time": "2:16:11", "remaining_time": "1 day, 0:26:10", "throughput": 1774.45, "total_tokens": 14499840} -{"current_steps": 1780, "total_steps": 20825, "loss": 1.01, "learning_rate": 4.9809269750384956e-05, "epoch": 0.08547418967587035, "percentage": 8.55, "elapsed_time": "2:16:56", "remaining_time": "1 day, 0:25:08", "throughput": 1774.76, "total_tokens": 14581760} -{"current_steps": 1790, "total_steps": 20825, "loss": 1.1156, "learning_rate": 4.980435431124133e-05, "epoch": 0.08595438175270108, "percentage": 8.6, "elapsed_time": "2:17:41", "remaining_time": "1 day, 0:24:08", "throughput": 1775.04, "total_tokens": 14663680} -{"current_steps": 1800, "total_steps": 20825, "loss": 0.9487, "learning_rate": 4.97993765845563e-05, "epoch": 0.08643457382953182, "percentage": 8.64, "elapsed_time": "2:18:26", "remaining_time": "1 day, 0:23:10", "throughput": 1775.28, "total_tokens": 14745600} -{"current_steps": 1810, "total_steps": 20825, "loss": 0.9613, "learning_rate": 4.9794336582829714e-05, "epoch": 0.08691476590636255, "percentage": 8.69, "elapsed_time": "2:19:10", "remaining_time": "1 day, 0:22:08", "throughput": 1775.6, "total_tokens": 14827520} -{"current_steps": 1820, "total_steps": 20825, "loss": 1.0248, "learning_rate": 4.9789234318717784e-05, "epoch": 0.08739495798319327, "percentage": 8.74, "elapsed_time": "2:19:55", "remaining_time": "1 day, 0:21:06", "throughput": 1775.91, "total_tokens": 14909440} -{"current_steps": 1830, "total_steps": 20825, "loss": 1.0187, "learning_rate": 4.978406980503308e-05, "epoch": 0.08787515006002401, "percentage": 8.79, "elapsed_time": "2:20:40", "remaining_time": "1 day, 0:20:05", "throughput": 1776.22, "total_tokens": 14991360} -{"current_steps": 1840, "total_steps": 20825, "loss": 0.9926, "learning_rate": 4.9778843054744494e-05, "epoch": 0.08835534213685474, "percentage": 8.84, "elapsed_time": "2:21:24", "remaining_time": "1 day, 0:19:07", "throughput": 1776.47, "total_tokens": 15073280} -{"current_steps": 1850, "total_steps": 20825, "loss": 0.9672, "learning_rate": 4.977355408097719e-05, "epoch": 0.08883553421368548, "percentage": 8.88, "elapsed_time": "2:22:09", "remaining_time": "1 day, 0:18:05", "throughput": 1776.79, "total_tokens": 15155200} -{"current_steps": 1860, "total_steps": 20825, "loss": 0.8497, "learning_rate": 4.9768202897012595e-05, "epoch": 0.0893157262905162, "percentage": 8.93, "elapsed_time": "2:22:54", "remaining_time": "1 day, 0:17:04", "throughput": 1777.09, "total_tokens": 15237120} -{"current_steps": 1870, "total_steps": 20825, "loss": 1.0258, "learning_rate": 4.9762789516288354e-05, "epoch": 0.08979591836734693, "percentage": 8.98, "elapsed_time": "2:23:38", "remaining_time": "1 day, 0:16:02", "throughput": 1777.42, "total_tokens": 15319040} -{"current_steps": 1880, "total_steps": 20825, "loss": 0.9799, "learning_rate": 4.97573139523983e-05, "epoch": 0.09027611044417767, "percentage": 9.03, "elapsed_time": "2:24:23", "remaining_time": "1 day, 0:15:03", "throughput": 1777.69, "total_tokens": 15400960} -{"current_steps": 1890, "total_steps": 20825, "loss": 1.0616, "learning_rate": 4.9751776219092405e-05, "epoch": 0.0907563025210084, "percentage": 9.08, "elapsed_time": "2:25:08", "remaining_time": "1 day, 0:14:03", "throughput": 1777.96, "total_tokens": 15482880} -{"current_steps": 1900, "total_steps": 20825, "loss": 0.894, "learning_rate": 4.9746176330276783e-05, "epoch": 0.09123649459783914, "percentage": 9.12, "elapsed_time": "2:25:53", "remaining_time": "1 day, 0:13:06", "throughput": 1778.17, "total_tokens": 15564800} -{"current_steps": 1910, "total_steps": 20825, "loss": 1.069, "learning_rate": 4.97405143000136e-05, "epoch": 0.09171668667466987, "percentage": 9.17, "elapsed_time": "2:26:38", "remaining_time": "1 day, 0:12:08", "throughput": 1778.43, "total_tokens": 15646720} -{"current_steps": 1920, "total_steps": 20825, "loss": 1.0716, "learning_rate": 4.9734790142521096e-05, "epoch": 0.0921968787515006, "percentage": 9.22, "elapsed_time": "2:27:23", "remaining_time": "1 day, 0:11:12", "throughput": 1778.63, "total_tokens": 15728640} -{"current_steps": 1930, "total_steps": 20825, "loss": 1.1271, "learning_rate": 4.9729003872173494e-05, "epoch": 0.09267707082833133, "percentage": 9.27, "elapsed_time": "2:28:08", "remaining_time": "1 day, 0:10:15", "throughput": 1778.86, "total_tokens": 15810560} -{"current_steps": 1940, "total_steps": 20825, "loss": 0.9171, "learning_rate": 4.972315550350102e-05, "epoch": 0.09315726290516206, "percentage": 9.32, "elapsed_time": "2:28:53", "remaining_time": "1 day, 0:09:19", "throughput": 1779.06, "total_tokens": 15892480} -{"current_steps": 1950, "total_steps": 20825, "loss": 0.9881, "learning_rate": 4.971724505118982e-05, "epoch": 0.0936374549819928, "percentage": 9.36, "elapsed_time": "2:29:37", "remaining_time": "1 day, 0:08:20", "throughput": 1779.33, "total_tokens": 15974400} -{"current_steps": 1960, "total_steps": 20825, "loss": 1.0533, "learning_rate": 4.971127253008194e-05, "epoch": 0.09411764705882353, "percentage": 9.41, "elapsed_time": "2:30:22", "remaining_time": "1 day, 0:07:24", "throughput": 1779.54, "total_tokens": 16056320} -{"current_steps": 1970, "total_steps": 20825, "loss": 1.0697, "learning_rate": 4.970523795517532e-05, "epoch": 0.09459783913565427, "percentage": 9.46, "elapsed_time": "2:31:07", "remaining_time": "1 day, 0:06:25", "throughput": 1779.8, "total_tokens": 16138240} -{"current_steps": 1980, "total_steps": 20825, "loss": 0.8598, "learning_rate": 4.969914134162368e-05, "epoch": 0.095078031212485, "percentage": 9.51, "elapsed_time": "2:31:52", "remaining_time": "1 day, 0:05:30", "throughput": 1779.98, "total_tokens": 16220160} -{"current_steps": 1990, "total_steps": 20825, "loss": 0.9143, "learning_rate": 4.9692982704736566e-05, "epoch": 0.09555822328931572, "percentage": 9.56, "elapsed_time": "2:32:37", "remaining_time": "1 day, 0:04:33", "throughput": 1780.21, "total_tokens": 16302080} -{"current_steps": 2000, "total_steps": 20825, "loss": 0.8093, "learning_rate": 4.968676205997925e-05, "epoch": 0.09603841536614646, "percentage": 9.6, "elapsed_time": "2:33:22", "remaining_time": "1 day, 0:03:36", "throughput": 1780.42, "total_tokens": 16384000} -{"current_steps": 2010, "total_steps": 20825, "loss": 1.0241, "learning_rate": 4.9680479422972735e-05, "epoch": 0.09651860744297719, "percentage": 9.65, "elapsed_time": "2:34:17", "remaining_time": "1 day, 0:04:13", "throughput": 1778.72, "total_tokens": 16465920} -{"current_steps": 2020, "total_steps": 20825, "loss": 0.9488, "learning_rate": 4.9674134809493686e-05, "epoch": 0.09699879951980793, "percentage": 9.7, "elapsed_time": "2:35:01", "remaining_time": "1 day, 0:03:13", "throughput": 1779.01, "total_tokens": 16547840} -{"current_steps": 2030, "total_steps": 20825, "loss": 0.9864, "learning_rate": 4.9667728235474396e-05, "epoch": 0.09747899159663866, "percentage": 9.75, "elapsed_time": "2:35:46", "remaining_time": "1 day, 0:02:14", "throughput": 1779.27, "total_tokens": 16629760} -{"current_steps": 2040, "total_steps": 20825, "loss": 0.8736, "learning_rate": 4.9661259717002764e-05, "epoch": 0.09795918367346938, "percentage": 9.8, "elapsed_time": "2:36:31", "remaining_time": "1 day, 0:01:18", "throughput": 1779.48, "total_tokens": 16711680} -{"current_steps": 2050, "total_steps": 20825, "loss": 1.0361, "learning_rate": 4.9654729270322234e-05, "epoch": 0.09843937575030012, "percentage": 9.84, "elapsed_time": "2:37:15", "remaining_time": "1 day, 0:00:18", "throughput": 1779.78, "total_tokens": 16793600} -{"current_steps": 2060, "total_steps": 20825, "loss": 0.9958, "learning_rate": 4.964813691183174e-05, "epoch": 0.09891956782713085, "percentage": 9.89, "elapsed_time": "2:38:00", "remaining_time": "23:59:18", "throughput": 1780.05, "total_tokens": 16875520} -{"current_steps": 2070, "total_steps": 20825, "loss": 0.8843, "learning_rate": 4.964148265808573e-05, "epoch": 0.09939975990396159, "percentage": 9.94, "elapsed_time": "2:38:44", "remaining_time": "23:58:18", "throughput": 1780.34, "total_tokens": 16957440} -{"current_steps": 2080, "total_steps": 20825, "loss": 0.8698, "learning_rate": 4.963476652579404e-05, "epoch": 0.09987995198079232, "percentage": 9.99, "elapsed_time": "2:39:29", "remaining_time": "23:57:20", "throughput": 1780.59, "total_tokens": 17039360} -{"current_steps": 2090, "total_steps": 20825, "loss": 1.1505, "learning_rate": 4.962798853182192e-05, "epoch": 0.10036014405762304, "percentage": 10.04, "elapsed_time": "2:40:14", "remaining_time": "23:56:24", "throughput": 1780.8, "total_tokens": 17121280} -{"current_steps": 2100, "total_steps": 20825, "loss": 1.131, "learning_rate": 4.9621148693189954e-05, "epoch": 0.10084033613445378, "percentage": 10.08, "elapsed_time": "2:40:59", "remaining_time": "23:55:26", "throughput": 1781.04, "total_tokens": 17203200} -{"current_steps": 2110, "total_steps": 20825, "loss": 1.2084, "learning_rate": 4.9614247027074024e-05, "epoch": 0.10132052821128451, "percentage": 10.13, "elapsed_time": "2:41:43", "remaining_time": "23:54:29", "throughput": 1781.28, "total_tokens": 17285120} -{"current_steps": 2120, "total_steps": 20825, "loss": 0.822, "learning_rate": 4.960728355080527e-05, "epoch": 0.10180072028811525, "percentage": 10.18, "elapsed_time": "2:42:28", "remaining_time": "23:53:31", "throughput": 1781.53, "total_tokens": 17367040} -{"current_steps": 2130, "total_steps": 20825, "loss": 0.9156, "learning_rate": 4.9600258281870046e-05, "epoch": 0.10228091236494598, "percentage": 10.23, "elapsed_time": "2:43:13", "remaining_time": "23:52:34", "throughput": 1781.75, "total_tokens": 17448960} -{"current_steps": 2140, "total_steps": 20825, "loss": 0.9211, "learning_rate": 4.959317123790988e-05, "epoch": 0.1027611044417767, "percentage": 10.28, "elapsed_time": "2:43:57", "remaining_time": "23:51:37", "throughput": 1781.98, "total_tokens": 17530880} -{"current_steps": 2150, "total_steps": 20825, "loss": 0.9979, "learning_rate": 4.958602243672145e-05, "epoch": 0.10324129651860744, "percentage": 10.32, "elapsed_time": "2:44:42", "remaining_time": "23:50:38", "throughput": 1782.24, "total_tokens": 17612800} -{"current_steps": 2160, "total_steps": 20825, "loss": 0.9711, "learning_rate": 4.9578811896256475e-05, "epoch": 0.10372148859543817, "percentage": 10.37, "elapsed_time": "2:45:27", "remaining_time": "23:49:41", "throughput": 1782.48, "total_tokens": 17694720} -{"current_steps": 2170, "total_steps": 20825, "loss": 0.9847, "learning_rate": 4.957153963462172e-05, "epoch": 0.10420168067226891, "percentage": 10.42, "elapsed_time": "2:46:11", "remaining_time": "23:48:43", "throughput": 1782.74, "total_tokens": 17776640} -{"current_steps": 2180, "total_steps": 20825, "loss": 0.9521, "learning_rate": 4.9564205670078965e-05, "epoch": 0.10468187274909964, "percentage": 10.47, "elapsed_time": "2:46:56", "remaining_time": "23:47:51", "throughput": 1782.85, "total_tokens": 17858560} -{"current_steps": 2190, "total_steps": 20825, "loss": 0.9161, "learning_rate": 4.955681002104492e-05, "epoch": 0.10516206482593037, "percentage": 10.52, "elapsed_time": "2:47:41", "remaining_time": "23:46:55", "throughput": 1783.07, "total_tokens": 17940480} -{"current_steps": 2200, "total_steps": 20825, "loss": 0.944, "learning_rate": 4.954935270609119e-05, "epoch": 0.1056422569027611, "percentage": 10.56, "elapsed_time": "2:48:26", "remaining_time": "23:45:57", "throughput": 1783.32, "total_tokens": 18022400} -{"current_steps": 2210, "total_steps": 20825, "loss": 1.0233, "learning_rate": 4.9541833743944244e-05, "epoch": 0.10612244897959183, "percentage": 10.61, "elapsed_time": "2:49:10", "remaining_time": "23:45:02", "throughput": 1783.51, "total_tokens": 18104320} -{"current_steps": 2220, "total_steps": 20825, "loss": 0.9329, "learning_rate": 4.953425315348534e-05, "epoch": 0.10660264105642257, "percentage": 10.66, "elapsed_time": "2:49:55", "remaining_time": "23:44:04", "throughput": 1783.75, "total_tokens": 18186240} -{"current_steps": 2230, "total_steps": 20825, "loss": 0.9987, "learning_rate": 4.952661095375051e-05, "epoch": 0.1070828331332533, "percentage": 10.71, "elapsed_time": "2:50:40", "remaining_time": "23:43:09", "throughput": 1783.95, "total_tokens": 18268160} -{"current_steps": 2240, "total_steps": 20825, "loss": 0.8519, "learning_rate": 4.95189071639305e-05, "epoch": 0.10756302521008404, "percentage": 10.76, "elapsed_time": "2:51:24", "remaining_time": "23:42:12", "throughput": 1784.17, "total_tokens": 18350080} -{"current_steps": 2250, "total_steps": 20825, "loss": 0.8418, "learning_rate": 4.951114180337069e-05, "epoch": 0.10804321728691477, "percentage": 10.8, "elapsed_time": "2:52:09", "remaining_time": "23:41:19", "throughput": 1784.33, "total_tokens": 18432000} -{"current_steps": 2260, "total_steps": 20825, "loss": 0.7989, "learning_rate": 4.95033148915711e-05, "epoch": 0.1085234093637455, "percentage": 10.85, "elapsed_time": "2:52:54", "remaining_time": "23:40:25", "throughput": 1784.49, "total_tokens": 18513920} -{"current_steps": 2270, "total_steps": 20825, "loss": 0.8756, "learning_rate": 4.949542644818631e-05, "epoch": 0.10900360144057623, "percentage": 10.9, "elapsed_time": "2:53:39", "remaining_time": "23:39:30", "throughput": 1784.69, "total_tokens": 18595840} -{"current_steps": 2280, "total_steps": 20825, "loss": 1.0697, "learning_rate": 4.948747649302542e-05, "epoch": 0.10948379351740696, "percentage": 10.95, "elapsed_time": "2:54:24", "remaining_time": "23:38:33", "throughput": 1784.91, "total_tokens": 18677760} -{"current_steps": 2290, "total_steps": 20825, "loss": 0.9839, "learning_rate": 4.947946504605198e-05, "epoch": 0.1099639855942377, "percentage": 11.0, "elapsed_time": "2:55:08", "remaining_time": "23:37:36", "throughput": 1785.16, "total_tokens": 18759680} -{"current_steps": 2300, "total_steps": 20825, "loss": 0.9213, "learning_rate": 4.947139212738395e-05, "epoch": 0.11044417767106843, "percentage": 11.04, "elapsed_time": "2:55:53", "remaining_time": "23:36:40", "throughput": 1785.36, "total_tokens": 18841600} -{"current_steps": 2310, "total_steps": 20825, "loss": 1.0463, "learning_rate": 4.946325775729368e-05, "epoch": 0.11092436974789915, "percentage": 11.09, "elapsed_time": "2:56:38", "remaining_time": "23:35:46", "throughput": 1785.53, "total_tokens": 18923520} -{"current_steps": 2320, "total_steps": 20825, "loss": 0.9103, "learning_rate": 4.945506195620784e-05, "epoch": 0.1114045618247299, "percentage": 11.14, "elapsed_time": "2:57:23", "remaining_time": "23:34:52", "throughput": 1785.7, "total_tokens": 19005440} -{"current_steps": 2330, "total_steps": 20825, "loss": 0.9041, "learning_rate": 4.944680474470731e-05, "epoch": 0.11188475390156062, "percentage": 11.19, "elapsed_time": "2:58:07", "remaining_time": "23:33:57", "throughput": 1785.89, "total_tokens": 19087360} -{"current_steps": 2340, "total_steps": 20825, "loss": 1.1012, "learning_rate": 4.943848614352724e-05, "epoch": 0.11236494597839136, "percentage": 11.24, "elapsed_time": "2:58:52", "remaining_time": "23:33:02", "throughput": 1786.09, "total_tokens": 19169280} -{"current_steps": 2350, "total_steps": 20825, "loss": 0.8855, "learning_rate": 4.943010617355691e-05, "epoch": 0.11284513805522209, "percentage": 11.28, "elapsed_time": "2:59:37", "remaining_time": "23:32:07", "throughput": 1786.28, "total_tokens": 19251200} -{"current_steps": 2360, "total_steps": 20825, "loss": 0.9905, "learning_rate": 4.94216648558397e-05, "epoch": 0.11332533013205282, "percentage": 11.33, "elapsed_time": "3:00:21", "remaining_time": "23:31:12", "throughput": 1786.48, "total_tokens": 19333120} -{"current_steps": 2370, "total_steps": 20825, "loss": 0.8465, "learning_rate": 4.9413162211573075e-05, "epoch": 0.11380552220888356, "percentage": 11.38, "elapsed_time": "3:01:06", "remaining_time": "23:30:19", "throughput": 1786.63, "total_tokens": 19415040} -{"current_steps": 2380, "total_steps": 20825, "loss": 1.3091, "learning_rate": 4.9404598262108456e-05, "epoch": 0.11428571428571428, "percentage": 11.43, "elapsed_time": "3:01:51", "remaining_time": "23:29:27", "throughput": 1786.76, "total_tokens": 19496960} -{"current_steps": 2390, "total_steps": 20825, "loss": 1.0505, "learning_rate": 4.939597302895125e-05, "epoch": 0.11476590636254502, "percentage": 11.48, "elapsed_time": "3:02:36", "remaining_time": "23:28:32", "throughput": 1786.94, "total_tokens": 19578880} -{"current_steps": 2400, "total_steps": 20825, "loss": 0.9624, "learning_rate": 4.938728653376075e-05, "epoch": 0.11524609843937575, "percentage": 11.52, "elapsed_time": "3:03:21", "remaining_time": "23:27:37", "throughput": 1787.15, "total_tokens": 19660800} -{"current_steps": 2410, "total_steps": 20825, "loss": 0.882, "learning_rate": 4.9378538798350046e-05, "epoch": 0.11572629051620648, "percentage": 11.57, "elapsed_time": "3:04:05", "remaining_time": "23:26:43", "throughput": 1787.32, "total_tokens": 19742720} -{"current_steps": 2420, "total_steps": 20825, "loss": 0.802, "learning_rate": 4.936972984468608e-05, "epoch": 0.11620648259303722, "percentage": 11.62, "elapsed_time": "3:04:51", "remaining_time": "23:25:54", "throughput": 1787.39, "total_tokens": 19824640} -{"current_steps": 2430, "total_steps": 20825, "loss": 0.8687, "learning_rate": 4.936085969488947e-05, "epoch": 0.11668667466986794, "percentage": 11.67, "elapsed_time": "3:05:36", "remaining_time": "23:25:00", "throughput": 1787.56, "total_tokens": 19906560} -{"current_steps": 2440, "total_steps": 20825, "loss": 0.7774, "learning_rate": 4.9351928371234525e-05, "epoch": 0.11716686674669868, "percentage": 11.72, "elapsed_time": "3:06:21", "remaining_time": "23:24:07", "throughput": 1787.71, "total_tokens": 19988480} -{"current_steps": 2450, "total_steps": 20825, "loss": 0.8777, "learning_rate": 4.934293589614917e-05, "epoch": 0.11764705882352941, "percentage": 11.76, "elapsed_time": "3:07:05", "remaining_time": "23:23:12", "throughput": 1787.9, "total_tokens": 20070400} -{"current_steps": 2460, "total_steps": 20825, "loss": 1.0353, "learning_rate": 4.93338822922149e-05, "epoch": 0.11812725090036015, "percentage": 11.81, "elapsed_time": "3:07:50", "remaining_time": "23:22:18", "throughput": 1788.07, "total_tokens": 20152320} -{"current_steps": 2470, "total_steps": 20825, "loss": 0.9866, "learning_rate": 4.932476758216669e-05, "epoch": 0.11860744297719088, "percentage": 11.86, "elapsed_time": "3:08:35", "remaining_time": "23:21:25", "throughput": 1788.22, "total_tokens": 20234240} -{"current_steps": 2480, "total_steps": 20825, "loss": 0.9443, "learning_rate": 4.931559178889297e-05, "epoch": 0.1190876350540216, "percentage": 11.91, "elapsed_time": "3:09:19", "remaining_time": "23:20:31", "throughput": 1788.41, "total_tokens": 20316160} -{"current_steps": 2490, "total_steps": 20825, "loss": 1.0362, "learning_rate": 4.9306354935435594e-05, "epoch": 0.11956782713085234, "percentage": 11.96, "elapsed_time": "3:10:04", "remaining_time": "23:19:37", "throughput": 1788.57, "total_tokens": 20398080} -{"current_steps": 2500, "total_steps": 20825, "loss": 1.0075, "learning_rate": 4.929705704498969e-05, "epoch": 0.12004801920768307, "percentage": 12.0, "elapsed_time": "3:10:49", "remaining_time": "23:18:43", "throughput": 1788.76, "total_tokens": 20480000} -{"current_steps": 2510, "total_steps": 20825, "loss": 0.9074, "learning_rate": 4.928769814090371e-05, "epoch": 0.12052821128451381, "percentage": 12.05, "elapsed_time": "3:11:33", "remaining_time": "23:17:49", "throughput": 1788.93, "total_tokens": 20561920} -{"current_steps": 2520, "total_steps": 20825, "loss": 1.0916, "learning_rate": 4.927827824667929e-05, "epoch": 0.12100840336134454, "percentage": 12.1, "elapsed_time": "3:12:18", "remaining_time": "23:16:54", "throughput": 1789.13, "total_tokens": 20643840} -{"current_steps": 2530, "total_steps": 20825, "loss": 1.0548, "learning_rate": 4.926879738597122e-05, "epoch": 0.12148859543817526, "percentage": 12.15, "elapsed_time": "3:13:03", "remaining_time": "23:16:00", "throughput": 1789.3, "total_tokens": 20725760} -{"current_steps": 2540, "total_steps": 20825, "loss": 1.1967, "learning_rate": 4.925925558258741e-05, "epoch": 0.121968787515006, "percentage": 12.2, "elapsed_time": "3:13:48", "remaining_time": "23:15:09", "throughput": 1789.4, "total_tokens": 20807680} -{"current_steps": 2550, "total_steps": 20825, "loss": 0.9201, "learning_rate": 4.924965286048879e-05, "epoch": 0.12244897959183673, "percentage": 12.24, "elapsed_time": "3:14:33", "remaining_time": "23:14:16", "throughput": 1789.56, "total_tokens": 20889600} -{"current_steps": 2560, "total_steps": 20825, "loss": 1.0407, "learning_rate": 4.9239989243789275e-05, "epoch": 0.12292917166866747, "percentage": 12.29, "elapsed_time": "3:15:17", "remaining_time": "23:13:24", "throughput": 1789.7, "total_tokens": 20971520} -{"current_steps": 2570, "total_steps": 20825, "loss": 1.0231, "learning_rate": 4.9230264756755685e-05, "epoch": 0.1234093637454982, "percentage": 12.34, "elapsed_time": "3:16:02", "remaining_time": "23:12:31", "throughput": 1789.86, "total_tokens": 21053440} -{"current_steps": 2580, "total_steps": 20825, "loss": 0.9814, "learning_rate": 4.9220479423807694e-05, "epoch": 0.12388955582232893, "percentage": 12.39, "elapsed_time": "3:16:47", "remaining_time": "23:11:38", "throughput": 1790.0, "total_tokens": 21135360} -{"current_steps": 2590, "total_steps": 20825, "loss": 1.0074, "learning_rate": 4.9210633269517776e-05, "epoch": 0.12436974789915967, "percentage": 12.44, "elapsed_time": "3:17:32", "remaining_time": "23:10:44", "throughput": 1790.18, "total_tokens": 21217280} -{"current_steps": 2600, "total_steps": 20825, "loss": 0.9252, "learning_rate": 4.920072631861115e-05, "epoch": 0.12484993997599039, "percentage": 12.48, "elapsed_time": "3:18:16", "remaining_time": "23:09:51", "throughput": 1790.35, "total_tokens": 21299200} -{"current_steps": 2610, "total_steps": 20825, "loss": 1.1132, "learning_rate": 4.919075859596567e-05, "epoch": 0.12533013205282112, "percentage": 12.53, "elapsed_time": "3:19:01", "remaining_time": "23:08:57", "throughput": 1790.51, "total_tokens": 21381120} -{"current_steps": 2620, "total_steps": 20825, "loss": 1.1313, "learning_rate": 4.918073012661183e-05, "epoch": 0.12581032412965187, "percentage": 12.58, "elapsed_time": "3:19:45", "remaining_time": "23:08:04", "throughput": 1790.68, "total_tokens": 21463040} -{"current_steps": 2630, "total_steps": 20825, "loss": 1.0631, "learning_rate": 4.9170640935732654e-05, "epoch": 0.1262905162064826, "percentage": 12.63, "elapsed_time": "3:20:30", "remaining_time": "23:07:13", "throughput": 1790.79, "total_tokens": 21544960} -{"current_steps": 2640, "total_steps": 20825, "loss": 0.8485, "learning_rate": 4.916049104866365e-05, "epoch": 0.12677070828331333, "percentage": 12.68, "elapsed_time": "3:21:15", "remaining_time": "23:06:22", "throughput": 1790.91, "total_tokens": 21626880} -{"current_steps": 2650, "total_steps": 20825, "loss": 0.9922, "learning_rate": 4.915028049089274e-05, "epoch": 0.12725090036014405, "percentage": 12.73, "elapsed_time": "3:22:00", "remaining_time": "23:05:29", "throughput": 1791.06, "total_tokens": 21708800} -{"current_steps": 2660, "total_steps": 20825, "loss": 0.9331, "learning_rate": 4.914000928806021e-05, "epoch": 0.12773109243697478, "percentage": 12.77, "elapsed_time": "3:22:45", "remaining_time": "23:04:36", "throughput": 1791.22, "total_tokens": 21790720} -{"current_steps": 2670, "total_steps": 20825, "loss": 1.0793, "learning_rate": 4.912967746595861e-05, "epoch": 0.12821128451380553, "percentage": 12.82, "elapsed_time": "3:23:30", "remaining_time": "23:03:44", "throughput": 1791.34, "total_tokens": 21872640} -{"current_steps": 2680, "total_steps": 20825, "loss": 1.1306, "learning_rate": 4.911928505053275e-05, "epoch": 0.12869147659063626, "percentage": 12.87, "elapsed_time": "3:24:15", "remaining_time": "23:02:53", "throughput": 1791.45, "total_tokens": 21954560} -{"current_steps": 2690, "total_steps": 20825, "loss": 0.9962, "learning_rate": 4.9108832067879574e-05, "epoch": 0.129171668667467, "percentage": 12.92, "elapsed_time": "3:25:00", "remaining_time": "23:02:02", "throughput": 1791.58, "total_tokens": 22036480} -{"current_steps": 2700, "total_steps": 20825, "loss": 0.8064, "learning_rate": 4.909831854424812e-05, "epoch": 0.12965186074429771, "percentage": 12.97, "elapsed_time": "3:25:45", "remaining_time": "23:01:11", "throughput": 1791.69, "total_tokens": 22118400} -{"current_steps": 2710, "total_steps": 20825, "loss": 0.9561, "learning_rate": 4.908774450603946e-05, "epoch": 0.13013205282112844, "percentage": 13.01, "elapsed_time": "3:26:29", "remaining_time": "23:00:18", "throughput": 1791.84, "total_tokens": 22200320} -{"current_steps": 2720, "total_steps": 20825, "loss": 1.0554, "learning_rate": 4.907710997980664e-05, "epoch": 0.1306122448979592, "percentage": 13.06, "elapsed_time": "3:27:14", "remaining_time": "22:59:25", "throughput": 1792.0, "total_tokens": 22282240} -{"current_steps": 2730, "total_steps": 20825, "loss": 0.9203, "learning_rate": 4.906641499225457e-05, "epoch": 0.13109243697478992, "percentage": 13.11, "elapsed_time": "3:27:58", "remaining_time": "22:58:33", "throughput": 1792.15, "total_tokens": 22364160} -{"current_steps": 2740, "total_steps": 20825, "loss": 0.9199, "learning_rate": 4.905565957024003e-05, "epoch": 0.13157262905162065, "percentage": 13.16, "elapsed_time": "3:28:44", "remaining_time": "22:57:44", "throughput": 1792.22, "total_tokens": 22446080} -{"current_steps": 2750, "total_steps": 20825, "loss": 0.9683, "learning_rate": 4.9044843740771505e-05, "epoch": 0.13205282112845138, "percentage": 13.21, "elapsed_time": "3:29:28", "remaining_time": "22:56:50", "throughput": 1792.38, "total_tokens": 22528000} -{"current_steps": 2760, "total_steps": 20825, "loss": 1.1265, "learning_rate": 4.9033967531009225e-05, "epoch": 0.1325330132052821, "percentage": 13.25, "elapsed_time": "3:30:13", "remaining_time": "22:55:59", "throughput": 1792.5, "total_tokens": 22609920} -{"current_steps": 2770, "total_steps": 20825, "loss": 1.1676, "learning_rate": 4.902303096826502e-05, "epoch": 0.13301320528211286, "percentage": 13.3, "elapsed_time": "3:30:58", "remaining_time": "22:55:06", "throughput": 1792.65, "total_tokens": 22691840} -{"current_steps": 2780, "total_steps": 20825, "loss": 0.8947, "learning_rate": 4.901203408000227e-05, "epoch": 0.13349339735894358, "percentage": 13.35, "elapsed_time": "3:31:43", "remaining_time": "22:54:15", "throughput": 1792.78, "total_tokens": 22773760} -{"current_steps": 2790, "total_steps": 20825, "loss": 1.1018, "learning_rate": 4.9000976893835856e-05, "epoch": 0.1339735894357743, "percentage": 13.4, "elapsed_time": "3:32:27", "remaining_time": "22:53:21", "throughput": 1792.95, "total_tokens": 22855680} -{"current_steps": 2800, "total_steps": 20825, "loss": 0.9954, "learning_rate": 4.898985943753207e-05, "epoch": 0.13445378151260504, "percentage": 13.45, "elapsed_time": "3:33:12", "remaining_time": "22:52:32", "throughput": 1793.03, "total_tokens": 22937600} -{"current_steps": 2810, "total_steps": 20825, "loss": 0.7595, "learning_rate": 4.897868173900854e-05, "epoch": 0.13493397358943576, "percentage": 13.49, "elapsed_time": "3:33:57", "remaining_time": "22:51:39", "throughput": 1793.19, "total_tokens": 23019520} -{"current_steps": 2820, "total_steps": 20825, "loss": 1.0, "learning_rate": 4.89674438263342e-05, "epoch": 0.13541416566626652, "percentage": 13.54, "elapsed_time": "3:34:41", "remaining_time": "22:50:48", "throughput": 1793.32, "total_tokens": 23101440} -{"current_steps": 2830, "total_steps": 20825, "loss": 0.9093, "learning_rate": 4.8956145727729156e-05, "epoch": 0.13589435774309724, "percentage": 13.59, "elapsed_time": "3:35:26", "remaining_time": "22:49:55", "throughput": 1793.46, "total_tokens": 23183360} -{"current_steps": 2840, "total_steps": 20825, "loss": 0.8391, "learning_rate": 4.8944787471564686e-05, "epoch": 0.13637454981992797, "percentage": 13.64, "elapsed_time": "3:36:11", "remaining_time": "22:49:04", "throughput": 1793.59, "total_tokens": 23265280} -{"current_steps": 2850, "total_steps": 20825, "loss": 0.8903, "learning_rate": 4.89333690863631e-05, "epoch": 0.1368547418967587, "percentage": 13.69, "elapsed_time": "3:36:55", "remaining_time": "22:48:11", "throughput": 1793.74, "total_tokens": 23347200} -{"current_steps": 2860, "total_steps": 20825, "loss": 0.9087, "learning_rate": 4.892189060079773e-05, "epoch": 0.13733493397358942, "percentage": 13.73, "elapsed_time": "3:37:40", "remaining_time": "22:47:22", "throughput": 1793.83, "total_tokens": 23429120} -{"current_steps": 2870, "total_steps": 20825, "loss": 0.8255, "learning_rate": 4.8910352043692806e-05, "epoch": 0.13781512605042018, "percentage": 13.78, "elapsed_time": "3:38:26", "remaining_time": "22:46:34", "throughput": 1793.87, "total_tokens": 23511040} -{"current_steps": 2880, "total_steps": 20825, "loss": 0.9486, "learning_rate": 4.889875344402342e-05, "epoch": 0.1382953181272509, "percentage": 13.83, "elapsed_time": "3:39:10", "remaining_time": "22:45:41", "throughput": 1794.03, "total_tokens": 23592960} -{"current_steps": 2890, "total_steps": 20825, "loss": 1.0803, "learning_rate": 4.8887094830915427e-05, "epoch": 0.13877551020408163, "percentage": 13.88, "elapsed_time": "3:39:55", "remaining_time": "22:44:48", "throughput": 1794.18, "total_tokens": 23674880} -{"current_steps": 2900, "total_steps": 20825, "loss": 0.9572, "learning_rate": 4.8875376233645396e-05, "epoch": 0.13925570228091236, "percentage": 13.93, "elapsed_time": "3:40:39", "remaining_time": "22:43:55", "throughput": 1794.34, "total_tokens": 23756800} -{"current_steps": 2910, "total_steps": 20825, "loss": 0.9725, "learning_rate": 4.886359768164054e-05, "epoch": 0.13973589435774308, "percentage": 13.97, "elapsed_time": "3:41:24", "remaining_time": "22:43:04", "throughput": 1794.47, "total_tokens": 23838720} -{"current_steps": 2920, "total_steps": 20825, "loss": 0.9, "learning_rate": 4.88517592044786e-05, "epoch": 0.14021608643457384, "percentage": 14.02, "elapsed_time": "3:42:09", "remaining_time": "22:42:12", "throughput": 1794.6, "total_tokens": 23920640} -{"current_steps": 2930, "total_steps": 20825, "loss": 1.0477, "learning_rate": 4.8839860831887805e-05, "epoch": 0.14069627851140457, "percentage": 14.07, "elapsed_time": "3:42:54", "remaining_time": "22:41:22", "throughput": 1794.7, "total_tokens": 24002560} -{"current_steps": 2940, "total_steps": 20825, "loss": 0.8685, "learning_rate": 4.882790259374681e-05, "epoch": 0.1411764705882353, "percentage": 14.12, "elapsed_time": "3:43:38", "remaining_time": "22:40:30", "throughput": 1794.85, "total_tokens": 24084480} -{"current_steps": 2950, "total_steps": 20825, "loss": 0.9956, "learning_rate": 4.881588452008456e-05, "epoch": 0.14165666266506602, "percentage": 14.17, "elapsed_time": "3:44:23", "remaining_time": "22:39:39", "throughput": 1794.97, "total_tokens": 24166400} -{"current_steps": 2960, "total_steps": 20825, "loss": 1.0358, "learning_rate": 4.880380664108032e-05, "epoch": 0.14213685474189675, "percentage": 14.21, "elapsed_time": "3:45:08", "remaining_time": "22:38:47", "throughput": 1795.1, "total_tokens": 24248320} -{"current_steps": 2970, "total_steps": 20825, "loss": 0.8954, "learning_rate": 4.879166898706347e-05, "epoch": 0.1426170468187275, "percentage": 14.26, "elapsed_time": "3:45:52", "remaining_time": "22:37:55", "throughput": 1795.24, "total_tokens": 24330240} -{"current_steps": 2980, "total_steps": 20825, "loss": 0.9882, "learning_rate": 4.877947158851352e-05, "epoch": 0.14309723889555823, "percentage": 14.31, "elapsed_time": "3:46:37", "remaining_time": "22:37:05", "throughput": 1795.34, "total_tokens": 24412160} -{"current_steps": 2990, "total_steps": 20825, "loss": 0.8396, "learning_rate": 4.876721447606002e-05, "epoch": 0.14357743097238895, "percentage": 14.36, "elapsed_time": "3:47:22", "remaining_time": "22:36:13", "throughput": 1795.47, "total_tokens": 24494080} -{"current_steps": 3000, "total_steps": 20825, "loss": 1.0854, "learning_rate": 4.875489768048247e-05, "epoch": 0.14405762304921968, "percentage": 14.41, "elapsed_time": "3:48:06", "remaining_time": "22:35:21", "throughput": 1795.61, "total_tokens": 24576000} -{"current_steps": 3010, "total_steps": 20825, "loss": 0.9147, "learning_rate": 4.8742521232710234e-05, "epoch": 0.14453781512605043, "percentage": 14.45, "elapsed_time": "3:48:58", "remaining_time": "22:35:12", "throughput": 1794.8, "total_tokens": 24657920} -{"current_steps": 3020, "total_steps": 20825, "loss": 0.956, "learning_rate": 4.873008516382245e-05, "epoch": 0.14501800720288116, "percentage": 14.5, "elapsed_time": "3:49:43", "remaining_time": "22:34:22", "throughput": 1794.9, "total_tokens": 24739840} -{"current_steps": 3030, "total_steps": 20825, "loss": 0.9568, "learning_rate": 4.871758950504801e-05, "epoch": 0.1454981992797119, "percentage": 14.55, "elapsed_time": "3:50:27", "remaining_time": "22:33:30", "throughput": 1795.04, "total_tokens": 24821760} -{"current_steps": 3040, "total_steps": 20825, "loss": 0.95, "learning_rate": 4.870503428776544e-05, "epoch": 0.14597839135654261, "percentage": 14.6, "elapsed_time": "3:51:12", "remaining_time": "22:32:39", "throughput": 1795.16, "total_tokens": 24903680} -{"current_steps": 3050, "total_steps": 20825, "loss": 1.0183, "learning_rate": 4.869241954350281e-05, "epoch": 0.14645858343337334, "percentage": 14.65, "elapsed_time": "3:51:57", "remaining_time": "22:31:48", "throughput": 1795.29, "total_tokens": 24985600} -{"current_steps": 3060, "total_steps": 20825, "loss": 0.9581, "learning_rate": 4.867974530393767e-05, "epoch": 0.1469387755102041, "percentage": 14.69, "elapsed_time": "3:52:41", "remaining_time": "22:30:55", "throughput": 1795.44, "total_tokens": 25067520} -{"current_steps": 3070, "total_steps": 20825, "loss": 0.8628, "learning_rate": 4.8667011600896994e-05, "epoch": 0.14741896758703482, "percentage": 14.74, "elapsed_time": "3:53:26", "remaining_time": "22:30:04", "throughput": 1795.57, "total_tokens": 25149440} -{"current_steps": 3080, "total_steps": 20825, "loss": 0.8973, "learning_rate": 4.8654218466357064e-05, "epoch": 0.14789915966386555, "percentage": 14.79, "elapsed_time": "3:54:10", "remaining_time": "22:29:12", "throughput": 1795.7, "total_tokens": 25231360} -{"current_steps": 3090, "total_steps": 20825, "loss": 0.9561, "learning_rate": 4.86413659324434e-05, "epoch": 0.14837935174069627, "percentage": 14.84, "elapsed_time": "3:54:55", "remaining_time": "22:28:21", "throughput": 1795.83, "total_tokens": 25313280} -{"current_steps": 3100, "total_steps": 20825, "loss": 0.8549, "learning_rate": 4.8628454031430694e-05, "epoch": 0.148859543817527, "percentage": 14.89, "elapsed_time": "3:55:40", "remaining_time": "22:27:30", "throughput": 1795.96, "total_tokens": 25395200} -{"current_steps": 3110, "total_steps": 20825, "loss": 1.1022, "learning_rate": 4.8615482795742696e-05, "epoch": 0.14933973589435776, "percentage": 14.93, "elapsed_time": "3:56:24", "remaining_time": "22:26:39", "throughput": 1796.07, "total_tokens": 25477120} -{"current_steps": 3120, "total_steps": 20825, "loss": 1.108, "learning_rate": 4.860245225795219e-05, "epoch": 0.14981992797118848, "percentage": 14.98, "elapsed_time": "3:57:10", "remaining_time": "22:25:51", "throughput": 1796.12, "total_tokens": 25559040} -{"current_steps": 3130, "total_steps": 20825, "loss": 1.1467, "learning_rate": 4.858936245078084e-05, "epoch": 0.1503001200480192, "percentage": 15.03, "elapsed_time": "3:57:54", "remaining_time": "22:25:01", "throughput": 1796.22, "total_tokens": 25640960} -{"current_steps": 3140, "total_steps": 20825, "loss": 1.0484, "learning_rate": 4.857621340709917e-05, "epoch": 0.15078031212484994, "percentage": 15.08, "elapsed_time": "3:58:39", "remaining_time": "22:24:10", "throughput": 1796.34, "total_tokens": 25722880} -{"current_steps": 3150, "total_steps": 20825, "loss": 0.8896, "learning_rate": 4.856300515992646e-05, "epoch": 0.15126050420168066, "percentage": 15.13, "elapsed_time": "3:59:24", "remaining_time": "22:23:21", "throughput": 1796.42, "total_tokens": 25804800} -{"current_steps": 3160, "total_steps": 20825, "loss": 0.9816, "learning_rate": 4.854973774243062e-05, "epoch": 0.15174069627851142, "percentage": 15.17, "elapsed_time": "4:00:09", "remaining_time": "22:22:29", "throughput": 1796.54, "total_tokens": 25886720} -{"current_steps": 3170, "total_steps": 20825, "loss": 0.974, "learning_rate": 4.8536411187928186e-05, "epoch": 0.15222088835534214, "percentage": 15.22, "elapsed_time": "4:00:53", "remaining_time": "22:21:38", "throughput": 1796.68, "total_tokens": 25968640} -{"current_steps": 3180, "total_steps": 20825, "loss": 0.9798, "learning_rate": 4.852302552988418e-05, "epoch": 0.15270108043217287, "percentage": 15.27, "elapsed_time": "4:01:38", "remaining_time": "22:20:48", "throughput": 1796.77, "total_tokens": 26050560} -{"current_steps": 3190, "total_steps": 20825, "loss": 1.0298, "learning_rate": 4.850958080191205e-05, "epoch": 0.1531812725090036, "percentage": 15.32, "elapsed_time": "4:02:23", "remaining_time": "22:19:58", "throughput": 1796.88, "total_tokens": 26132480} -{"current_steps": 3200, "total_steps": 20825, "loss": 0.9407, "learning_rate": 4.849607703777356e-05, "epoch": 0.15366146458583432, "percentage": 15.37, "elapsed_time": "4:03:08", "remaining_time": "22:19:08", "throughput": 1796.98, "total_tokens": 26214400} -{"current_steps": 3210, "total_steps": 20825, "loss": 0.7755, "learning_rate": 4.8482514271378745e-05, "epoch": 0.15414165666266508, "percentage": 15.41, "elapsed_time": "4:03:52", "remaining_time": "22:18:16", "throughput": 1797.11, "total_tokens": 26296320} -{"current_steps": 3220, "total_steps": 20825, "loss": 0.8748, "learning_rate": 4.846889253678578e-05, "epoch": 0.1546218487394958, "percentage": 15.46, "elapsed_time": "4:04:37", "remaining_time": "22:17:27", "throughput": 1797.2, "total_tokens": 26378240} -{"current_steps": 3230, "total_steps": 20825, "loss": 0.9308, "learning_rate": 4.845521186820096e-05, "epoch": 0.15510204081632653, "percentage": 15.51, "elapsed_time": "4:05:21", "remaining_time": "22:16:35", "throughput": 1797.33, "total_tokens": 26460160} -{"current_steps": 3240, "total_steps": 20825, "loss": 0.9556, "learning_rate": 4.8441472299978504e-05, "epoch": 0.15558223289315726, "percentage": 15.56, "elapsed_time": "4:06:06", "remaining_time": "22:15:46", "throughput": 1797.41, "total_tokens": 26542080} -{"current_steps": 3250, "total_steps": 20825, "loss": 0.9465, "learning_rate": 4.8427673866620615e-05, "epoch": 0.15606242496998798, "percentage": 15.61, "elapsed_time": "4:07:03", "remaining_time": "22:16:02", "throughput": 1796.03, "total_tokens": 26624000} -{"current_steps": 3260, "total_steps": 20825, "loss": 0.8611, "learning_rate": 4.841381660277725e-05, "epoch": 0.15654261704681874, "percentage": 15.65, "elapsed_time": "4:07:51", "remaining_time": "22:15:26", "throughput": 1795.82, "total_tokens": 26705920} -{"current_steps": 3270, "total_steps": 20825, "loss": 0.9294, "learning_rate": 4.839990054324614e-05, "epoch": 0.15702280912364946, "percentage": 15.7, "elapsed_time": "4:08:41", "remaining_time": "22:15:05", "throughput": 1795.26, "total_tokens": 26787840} -{"current_steps": 3280, "total_steps": 20825, "loss": 1.0522, "learning_rate": 4.838592572297265e-05, "epoch": 0.1575030012004802, "percentage": 15.75, "elapsed_time": "4:09:41", "remaining_time": "22:15:39", "throughput": 1793.47, "total_tokens": 26869760} -{"current_steps": 3290, "total_steps": 20825, "loss": 0.9068, "learning_rate": 4.837189217704968e-05, "epoch": 0.15798319327731092, "percentage": 15.8, "elapsed_time": "4:10:37", "remaining_time": "22:15:47", "throughput": 1792.27, "total_tokens": 26951680} -{"current_steps": 3300, "total_steps": 20825, "loss": 0.8502, "learning_rate": 4.835779994071764e-05, "epoch": 0.15846338535414164, "percentage": 15.85, "elapsed_time": "4:11:26", "remaining_time": "22:15:17", "throughput": 1791.94, "total_tokens": 27033600} -{"current_steps": 3310, "total_steps": 20825, "loss": 0.9537, "learning_rate": 4.8343649049364284e-05, "epoch": 0.1589435774309724, "percentage": 15.89, "elapsed_time": "4:12:13", "remaining_time": "22:14:37", "throughput": 1791.81, "total_tokens": 27115520} -{"current_steps": 3320, "total_steps": 20825, "loss": 0.9564, "learning_rate": 4.832943953852468e-05, "epoch": 0.15942376950780313, "percentage": 15.94, "elapsed_time": "4:12:59", "remaining_time": "22:13:54", "throughput": 1791.74, "total_tokens": 27197440} -{"current_steps": 3330, "total_steps": 20825, "loss": 0.8895, "learning_rate": 4.831517144388109e-05, "epoch": 0.15990396158463385, "percentage": 15.99, "elapsed_time": "4:13:45", "remaining_time": "22:13:12", "throughput": 1791.65, "total_tokens": 27279360} -{"current_steps": 3340, "total_steps": 20825, "loss": 0.765, "learning_rate": 4.830084480126288e-05, "epoch": 0.16038415366146458, "percentage": 16.04, "elapsed_time": "4:14:32", "remaining_time": "22:12:31", "throughput": 1791.56, "total_tokens": 27361280} -{"current_steps": 3350, "total_steps": 20825, "loss": 0.9538, "learning_rate": 4.828645964664647e-05, "epoch": 0.1608643457382953, "percentage": 16.09, "elapsed_time": "4:15:19", "remaining_time": "22:11:51", "throughput": 1791.43, "total_tokens": 27443200} -{"current_steps": 3360, "total_steps": 20825, "loss": 1.0036, "learning_rate": 4.8272016016155166e-05, "epoch": 0.16134453781512606, "percentage": 16.13, "elapsed_time": "4:16:05", "remaining_time": "22:11:10", "throughput": 1791.31, "total_tokens": 27525120} -{"current_steps": 3370, "total_steps": 20825, "loss": 1.1447, "learning_rate": 4.825751394605916e-05, "epoch": 0.1618247298919568, "percentage": 16.18, "elapsed_time": "4:16:52", "remaining_time": "22:10:28", "throughput": 1791.22, "total_tokens": 27607040} -{"current_steps": 3380, "total_steps": 20825, "loss": 0.8392, "learning_rate": 4.824295347277537e-05, "epoch": 0.1623049219687875, "percentage": 16.23, "elapsed_time": "4:17:39", "remaining_time": "22:09:47", "throughput": 1791.12, "total_tokens": 27688960} -{"current_steps": 3390, "total_steps": 20825, "loss": 1.1125, "learning_rate": 4.8228334632867375e-05, "epoch": 0.16278511404561824, "percentage": 16.28, "elapsed_time": "4:18:26", "remaining_time": "22:09:08", "throughput": 1790.97, "total_tokens": 27770880} -{"current_steps": 3400, "total_steps": 20825, "loss": 1.059, "learning_rate": 4.8213657463045344e-05, "epoch": 0.16326530612244897, "percentage": 16.33, "elapsed_time": "4:19:12", "remaining_time": "22:08:27", "throughput": 1790.87, "total_tokens": 27852800} -{"current_steps": 3410, "total_steps": 20825, "loss": 1.0134, "learning_rate": 4.819892200016588e-05, "epoch": 0.16374549819927972, "percentage": 16.37, "elapsed_time": "4:19:58", "remaining_time": "22:07:44", "throughput": 1790.8, "total_tokens": 27934720} -{"current_steps": 3420, "total_steps": 20825, "loss": 0.8942, "learning_rate": 4.818412828123201e-05, "epoch": 0.16422569027611045, "percentage": 16.42, "elapsed_time": "4:20:45", "remaining_time": "22:07:03", "throughput": 1790.71, "total_tokens": 28016640} -{"current_steps": 3430, "total_steps": 20825, "loss": 0.8664, "learning_rate": 4.816927634339302e-05, "epoch": 0.16470588235294117, "percentage": 16.47, "elapsed_time": "4:21:32", "remaining_time": "22:06:21", "throughput": 1790.61, "total_tokens": 28098560} -{"current_steps": 3440, "total_steps": 20825, "loss": 0.7622, "learning_rate": 4.815436622394441e-05, "epoch": 0.1651860744297719, "percentage": 16.52, "elapsed_time": "4:22:18", "remaining_time": "22:05:39", "throughput": 1790.54, "total_tokens": 28180480} -{"current_steps": 3450, "total_steps": 20825, "loss": 1.0249, "learning_rate": 4.813939796032779e-05, "epoch": 0.16566626650660263, "percentage": 16.57, "elapsed_time": "4:23:05", "remaining_time": "22:04:58", "throughput": 1790.43, "total_tokens": 28262400} -{"current_steps": 3460, "total_steps": 20825, "loss": 0.9852, "learning_rate": 4.812437159013076e-05, "epoch": 0.16614645858343338, "percentage": 16.61, "elapsed_time": "4:23:51", "remaining_time": "22:04:16", "throughput": 1790.34, "total_tokens": 28344320} -{"current_steps": 3470, "total_steps": 20825, "loss": 0.8945, "learning_rate": 4.810928715108683e-05, "epoch": 0.1666266506602641, "percentage": 16.66, "elapsed_time": "4:24:38", "remaining_time": "22:03:34", "throughput": 1790.26, "total_tokens": 28426240} -{"current_steps": 3480, "total_steps": 20825, "loss": 0.8606, "learning_rate": 4.809414468107536e-05, "epoch": 0.16710684273709484, "percentage": 16.71, "elapsed_time": "4:25:24", "remaining_time": "22:02:51", "throughput": 1790.19, "total_tokens": 28508160} -{"current_steps": 3490, "total_steps": 20825, "loss": 0.7668, "learning_rate": 4.8078944218121404e-05, "epoch": 0.16758703481392556, "percentage": 16.76, "elapsed_time": "4:26:11", "remaining_time": "22:02:09", "throughput": 1790.11, "total_tokens": 28590080} -{"current_steps": 3500, "total_steps": 20825, "loss": 1.1072, "learning_rate": 4.806368580039566e-05, "epoch": 0.16806722689075632, "percentage": 16.81, "elapsed_time": "4:26:57", "remaining_time": "22:01:26", "throughput": 1790.04, "total_tokens": 28672000} -{"current_steps": 3510, "total_steps": 20825, "loss": 0.7905, "learning_rate": 4.804836946621437e-05, "epoch": 0.16854741896758704, "percentage": 16.85, "elapsed_time": "4:27:44", "remaining_time": "22:00:45", "throughput": 1789.94, "total_tokens": 28753920} -{"current_steps": 3520, "total_steps": 20825, "loss": 0.9979, "learning_rate": 4.803299525403919e-05, "epoch": 0.16902761104441777, "percentage": 16.9, "elapsed_time": "4:28:31", "remaining_time": "22:00:08", "throughput": 1789.75, "total_tokens": 28835840} -{"current_steps": 3530, "total_steps": 20825, "loss": 1.1211, "learning_rate": 4.801756320247713e-05, "epoch": 0.1695078031212485, "percentage": 16.95, "elapsed_time": "4:29:18", "remaining_time": "21:59:28", "throughput": 1789.61, "total_tokens": 28917760} -{"current_steps": 3540, "total_steps": 20825, "loss": 0.9346, "learning_rate": 4.800207335028044e-05, "epoch": 0.16998799519807922, "percentage": 17.0, "elapsed_time": "4:30:06", "remaining_time": "21:58:54", "throughput": 1789.34, "total_tokens": 28999680} -{"current_steps": 3550, "total_steps": 20825, "loss": 0.8605, "learning_rate": 4.798652573634651e-05, "epoch": 0.17046818727490998, "percentage": 17.05, "elapsed_time": "4:31:58", "remaining_time": "22:03:29", "throughput": 1782.12, "total_tokens": 29081600} -{"current_steps": 3560, "total_steps": 20825, "loss": 0.631, "learning_rate": 4.797092039971779e-05, "epoch": 0.1709483793517407, "percentage": 17.09, "elapsed_time": "4:33:11", "remaining_time": "22:04:55", "throughput": 1779.15, "total_tokens": 29163520} -{"current_steps": 3570, "total_steps": 20825, "loss": 0.8789, "learning_rate": 4.7955257379581675e-05, "epoch": 0.17142857142857143, "percentage": 17.14, "elapsed_time": "4:34:00", "remaining_time": "22:04:20", "throughput": 1778.91, "total_tokens": 29245440} -{"current_steps": 3580, "total_steps": 20825, "loss": 1.2783, "learning_rate": 4.7939536715270415e-05, "epoch": 0.17190876350540216, "percentage": 17.19, "elapsed_time": "4:35:14", "remaining_time": "22:05:50", "throughput": 1775.86, "total_tokens": 29327360} -{"current_steps": 3590, "total_steps": 20825, "loss": 0.7012, "learning_rate": 4.792375844626101e-05, "epoch": 0.17238895558223288, "percentage": 17.24, "elapsed_time": "4:37:52", "remaining_time": "22:14:01", "throughput": 1763.94, "total_tokens": 29409280} -{"current_steps": 3600, "total_steps": 20825, "loss": 0.976, "learning_rate": 4.790792261217512e-05, "epoch": 0.17286914765906364, "percentage": 17.29, "elapsed_time": "4:38:56", "remaining_time": "22:14:38", "throughput": 1762.1, "total_tokens": 29491200} -{"current_steps": 3610, "total_steps": 20825, "loss": 0.9292, "learning_rate": 4.789202925277895e-05, "epoch": 0.17334933973589436, "percentage": 17.33, "elapsed_time": "4:39:51", "remaining_time": "22:14:32", "throughput": 1761.23, "total_tokens": 29573120} -{"current_steps": 3620, "total_steps": 20825, "loss": 0.8974, "learning_rate": 4.787607840798317e-05, "epoch": 0.1738295318127251, "percentage": 17.38, "elapsed_time": "4:40:40", "remaining_time": "22:13:59", "throughput": 1760.92, "total_tokens": 29655040} -{"current_steps": 3630, "total_steps": 20825, "loss": 0.9049, "learning_rate": 4.786007011784279e-05, "epoch": 0.17430972388955582, "percentage": 17.43, "elapsed_time": "4:41:29", "remaining_time": "22:13:24", "throughput": 1760.66, "total_tokens": 29736960} -{"current_steps": 3640, "total_steps": 20825, "loss": 0.8813, "learning_rate": 4.78440044225571e-05, "epoch": 0.17478991596638654, "percentage": 17.48, "elapsed_time": "4:42:18", "remaining_time": "22:12:49", "throughput": 1760.42, "total_tokens": 29818880} -{"current_steps": 3650, "total_steps": 20825, "loss": 0.7923, "learning_rate": 4.7827881362469506e-05, "epoch": 0.1752701080432173, "percentage": 17.53, "elapsed_time": "4:43:08", "remaining_time": "22:12:21", "throughput": 1760.01, "total_tokens": 29900800} -{"current_steps": 3660, "total_steps": 20825, "loss": 0.9563, "learning_rate": 4.781170097806751e-05, "epoch": 0.17575030012004803, "percentage": 17.58, "elapsed_time": "4:45:21", "remaining_time": "22:18:16", "throughput": 1751.21, "total_tokens": 29982720} -{"current_steps": 3670, "total_steps": 20825, "loss": 0.9327, "learning_rate": 4.779546330998253e-05, "epoch": 0.17623049219687875, "percentage": 17.62, "elapsed_time": "4:46:12", "remaining_time": "22:17:48", "throughput": 1750.79, "total_tokens": 30064640} -{"current_steps": 3680, "total_steps": 20825, "loss": 1.2167, "learning_rate": 4.7779168398989826e-05, "epoch": 0.17671068427370948, "percentage": 17.67, "elapsed_time": "4:47:03", "remaining_time": "22:17:23", "throughput": 1750.31, "total_tokens": 30146560} -{"current_steps": 3690, "total_steps": 20825, "loss": 0.9795, "learning_rate": 4.7762816286008454e-05, "epoch": 0.1771908763505402, "percentage": 17.72, "elapsed_time": "4:47:55", "remaining_time": "22:16:59", "throughput": 1749.81, "total_tokens": 30228480} -{"current_steps": 3700, "total_steps": 20825, "loss": 1.108, "learning_rate": 4.774640701210106e-05, "epoch": 0.17767106842737096, "percentage": 17.77, "elapsed_time": "4:48:46", "remaining_time": "22:16:35", "throughput": 1749.32, "total_tokens": 30310400} -{"current_steps": 3710, "total_steps": 20825, "loss": 1.0156, "learning_rate": 4.7729940618473854e-05, "epoch": 0.1781512605042017, "percentage": 17.82, "elapsed_time": "4:49:38", "remaining_time": "22:16:09", "throughput": 1748.88, "total_tokens": 30392320} -{"current_steps": 3720, "total_steps": 20825, "loss": 0.9543, "learning_rate": 4.771341714647648e-05, "epoch": 0.1786314525810324, "percentage": 17.86, "elapsed_time": "4:50:28", "remaining_time": "22:15:36", "throughput": 1748.57, "total_tokens": 30474240} -{"current_steps": 3730, "total_steps": 20825, "loss": 0.875, "learning_rate": 4.76968366376019e-05, "epoch": 0.17911164465786314, "percentage": 17.91, "elapsed_time": "4:51:17", "remaining_time": "22:14:59", "throughput": 1748.34, "total_tokens": 30556160} -{"current_steps": 3740, "total_steps": 20825, "loss": 0.9798, "learning_rate": 4.768019913348634e-05, "epoch": 0.17959183673469387, "percentage": 17.96, "elapsed_time": "4:52:05", "remaining_time": "22:14:20", "throughput": 1748.18, "total_tokens": 30638080} -{"current_steps": 3750, "total_steps": 20825, "loss": 0.8985, "learning_rate": 4.766350467590911e-05, "epoch": 0.18007202881152462, "percentage": 18.01, "elapsed_time": "4:52:54", "remaining_time": "22:13:41", "throughput": 1748.02, "total_tokens": 30720000} -{"current_steps": 3760, "total_steps": 20825, "loss": 0.9849, "learning_rate": 4.764675330679256e-05, "epoch": 0.18055222088835535, "percentage": 18.06, "elapsed_time": "4:53:42", "remaining_time": "22:13:02", "throughput": 1747.83, "total_tokens": 30801920} -{"current_steps": 3770, "total_steps": 20825, "loss": 0.9484, "learning_rate": 4.7629945068201954e-05, "epoch": 0.18103241296518607, "percentage": 18.1, "elapsed_time": "4:54:32", "remaining_time": "22:12:30", "throughput": 1747.52, "total_tokens": 30883840} -{"current_steps": 3780, "total_steps": 20825, "loss": 0.8183, "learning_rate": 4.7613080002345345e-05, "epoch": 0.1815126050420168, "percentage": 18.15, "elapsed_time": "4:55:22", "remaining_time": "22:11:55", "throughput": 1747.25, "total_tokens": 30965760} -{"current_steps": 3790, "total_steps": 20825, "loss": 1.0653, "learning_rate": 4.759615815157352e-05, "epoch": 0.18199279711884753, "percentage": 18.2, "elapsed_time": "4:56:12", "remaining_time": "22:11:23", "throughput": 1746.93, "total_tokens": 31047680} -{"current_steps": 3800, "total_steps": 20825, "loss": 0.8532, "learning_rate": 4.7579179558379836e-05, "epoch": 0.18247298919567828, "percentage": 18.25, "elapsed_time": "4:58:18", "remaining_time": "22:16:28", "throughput": 1739.25, "total_tokens": 31129600} -{"current_steps": 3810, "total_steps": 20825, "loss": 0.7594, "learning_rate": 4.7562144265400146e-05, "epoch": 0.182953181272509, "percentage": 18.3, "elapsed_time": "4:59:25", "remaining_time": "22:17:12", "throughput": 1737.29, "total_tokens": 31211520} -{"current_steps": 3820, "total_steps": 20825, "loss": 1.0458, "learning_rate": 4.754505231541268e-05, "epoch": 0.18343337334933973, "percentage": 18.34, "elapsed_time": "5:00:13", "remaining_time": "22:16:29", "throughput": 1737.2, "total_tokens": 31293440} -{"current_steps": 3830, "total_steps": 20825, "loss": 0.8403, "learning_rate": 4.752790375133797e-05, "epoch": 0.18391356542617046, "percentage": 18.39, "elapsed_time": "5:01:02", "remaining_time": "22:15:49", "throughput": 1737.05, "total_tokens": 31375360} -{"current_steps": 3840, "total_steps": 20825, "loss": 0.9284, "learning_rate": 4.751069861623867e-05, "epoch": 0.1843937575030012, "percentage": 18.44, "elapsed_time": "5:01:58", "remaining_time": "22:15:40", "throughput": 1736.2, "total_tokens": 31457280} -{"current_steps": 3850, "total_steps": 20825, "loss": 1.0164, "learning_rate": 4.749343695331952e-05, "epoch": 0.18487394957983194, "percentage": 18.49, "elapsed_time": "5:03:26", "remaining_time": "22:17:53", "throughput": 1732.32, "total_tokens": 31539200} -{"current_steps": 3860, "total_steps": 20825, "loss": 0.8328, "learning_rate": 4.747611880592721e-05, "epoch": 0.18535414165666267, "percentage": 18.54, "elapsed_time": "5:04:25", "remaining_time": "22:17:56", "throughput": 1731.23, "total_tokens": 31621120} -{"current_steps": 3870, "total_steps": 20825, "loss": 1.0115, "learning_rate": 4.745874421755027e-05, "epoch": 0.1858343337334934, "percentage": 18.58, "elapsed_time": "5:05:12", "remaining_time": "22:17:08", "throughput": 1731.26, "total_tokens": 31703040} -{"current_steps": 3880, "total_steps": 20825, "loss": 0.8417, "learning_rate": 4.744131323181895e-05, "epoch": 0.18631452581032412, "percentage": 18.63, "elapsed_time": "5:06:00", "remaining_time": "22:16:27", "throughput": 1731.12, "total_tokens": 31784960} -{"current_steps": 3890, "total_steps": 20825, "loss": 0.9902, "learning_rate": 4.742382589250514e-05, "epoch": 0.18679471788715485, "percentage": 18.68, "elapsed_time": "5:06:55", "remaining_time": "22:16:11", "throughput": 1730.44, "total_tokens": 31866880} -{"current_steps": 3900, "total_steps": 20825, "loss": 1.0409, "learning_rate": 4.740628224352222e-05, "epoch": 0.1872749099639856, "percentage": 18.73, "elapsed_time": "5:07:50", "remaining_time": "22:15:55", "throughput": 1729.77, "total_tokens": 31948800} -{"current_steps": 3910, "total_steps": 20825, "loss": 0.9343, "learning_rate": 4.7388682328925e-05, "epoch": 0.18775510204081633, "percentage": 18.78, "elapsed_time": "5:08:44", "remaining_time": "22:15:37", "throughput": 1729.12, "total_tokens": 32030720} -{"current_steps": 3920, "total_steps": 20825, "loss": 0.9198, "learning_rate": 4.737102619290956e-05, "epoch": 0.18823529411764706, "percentage": 18.82, "elapsed_time": "5:09:36", "remaining_time": "22:15:12", "throughput": 1728.64, "total_tokens": 32112640} -{"current_steps": 3930, "total_steps": 20825, "loss": 0.9707, "learning_rate": 4.7353313879813165e-05, "epoch": 0.18871548619447778, "percentage": 18.87, "elapsed_time": "5:10:27", "remaining_time": "22:14:37", "throughput": 1728.36, "total_tokens": 32194560} -{"current_steps": 3940, "total_steps": 20825, "loss": 1.0691, "learning_rate": 4.733554543411417e-05, "epoch": 0.18919567827130854, "percentage": 18.92, "elapsed_time": "5:11:17", "remaining_time": "22:14:02", "throughput": 1728.11, "total_tokens": 32276480} -{"current_steps": 3950, "total_steps": 20825, "loss": 0.9361, "learning_rate": 4.731772090043184e-05, "epoch": 0.18967587034813926, "percentage": 18.97, "elapsed_time": "5:12:07", "remaining_time": "22:13:27", "throughput": 1727.84, "total_tokens": 32358400} -{"current_steps": 3960, "total_steps": 20825, "loss": 0.8927, "learning_rate": 4.729984032352635e-05, "epoch": 0.19015606242497, "percentage": 19.02, "elapsed_time": "5:12:59", "remaining_time": "22:12:58", "throughput": 1727.44, "total_tokens": 32440320} -{"current_steps": 3970, "total_steps": 20825, "loss": 0.9308, "learning_rate": 4.728190374829854e-05, "epoch": 0.19063625450180072, "percentage": 19.06, "elapsed_time": "5:13:49", "remaining_time": "22:12:24", "throughput": 1727.15, "total_tokens": 32522240} -{"current_steps": 3980, "total_steps": 20825, "loss": 0.9229, "learning_rate": 4.726391121978992e-05, "epoch": 0.19111644657863144, "percentage": 19.11, "elapsed_time": "5:14:40", "remaining_time": "22:11:51", "throughput": 1726.84, "total_tokens": 32604160} -{"current_steps": 3990, "total_steps": 20825, "loss": 0.9033, "learning_rate": 4.7245862783182496e-05, "epoch": 0.1915966386554622, "percentage": 19.16, "elapsed_time": "5:15:52", "remaining_time": "22:12:44", "throughput": 1724.66, "total_tokens": 32686080} -{"current_steps": 4000, "total_steps": 20825, "loss": 1.0315, "learning_rate": 4.722775848379866e-05, "epoch": 0.19207683073229292, "percentage": 19.21, "elapsed_time": "5:17:28", "remaining_time": "22:15:21", "throughput": 1720.28, "total_tokens": 32768000} -{"current_steps": 4010, "total_steps": 20825, "loss": 0.8195, "learning_rate": 4.720959836710107e-05, "epoch": 0.19255702280912365, "percentage": 19.26, "elapsed_time": "5:18:45", "remaining_time": "22:16:40", "throughput": 1717.56, "total_tokens": 32849920} -{"current_steps": 4020, "total_steps": 20825, "loss": 0.9489, "learning_rate": 4.7191382478692594e-05, "epoch": 0.19303721488595438, "percentage": 19.3, "elapsed_time": "5:19:51", "remaining_time": "22:17:05", "throughput": 1716.0, "total_tokens": 32931840} -{"current_steps": 4030, "total_steps": 20825, "loss": 0.814, "learning_rate": 4.7173110864316104e-05, "epoch": 0.1935174069627851, "percentage": 19.35, "elapsed_time": "5:20:55", "remaining_time": "22:17:27", "throughput": 1714.51, "total_tokens": 33013760} -{"current_steps": 4040, "total_steps": 20825, "loss": 0.811, "learning_rate": 4.7154783569854444e-05, "epoch": 0.19399759903961586, "percentage": 19.4, "elapsed_time": "5:22:00", "remaining_time": "22:17:51", "throughput": 1712.98, "total_tokens": 33095680} -{"current_steps": 4050, "total_steps": 20825, "loss": 0.9777, "learning_rate": 4.713640064133025e-05, "epoch": 0.19447779111644659, "percentage": 19.45, "elapsed_time": "5:23:00", "remaining_time": "22:17:54", "throughput": 1711.89, "total_tokens": 33177600} -{"current_steps": 4060, "total_steps": 20825, "loss": 0.8785, "learning_rate": 4.7117962124905885e-05, "epoch": 0.1949579831932773, "percentage": 19.5, "elapsed_time": "5:23:50", "remaining_time": "22:17:16", "throughput": 1711.68, "total_tokens": 33259520} -{"current_steps": 4070, "total_steps": 20825, "loss": 0.9837, "learning_rate": 4.709946806688329e-05, "epoch": 0.19543817527010804, "percentage": 19.54, "elapsed_time": "5:24:41", "remaining_time": "22:16:37", "throughput": 1711.48, "total_tokens": 33341440} -{"current_steps": 4080, "total_steps": 20825, "loss": 0.8769, "learning_rate": 4.708091851370389e-05, "epoch": 0.19591836734693877, "percentage": 19.59, "elapsed_time": "5:25:37", "remaining_time": "22:16:25", "throughput": 1710.72, "total_tokens": 33423360} -{"current_steps": 4090, "total_steps": 20825, "loss": 0.9604, "learning_rate": 4.706231351194845e-05, "epoch": 0.19639855942376952, "percentage": 19.64, "elapsed_time": "5:26:29", "remaining_time": "22:15:52", "throughput": 1710.4, "total_tokens": 33505280} -{"current_steps": 4100, "total_steps": 20825, "loss": 0.8028, "learning_rate": 4.7043653108336994e-05, "epoch": 0.19687875150060025, "percentage": 19.69, "elapsed_time": "5:27:33", "remaining_time": "22:16:09", "throughput": 1709.01, "total_tokens": 33587200} -{"current_steps": 4110, "total_steps": 20825, "loss": 0.9994, "learning_rate": 4.702493734972866e-05, "epoch": 0.19735894357743097, "percentage": 19.74, "elapsed_time": "5:28:56", "remaining_time": "22:17:47", "throughput": 1705.91, "total_tokens": 33669120} -{"current_steps": 4120, "total_steps": 20825, "loss": 1.0073, "learning_rate": 4.700616628312158e-05, "epoch": 0.1978391356542617, "percentage": 19.78, "elapsed_time": "5:29:47", "remaining_time": "22:17:08", "throughput": 1705.72, "total_tokens": 33751040} -{"current_steps": 4130, "total_steps": 20825, "loss": 0.8428, "learning_rate": 4.69873399556528e-05, "epoch": 0.19831932773109243, "percentage": 19.83, "elapsed_time": "5:30:39", "remaining_time": "22:16:37", "throughput": 1705.35, "total_tokens": 33832960} -{"current_steps": 4140, "total_steps": 20825, "loss": 1.0941, "learning_rate": 4.696845841459811e-05, "epoch": 0.19879951980792318, "percentage": 19.88, "elapsed_time": "5:31:33", "remaining_time": "22:16:13", "throughput": 1704.86, "total_tokens": 33914880} -{"current_steps": 4150, "total_steps": 20825, "loss": 0.8673, "learning_rate": 4.6949521707371965e-05, "epoch": 0.1992797118847539, "percentage": 19.93, "elapsed_time": "5:32:29", "remaining_time": "22:15:56", "throughput": 1704.18, "total_tokens": 33996800} -{"current_steps": 4160, "total_steps": 20825, "loss": 0.8488, "learning_rate": 4.693052988152733e-05, "epoch": 0.19975990396158463, "percentage": 19.98, "elapsed_time": "5:33:26", "remaining_time": "22:15:46", "throughput": 1703.39, "total_tokens": 34078720} -{"current_steps": 4170, "total_steps": 20825, "loss": 1.0891, "learning_rate": 4.691148298475561e-05, "epoch": 0.20024009603841536, "percentage": 20.02, "elapsed_time": "5:34:22", "remaining_time": "22:15:29", "throughput": 1702.72, "total_tokens": 34160640} -{"current_steps": 4180, "total_steps": 20825, "loss": 0.904, "learning_rate": 4.689238106488647e-05, "epoch": 0.2007202881152461, "percentage": 20.07, "elapsed_time": "5:35:17", "remaining_time": "22:15:09", "throughput": 1702.12, "total_tokens": 34242560} -{"current_steps": 4190, "total_steps": 20825, "loss": 0.8948, "learning_rate": 4.687322416988779e-05, "epoch": 0.20120048019207684, "percentage": 20.12, "elapsed_time": "5:36:11", "remaining_time": "22:14:42", "throughput": 1701.67, "total_tokens": 34324480} -{"current_steps": 4200, "total_steps": 20825, "loss": 0.9203, "learning_rate": 4.685401234786544e-05, "epoch": 0.20168067226890757, "percentage": 20.17, "elapsed_time": "5:37:04", "remaining_time": "22:14:14", "throughput": 1701.24, "total_tokens": 34406400} -{"current_steps": 4210, "total_steps": 20825, "loss": 0.9092, "learning_rate": 4.683474564706327e-05, "epoch": 0.2021608643457383, "percentage": 20.22, "elapsed_time": "5:37:57", "remaining_time": "22:13:46", "throughput": 1700.8, "total_tokens": 34488320} -{"current_steps": 4220, "total_steps": 20825, "loss": 0.8973, "learning_rate": 4.681542411586294e-05, "epoch": 0.20264105642256902, "percentage": 20.26, "elapsed_time": "5:38:50", "remaining_time": "22:13:18", "throughput": 1700.38, "total_tokens": 34570240} -{"current_steps": 4230, "total_steps": 20825, "loss": 1.046, "learning_rate": 4.6796047802783755e-05, "epoch": 0.20312124849939975, "percentage": 20.31, "elapsed_time": "5:39:44", "remaining_time": "22:12:50", "throughput": 1699.96, "total_tokens": 34652160} -{"current_steps": 4240, "total_steps": 20825, "loss": 0.8767, "learning_rate": 4.6776616756482624e-05, "epoch": 0.2036014405762305, "percentage": 20.36, "elapsed_time": "5:40:37", "remaining_time": "22:12:23", "throughput": 1699.51, "total_tokens": 34734080} -{"current_steps": 4250, "total_steps": 20825, "loss": 0.849, "learning_rate": 4.6757131025753886e-05, "epoch": 0.20408163265306123, "percentage": 20.41, "elapsed_time": "5:41:31", "remaining_time": "22:11:54", "throughput": 1699.09, "total_tokens": 34816000} -{"current_steps": 4260, "total_steps": 20825, "loss": 1.1241, "learning_rate": 4.67375906595292e-05, "epoch": 0.20456182472989196, "percentage": 20.46, "elapsed_time": "5:42:24", "remaining_time": "22:11:26", "throughput": 1698.67, "total_tokens": 34897920} -{"current_steps": 4270, "total_steps": 20825, "loss": 1.1088, "learning_rate": 4.671799570687743e-05, "epoch": 0.20504201680672268, "percentage": 20.5, "elapsed_time": "5:43:17", "remaining_time": "22:10:59", "throughput": 1698.22, "total_tokens": 34979840} -{"current_steps": 4280, "total_steps": 20825, "loss": 0.9175, "learning_rate": 4.6698346217004494e-05, "epoch": 0.2055222088835534, "percentage": 20.55, "elapsed_time": "5:44:10", "remaining_time": "22:10:29", "throughput": 1697.83, "total_tokens": 35061760} -{"current_steps": 4290, "total_steps": 20825, "loss": 1.146, "learning_rate": 4.66786422392533e-05, "epoch": 0.20600240096038416, "percentage": 20.6, "elapsed_time": "5:45:04", "remaining_time": "22:10:00", "throughput": 1697.41, "total_tokens": 35143680} -{"current_steps": 4300, "total_steps": 20825, "loss": 0.9771, "learning_rate": 4.665888382310356e-05, "epoch": 0.2064825930372149, "percentage": 20.65, "elapsed_time": "5:45:57", "remaining_time": "22:09:31", "throughput": 1697.01, "total_tokens": 35225600} -{"current_steps": 4310, "total_steps": 20825, "loss": 0.9299, "learning_rate": 4.663907101817167e-05, "epoch": 0.20696278511404562, "percentage": 20.7, "elapsed_time": "5:46:50", "remaining_time": "22:09:02", "throughput": 1696.59, "total_tokens": 35307520} -{"current_steps": 4320, "total_steps": 20825, "loss": 1.0124, "learning_rate": 4.661920387421064e-05, "epoch": 0.20744297719087634, "percentage": 20.74, "elapsed_time": "5:47:44", "remaining_time": "22:08:33", "throughput": 1696.18, "total_tokens": 35389440} -{"current_steps": 4330, "total_steps": 20825, "loss": 0.9051, "learning_rate": 4.65992824411099e-05, "epoch": 0.20792316926770707, "percentage": 20.79, "elapsed_time": "5:48:37", "remaining_time": "22:08:04", "throughput": 1695.79, "total_tokens": 35471360} -{"current_steps": 4340, "total_steps": 20825, "loss": 1.11, "learning_rate": 4.657930676889526e-05, "epoch": 0.20840336134453782, "percentage": 20.84, "elapsed_time": "5:49:30", "remaining_time": "22:07:35", "throughput": 1695.36, "total_tokens": 35553280} -{"current_steps": 4350, "total_steps": 20825, "loss": 0.7549, "learning_rate": 4.655927690772868e-05, "epoch": 0.20888355342136855, "percentage": 20.89, "elapsed_time": "5:50:24", "remaining_time": "22:07:06", "throughput": 1694.96, "total_tokens": 35635200} -{"current_steps": 4360, "total_steps": 20825, "loss": 0.798, "learning_rate": 4.6539192907908204e-05, "epoch": 0.20936374549819928, "percentage": 20.94, "elapsed_time": "5:51:17", "remaining_time": "22:06:36", "throughput": 1694.56, "total_tokens": 35717120} -{"current_steps": 4370, "total_steps": 20825, "loss": 1.0632, "learning_rate": 4.6519054819867856e-05, "epoch": 0.20984393757503, "percentage": 20.98, "elapsed_time": "5:52:11", "remaining_time": "22:06:07", "throughput": 1694.14, "total_tokens": 35799040} -{"current_steps": 4380, "total_steps": 20825, "loss": 0.9968, "learning_rate": 4.649886269417746e-05, "epoch": 0.21032412965186073, "percentage": 21.03, "elapsed_time": "5:53:04", "remaining_time": "22:05:38", "throughput": 1693.75, "total_tokens": 35880960} -{"current_steps": 4390, "total_steps": 20825, "loss": 0.8916, "learning_rate": 4.647861658154254e-05, "epoch": 0.21080432172869148, "percentage": 21.08, "elapsed_time": "5:53:57", "remaining_time": "22:05:08", "throughput": 1693.35, "total_tokens": 35962880} -{"current_steps": 4400, "total_steps": 20825, "loss": 1.0407, "learning_rate": 4.6458316532804214e-05, "epoch": 0.2112845138055222, "percentage": 21.13, "elapsed_time": "5:54:50", "remaining_time": "22:04:37", "throughput": 1692.98, "total_tokens": 36044800} -{"current_steps": 4410, "total_steps": 20825, "loss": 0.9456, "learning_rate": 4.643796259893899e-05, "epoch": 0.21176470588235294, "percentage": 21.18, "elapsed_time": "5:55:44", "remaining_time": "22:04:07", "throughput": 1692.58, "total_tokens": 36126720} -{"current_steps": 4420, "total_steps": 20825, "loss": 0.9378, "learning_rate": 4.641755483105874e-05, "epoch": 0.21224489795918366, "percentage": 21.22, "elapsed_time": "5:56:37", "remaining_time": "22:03:38", "throughput": 1692.18, "total_tokens": 36208640} -{"current_steps": 4430, "total_steps": 20825, "loss": 0.8205, "learning_rate": 4.63970932804105e-05, "epoch": 0.21272509003601442, "percentage": 21.27, "elapsed_time": "5:57:31", "remaining_time": "22:03:08", "throughput": 1691.77, "total_tokens": 36290560} -{"current_steps": 4440, "total_steps": 20825, "loss": 0.8998, "learning_rate": 4.637657799837635e-05, "epoch": 0.21320528211284515, "percentage": 21.32, "elapsed_time": "5:58:24", "remaining_time": "22:02:38", "throughput": 1691.39, "total_tokens": 36372480} -{"current_steps": 4450, "total_steps": 20825, "loss": 0.8201, "learning_rate": 4.635600903647333e-05, "epoch": 0.21368547418967587, "percentage": 21.37, "elapsed_time": "5:59:17", "remaining_time": "22:02:08", "throughput": 1691.0, "total_tokens": 36454400} -{"current_steps": 4460, "total_steps": 20825, "loss": 0.879, "learning_rate": 4.633538644635326e-05, "epoch": 0.2141656662665066, "percentage": 21.42, "elapsed_time": "6:00:11", "remaining_time": "22:01:38", "throughput": 1690.61, "total_tokens": 36536320} -{"current_steps": 4470, "total_steps": 20825, "loss": 0.9865, "learning_rate": 4.631471027980262e-05, "epoch": 0.21464585834333733, "percentage": 21.46, "elapsed_time": "6:01:04", "remaining_time": "22:01:06", "throughput": 1690.24, "total_tokens": 36618240} -{"current_steps": 4480, "total_steps": 20825, "loss": 0.8658, "learning_rate": 4.629398058874245e-05, "epoch": 0.21512605042016808, "percentage": 21.51, "elapsed_time": "6:01:57", "remaining_time": "22:00:35", "throughput": 1689.87, "total_tokens": 36700160} -{"current_steps": 4490, "total_steps": 20825, "loss": 0.9567, "learning_rate": 4.6273197425228166e-05, "epoch": 0.2156062424969988, "percentage": 21.56, "elapsed_time": "6:02:51", "remaining_time": "22:00:05", "throughput": 1689.49, "total_tokens": 36782080} -{"current_steps": 4500, "total_steps": 20825, "loss": 0.9567, "learning_rate": 4.62523608414495e-05, "epoch": 0.21608643457382953, "percentage": 21.61, "elapsed_time": "6:03:44", "remaining_time": "21:59:33", "throughput": 1689.14, "total_tokens": 36864000} -{"current_steps": 4510, "total_steps": 20825, "loss": 0.7952, "learning_rate": 4.623147088973031e-05, "epoch": 0.21656662665066026, "percentage": 21.66, "elapsed_time": "6:04:37", "remaining_time": "21:59:02", "throughput": 1688.76, "total_tokens": 36945920} -{"current_steps": 4520, "total_steps": 20825, "loss": 1.1468, "learning_rate": 4.6210527622528465e-05, "epoch": 0.217046818727491, "percentage": 21.7, "elapsed_time": "6:05:30", "remaining_time": "21:58:31", "throughput": 1688.38, "total_tokens": 37027840} -{"current_steps": 4530, "total_steps": 20825, "loss": 0.8657, "learning_rate": 4.618953109243573e-05, "epoch": 0.21752701080432174, "percentage": 21.75, "elapsed_time": "6:06:24", "remaining_time": "21:58:00", "throughput": 1688.01, "total_tokens": 37109760} -{"current_steps": 4540, "total_steps": 20825, "loss": 0.9235, "learning_rate": 4.616848135217761e-05, "epoch": 0.21800720288115247, "percentage": 21.8, "elapsed_time": "6:07:17", "remaining_time": "21:57:29", "throughput": 1687.64, "total_tokens": 37191680} -{"current_steps": 4550, "total_steps": 20825, "loss": 0.8308, "learning_rate": 4.6147378454613246e-05, "epoch": 0.2184873949579832, "percentage": 21.85, "elapsed_time": "6:08:11", "remaining_time": "21:56:58", "throughput": 1687.26, "total_tokens": 37273600} -{"current_steps": 4560, "total_steps": 20825, "loss": 0.8878, "learning_rate": 4.6126222452735233e-05, "epoch": 0.21896758703481392, "percentage": 21.9, "elapsed_time": "6:09:04", "remaining_time": "21:56:28", "throughput": 1686.87, "total_tokens": 37355520} -{"current_steps": 4570, "total_steps": 20825, "loss": 0.9695, "learning_rate": 4.6105013399669564e-05, "epoch": 0.21944777911164465, "percentage": 21.94, "elapsed_time": "6:09:57", "remaining_time": "21:55:55", "throughput": 1686.53, "total_tokens": 37437440} -{"current_steps": 4580, "total_steps": 20825, "loss": 0.8531, "learning_rate": 4.608375134867541e-05, "epoch": 0.2199279711884754, "percentage": 21.99, "elapsed_time": "6:10:51", "remaining_time": "21:55:23", "throughput": 1686.17, "total_tokens": 37519360} -{"current_steps": 4590, "total_steps": 20825, "loss": 0.8998, "learning_rate": 4.6062436353145044e-05, "epoch": 0.22040816326530613, "percentage": 22.04, "elapsed_time": "6:11:44", "remaining_time": "21:54:53", "throughput": 1685.78, "total_tokens": 37601280} -{"current_steps": 4600, "total_steps": 20825, "loss": 1.2532, "learning_rate": 4.60410684666037e-05, "epoch": 0.22088835534213686, "percentage": 22.09, "elapsed_time": "6:12:38", "remaining_time": "21:54:21", "throughput": 1685.42, "total_tokens": 37683200} -{"current_steps": 4610, "total_steps": 20825, "loss": 0.9984, "learning_rate": 4.601964774270941e-05, "epoch": 0.22136854741896758, "percentage": 22.14, "elapsed_time": "6:13:31", "remaining_time": "21:53:48", "throughput": 1685.1, "total_tokens": 37765120} -{"current_steps": 4620, "total_steps": 20825, "loss": 1.0361, "learning_rate": 4.599817423525292e-05, "epoch": 0.2218487394957983, "percentage": 22.18, "elapsed_time": "6:14:24", "remaining_time": "21:53:15", "throughput": 1684.76, "total_tokens": 37847040} -{"current_steps": 4630, "total_steps": 20825, "loss": 1.0169, "learning_rate": 4.597664799815749e-05, "epoch": 0.22232893157262906, "percentage": 22.23, "elapsed_time": "6:15:17", "remaining_time": "21:52:43", "throughput": 1684.41, "total_tokens": 37928960} -{"current_steps": 4640, "total_steps": 20825, "loss": 0.9112, "learning_rate": 4.595506908547881e-05, "epoch": 0.2228091236494598, "percentage": 22.28, "elapsed_time": "6:16:10", "remaining_time": "21:52:10", "throughput": 1684.06, "total_tokens": 38010880} -{"current_steps": 4650, "total_steps": 20825, "loss": 0.9424, "learning_rate": 4.593343755140483e-05, "epoch": 0.22328931572629052, "percentage": 22.33, "elapsed_time": "6:17:04", "remaining_time": "21:51:38", "throughput": 1683.71, "total_tokens": 38092800} -{"current_steps": 4660, "total_steps": 20825, "loss": 1.0131, "learning_rate": 4.5911753450255665e-05, "epoch": 0.22376950780312124, "percentage": 22.38, "elapsed_time": "6:18:00", "remaining_time": "21:51:16", "throughput": 1683.13, "total_tokens": 38174720} -{"current_steps": 4670, "total_steps": 20825, "loss": 0.7262, "learning_rate": 4.589001683648343e-05, "epoch": 0.22424969987995197, "percentage": 22.42, "elapsed_time": "6:18:54", "remaining_time": "21:50:44", "throughput": 1682.78, "total_tokens": 38256640} -{"current_steps": 4680, "total_steps": 20825, "loss": 0.9312, "learning_rate": 4.586822776467208e-05, "epoch": 0.22472989195678272, "percentage": 22.47, "elapsed_time": "6:19:48", "remaining_time": "21:50:14", "throughput": 1682.38, "total_tokens": 38338560} -{"current_steps": 4690, "total_steps": 20825, "loss": 0.9062, "learning_rate": 4.584638628953733e-05, "epoch": 0.22521008403361345, "percentage": 22.52, "elapsed_time": "6:20:42", "remaining_time": "21:49:43", "throughput": 1682.01, "total_tokens": 38420480} -{"current_steps": 4700, "total_steps": 20825, "loss": 0.8918, "learning_rate": 4.582449246592647e-05, "epoch": 0.22569027611044418, "percentage": 22.57, "elapsed_time": "6:21:35", "remaining_time": "21:49:10", "throughput": 1681.67, "total_tokens": 38502400} -{"current_steps": 4710, "total_steps": 20825, "loss": 0.8067, "learning_rate": 4.5802546348818264e-05, "epoch": 0.2261704681872749, "percentage": 22.62, "elapsed_time": "6:22:28", "remaining_time": "21:48:37", "throughput": 1681.33, "total_tokens": 38584320} -{"current_steps": 4720, "total_steps": 20825, "loss": 0.9678, "learning_rate": 4.578054799332277e-05, "epoch": 0.22665066026410563, "percentage": 22.67, "elapsed_time": "6:23:22", "remaining_time": "21:48:05", "throughput": 1680.98, "total_tokens": 38666240} -{"current_steps": 4730, "total_steps": 20825, "loss": 1.0305, "learning_rate": 4.575849745468124e-05, "epoch": 0.22713085234093638, "percentage": 22.71, "elapsed_time": "6:24:15", "remaining_time": "21:47:32", "throughput": 1680.65, "total_tokens": 38748160} -{"current_steps": 4740, "total_steps": 20825, "loss": 0.8708, "learning_rate": 4.573639478826596e-05, "epoch": 0.2276110444177671, "percentage": 22.76, "elapsed_time": "6:25:08", "remaining_time": "21:46:59", "throughput": 1680.31, "total_tokens": 38830080} -{"current_steps": 4750, "total_steps": 20825, "loss": 1.0366, "learning_rate": 4.571424004958012e-05, "epoch": 0.22809123649459784, "percentage": 22.81, "elapsed_time": "6:26:02", "remaining_time": "21:46:25", "throughput": 1679.98, "total_tokens": 38912000} -{"current_steps": 4760, "total_steps": 20825, "loss": 1.1274, "learning_rate": 4.5692033294257666e-05, "epoch": 0.22857142857142856, "percentage": 22.86, "elapsed_time": "6:26:55", "remaining_time": "21:45:51", "throughput": 1679.66, "total_tokens": 38993920} -{"current_steps": 4770, "total_steps": 20825, "loss": 0.906, "learning_rate": 4.5669774578063174e-05, "epoch": 0.2290516206482593, "percentage": 22.91, "elapsed_time": "6:27:48", "remaining_time": "21:45:18", "throughput": 1679.34, "total_tokens": 39075840} -{"current_steps": 4780, "total_steps": 20825, "loss": 0.9868, "learning_rate": 4.56474639568917e-05, "epoch": 0.22953181272509005, "percentage": 22.95, "elapsed_time": "6:28:41", "remaining_time": "21:44:43", "throughput": 1679.03, "total_tokens": 39157760} -{"current_steps": 4790, "total_steps": 20825, "loss": 0.9674, "learning_rate": 4.5625101486768626e-05, "epoch": 0.23001200480192077, "percentage": 23.0, "elapsed_time": "6:29:35", "remaining_time": "21:44:10", "throughput": 1678.69, "total_tokens": 39239680} -{"current_steps": 4800, "total_steps": 20825, "loss": 0.944, "learning_rate": 4.560268722384956e-05, "epoch": 0.2304921968787515, "percentage": 23.05, "elapsed_time": "6:30:28", "remaining_time": "21:43:37", "throughput": 1678.36, "total_tokens": 39321600} -{"current_steps": 4810, "total_steps": 20825, "loss": 0.9393, "learning_rate": 4.558022122442016e-05, "epoch": 0.23097238895558223, "percentage": 23.1, "elapsed_time": "6:31:21", "remaining_time": "21:43:02", "throughput": 1678.06, "total_tokens": 39403520} -{"current_steps": 4820, "total_steps": 20825, "loss": 0.9572, "learning_rate": 4.555770354489598e-05, "epoch": 0.23145258103241295, "percentage": 23.15, "elapsed_time": "6:32:14", "remaining_time": "21:42:28", "throughput": 1677.74, "total_tokens": 39485440} -{"current_steps": 4830, "total_steps": 20825, "loss": 0.8217, "learning_rate": 4.5535134241822394e-05, "epoch": 0.2319327731092437, "percentage": 23.19, "elapsed_time": "6:33:08", "remaining_time": "21:41:55", "throughput": 1677.4, "total_tokens": 39567360} -{"current_steps": 4840, "total_steps": 20825, "loss": 0.8829, "learning_rate": 4.551251337187436e-05, "epoch": 0.23241296518607443, "percentage": 23.24, "elapsed_time": "6:34:01", "remaining_time": "21:41:20", "throughput": 1677.1, "total_tokens": 39649280} -{"current_steps": 4850, "total_steps": 20825, "loss": 1.0275, "learning_rate": 4.548984099185638e-05, "epoch": 0.23289315726290516, "percentage": 23.29, "elapsed_time": "6:34:54", "remaining_time": "21:40:46", "throughput": 1676.78, "total_tokens": 39731200} -{"current_steps": 4860, "total_steps": 20825, "loss": 0.8638, "learning_rate": 4.546711715870227e-05, "epoch": 0.23337334933973589, "percentage": 23.34, "elapsed_time": "6:35:49", "remaining_time": "21:40:16", "throughput": 1676.39, "total_tokens": 39813120} -{"current_steps": 4870, "total_steps": 20825, "loss": 0.9251, "learning_rate": 4.5444341929475064e-05, "epoch": 0.23385354141656664, "percentage": 23.39, "elapsed_time": "6:36:42", "remaining_time": "21:39:41", "throughput": 1676.08, "total_tokens": 39895040} -{"current_steps": 4880, "total_steps": 20825, "loss": 1.362, "learning_rate": 4.5421515361366854e-05, "epoch": 0.23433373349339737, "percentage": 23.43, "elapsed_time": "6:37:36", "remaining_time": "21:39:09", "throughput": 1675.73, "total_tokens": 39976960} -{"current_steps": 4890, "total_steps": 20825, "loss": 0.6601, "learning_rate": 4.5398637511698665e-05, "epoch": 0.2348139255702281, "percentage": 23.48, "elapsed_time": "6:38:30", "remaining_time": "21:38:36", "throughput": 1675.37, "total_tokens": 40058880} -{"current_steps": 4900, "total_steps": 20825, "loss": 0.9545, "learning_rate": 4.5375708437920284e-05, "epoch": 0.23529411764705882, "percentage": 23.53, "elapsed_time": "6:39:23", "remaining_time": "21:38:02", "throughput": 1675.06, "total_tokens": 40140800} -{"current_steps": 4910, "total_steps": 20825, "loss": 1.0709, "learning_rate": 4.535272819761014e-05, "epoch": 0.23577430972388955, "percentage": 23.58, "elapsed_time": "6:40:16", "remaining_time": "21:37:27", "throughput": 1674.77, "total_tokens": 40222720} -{"current_steps": 4920, "total_steps": 20825, "loss": 1.0263, "learning_rate": 4.532969684847514e-05, "epoch": 0.2362545018007203, "percentage": 23.63, "elapsed_time": "6:41:10", "remaining_time": "21:36:52", "throughput": 1674.46, "total_tokens": 40304640} -{"current_steps": 4930, "total_steps": 20825, "loss": 0.9399, "learning_rate": 4.530661444835054e-05, "epoch": 0.23673469387755103, "percentage": 23.67, "elapsed_time": "6:42:03", "remaining_time": "21:36:17", "throughput": 1674.16, "total_tokens": 40386560} -{"current_steps": 4940, "total_steps": 20825, "loss": 1.0041, "learning_rate": 4.5283481055199784e-05, "epoch": 0.23721488595438175, "percentage": 23.72, "elapsed_time": "6:42:56", "remaining_time": "21:35:41", "throughput": 1673.88, "total_tokens": 40468480} -{"current_steps": 4950, "total_steps": 20825, "loss": 1.1321, "learning_rate": 4.526029672711437e-05, "epoch": 0.23769507803121248, "percentage": 23.77, "elapsed_time": "6:43:50", "remaining_time": "21:35:07", "throughput": 1673.55, "total_tokens": 40550400} -{"current_steps": 4960, "total_steps": 20825, "loss": 0.9726, "learning_rate": 4.523706152231373e-05, "epoch": 0.2381752701080432, "percentage": 23.82, "elapsed_time": "6:44:43", "remaining_time": "21:34:34", "throughput": 1673.22, "total_tokens": 40632320} -{"current_steps": 4970, "total_steps": 20825, "loss": 1.0489, "learning_rate": 4.5213775499145e-05, "epoch": 0.23865546218487396, "percentage": 23.87, "elapsed_time": "6:45:37", "remaining_time": "21:33:59", "throughput": 1672.91, "total_tokens": 40714240} -{"current_steps": 4980, "total_steps": 20825, "loss": 0.7904, "learning_rate": 4.519043871608297e-05, "epoch": 0.2391356542617047, "percentage": 23.91, "elapsed_time": "6:46:30", "remaining_time": "21:33:25", "throughput": 1672.59, "total_tokens": 40796160} -{"current_steps": 4990, "total_steps": 20825, "loss": 0.8851, "learning_rate": 4.5167051231729894e-05, "epoch": 0.23961584633853542, "percentage": 23.96, "elapsed_time": "6:47:24", "remaining_time": "21:32:50", "throughput": 1672.28, "total_tokens": 40878080} -{"current_steps": 5000, "total_steps": 20825, "loss": 0.9244, "learning_rate": 4.514361310481533e-05, "epoch": 0.24009603841536614, "percentage": 24.01, "elapsed_time": "6:48:18", "remaining_time": "21:32:16", "throughput": 1671.96, "total_tokens": 40960000} -{"current_steps": 5010, "total_steps": 20825, "loss": 0.9562, "learning_rate": 4.512012439419601e-05, "epoch": 0.24057623049219687, "percentage": 24.06, "elapsed_time": "6:49:16", "remaining_time": "21:31:55", "throughput": 1671.36, "total_tokens": 41041920} -{"current_steps": 5020, "total_steps": 20825, "loss": 1.0229, "learning_rate": 4.509658515885568e-05, "epoch": 0.24105642256902762, "percentage": 24.11, "elapsed_time": "6:50:09", "remaining_time": "21:31:22", "throughput": 1671.03, "total_tokens": 41123840} -{"current_steps": 5030, "total_steps": 20825, "loss": 0.8586, "learning_rate": 4.5072995457904995e-05, "epoch": 0.24153661464585835, "percentage": 24.15, "elapsed_time": "6:51:03", "remaining_time": "21:30:46", "throughput": 1670.73, "total_tokens": 41205760} -{"current_steps": 5040, "total_steps": 20825, "loss": 0.9188, "learning_rate": 4.50493553505813e-05, "epoch": 0.24201680672268908, "percentage": 24.2, "elapsed_time": "6:51:56", "remaining_time": "21:30:11", "throughput": 1670.44, "total_tokens": 41287680} -{"current_steps": 5050, "total_steps": 20825, "loss": 1.041, "learning_rate": 4.502566489624855e-05, "epoch": 0.2424969987995198, "percentage": 24.25, "elapsed_time": "6:52:50", "remaining_time": "21:29:35", "throughput": 1670.15, "total_tokens": 41369600} -{"current_steps": 5060, "total_steps": 20825, "loss": 0.9901, "learning_rate": 4.50019241543971e-05, "epoch": 0.24297719087635053, "percentage": 24.3, "elapsed_time": "6:53:43", "remaining_time": "21:28:59", "throughput": 1669.87, "total_tokens": 41451520} -{"current_steps": 5070, "total_steps": 20825, "loss": 0.9472, "learning_rate": 4.4978133184643586e-05, "epoch": 0.24345738295318128, "percentage": 24.35, "elapsed_time": "6:54:36", "remaining_time": "21:28:24", "throughput": 1669.57, "total_tokens": 41533440} -{"current_steps": 5080, "total_steps": 20825, "loss": 0.9372, "learning_rate": 4.495429204673081e-05, "epoch": 0.243937575030012, "percentage": 24.39, "elapsed_time": "6:55:29", "remaining_time": "21:27:48", "throughput": 1669.29, "total_tokens": 41615360} -{"current_steps": 5090, "total_steps": 20825, "loss": 0.8477, "learning_rate": 4.493040080052752e-05, "epoch": 0.24441776710684274, "percentage": 24.44, "elapsed_time": "6:56:23", "remaining_time": "21:27:12", "throughput": 1669.0, "total_tokens": 41697280} -{"current_steps": 5100, "total_steps": 20825, "loss": 1.0359, "learning_rate": 4.49064595060283e-05, "epoch": 0.24489795918367346, "percentage": 24.49, "elapsed_time": "6:57:16", "remaining_time": "21:26:36", "throughput": 1668.71, "total_tokens": 41779200} -{"current_steps": 5110, "total_steps": 20825, "loss": 1.027, "learning_rate": 4.488246822335341e-05, "epoch": 0.2453781512605042, "percentage": 24.54, "elapsed_time": "6:58:10", "remaining_time": "21:26:01", "throughput": 1668.41, "total_tokens": 41861120} -{"current_steps": 5120, "total_steps": 20825, "loss": 1.4544, "learning_rate": 4.485842701274865e-05, "epoch": 0.24585834333733494, "percentage": 24.59, "elapsed_time": "6:59:04", "remaining_time": "21:25:27", "throughput": 1668.1, "total_tokens": 41943040} -{"current_steps": 5130, "total_steps": 20825, "loss": 0.8381, "learning_rate": 4.4834335934585194e-05, "epoch": 0.24633853541416567, "percentage": 24.63, "elapsed_time": "6:59:57", "remaining_time": "21:24:51", "throughput": 1667.8, "total_tokens": 42024960} -{"current_steps": 5140, "total_steps": 20825, "loss": 0.8446, "learning_rate": 4.4810195049359435e-05, "epoch": 0.2468187274909964, "percentage": 24.68, "elapsed_time": "7:00:51", "remaining_time": "21:24:15", "throughput": 1667.52, "total_tokens": 42106880} -{"current_steps": 5150, "total_steps": 20825, "loss": 0.9213, "learning_rate": 4.4786004417692836e-05, "epoch": 0.24729891956782712, "percentage": 24.73, "elapsed_time": "7:01:44", "remaining_time": "21:23:38", "throughput": 1667.25, "total_tokens": 42188800} -{"current_steps": 5160, "total_steps": 20825, "loss": 1.0777, "learning_rate": 4.4761764100331795e-05, "epoch": 0.24777911164465785, "percentage": 24.78, "elapsed_time": "7:02:37", "remaining_time": "21:23:02", "throughput": 1666.97, "total_tokens": 42270720} -{"current_steps": 5170, "total_steps": 20825, "loss": 0.8808, "learning_rate": 4.473747415814747e-05, "epoch": 0.2482593037214886, "percentage": 24.83, "elapsed_time": "7:03:31", "remaining_time": "21:22:26", "throughput": 1666.69, "total_tokens": 42352640} -{"current_steps": 5180, "total_steps": 20825, "loss": 1.0989, "learning_rate": 4.471313465213562e-05, "epoch": 0.24873949579831933, "percentage": 24.87, "elapsed_time": "7:04:25", "remaining_time": "21:21:51", "throughput": 1666.38, "total_tokens": 42434560} -{"current_steps": 5190, "total_steps": 20825, "loss": 0.8832, "learning_rate": 4.46887456434165e-05, "epoch": 0.24921968787515006, "percentage": 24.92, "elapsed_time": "7:05:18", "remaining_time": "21:21:16", "throughput": 1666.08, "total_tokens": 42516480} -{"current_steps": 5200, "total_steps": 20825, "loss": 0.843, "learning_rate": 4.466430719323465e-05, "epoch": 0.24969987995198079, "percentage": 24.97, "elapsed_time": "7:06:12", "remaining_time": "21:20:41", "throughput": 1665.77, "total_tokens": 42598400} -{"current_steps": 5210, "total_steps": 20825, "loss": 1.096, "learning_rate": 4.463981936295876e-05, "epoch": 0.25018007202881154, "percentage": 25.02, "elapsed_time": "7:07:06", "remaining_time": "21:20:05", "throughput": 1665.47, "total_tokens": 42680320} -{"current_steps": 5220, "total_steps": 20825, "loss": 0.8411, "learning_rate": 4.461528221408153e-05, "epoch": 0.25066026410564224, "percentage": 25.07, "elapsed_time": "7:08:00", "remaining_time": "21:19:31", "throughput": 1665.16, "total_tokens": 42762240} -{"current_steps": 5230, "total_steps": 20825, "loss": 0.9483, "learning_rate": 4.459069580821953e-05, "epoch": 0.251140456182473, "percentage": 25.11, "elapsed_time": "7:08:54", "remaining_time": "21:18:55", "throughput": 1664.87, "total_tokens": 42844160} -{"current_steps": 5240, "total_steps": 20825, "loss": 0.7803, "learning_rate": 4.4566060207112983e-05, "epoch": 0.25162064825930375, "percentage": 25.16, "elapsed_time": "7:09:48", "remaining_time": "21:18:21", "throughput": 1664.53, "total_tokens": 42926080} -{"current_steps": 5250, "total_steps": 20825, "loss": 0.9638, "learning_rate": 4.454137547262566e-05, "epoch": 0.25210084033613445, "percentage": 25.21, "elapsed_time": "7:10:42", "remaining_time": "21:17:46", "throughput": 1664.23, "total_tokens": 43008000} -{"current_steps": 5260, "total_steps": 20825, "loss": 0.9499, "learning_rate": 4.451664166674472e-05, "epoch": 0.2525810324129652, "percentage": 25.26, "elapsed_time": "7:11:35", "remaining_time": "21:17:09", "throughput": 1663.97, "total_tokens": 43089920} -{"current_steps": 5270, "total_steps": 20825, "loss": 0.8689, "learning_rate": 4.449185885158056e-05, "epoch": 0.2530612244897959, "percentage": 25.31, "elapsed_time": "7:12:29", "remaining_time": "21:16:32", "throughput": 1663.7, "total_tokens": 43171840} -{"current_steps": 5280, "total_steps": 20825, "loss": 0.9125, "learning_rate": 4.4467027089366625e-05, "epoch": 0.25354141656662665, "percentage": 25.35, "elapsed_time": "7:13:22", "remaining_time": "21:15:55", "throughput": 1663.44, "total_tokens": 43253760} -{"current_steps": 5290, "total_steps": 20825, "loss": 0.9452, "learning_rate": 4.444214644245928e-05, "epoch": 0.2540216086434574, "percentage": 25.4, "elapsed_time": "7:14:16", "remaining_time": "21:15:18", "throughput": 1663.17, "total_tokens": 43335680} -{"current_steps": 5300, "total_steps": 20825, "loss": 0.8625, "learning_rate": 4.441721697333765e-05, "epoch": 0.2545018007202881, "percentage": 25.45, "elapsed_time": "7:15:08", "remaining_time": "21:14:39", "throughput": 1662.94, "total_tokens": 43417600} -{"current_steps": 5310, "total_steps": 20825, "loss": 0.8692, "learning_rate": 4.4392238744603464e-05, "epoch": 0.25498199279711886, "percentage": 25.5, "elapsed_time": "7:16:02", "remaining_time": "21:14:02", "throughput": 1662.67, "total_tokens": 43499520} -{"current_steps": 5320, "total_steps": 20825, "loss": 1.0077, "learning_rate": 4.436721181898088e-05, "epoch": 0.25546218487394956, "percentage": 25.55, "elapsed_time": "7:16:55", "remaining_time": "21:13:25", "throughput": 1662.41, "total_tokens": 43581440} -{"current_steps": 5330, "total_steps": 20825, "loss": 0.9048, "learning_rate": 4.434213625931636e-05, "epoch": 0.2559423769507803, "percentage": 25.59, "elapsed_time": "7:17:49", "remaining_time": "21:12:48", "throughput": 1662.14, "total_tokens": 43663360} -{"current_steps": 5340, "total_steps": 20825, "loss": 0.9174, "learning_rate": 4.431701212857847e-05, "epoch": 0.25642256902761107, "percentage": 25.64, "elapsed_time": "7:18:42", "remaining_time": "21:12:11", "throughput": 1661.88, "total_tokens": 43745280} -{"current_steps": 5350, "total_steps": 20825, "loss": 0.7608, "learning_rate": 4.429183948985777e-05, "epoch": 0.25690276110444177, "percentage": 25.69, "elapsed_time": "7:19:37", "remaining_time": "21:11:36", "throughput": 1661.56, "total_tokens": 43827200} -{"current_steps": 5360, "total_steps": 20825, "loss": 0.8841, "learning_rate": 4.426661840636662e-05, "epoch": 0.2573829531812725, "percentage": 25.74, "elapsed_time": "7:20:30", "remaining_time": "21:10:58", "throughput": 1661.32, "total_tokens": 43909120} -{"current_steps": 5370, "total_steps": 20825, "loss": 1.0389, "learning_rate": 4.424134894143903e-05, "epoch": 0.2578631452581032, "percentage": 25.79, "elapsed_time": "7:21:23", "remaining_time": "21:10:20", "throughput": 1661.07, "total_tokens": 43991040} -{"current_steps": 5380, "total_steps": 20825, "loss": 1.0486, "learning_rate": 4.42160311585305e-05, "epoch": 0.258343337334934, "percentage": 25.83, "elapsed_time": "7:22:16", "remaining_time": "21:09:41", "throughput": 1660.83, "total_tokens": 44072960} -{"current_steps": 5390, "total_steps": 20825, "loss": 0.6945, "learning_rate": 4.419066512121788e-05, "epoch": 0.25882352941176473, "percentage": 25.88, "elapsed_time": "7:23:10", "remaining_time": "21:09:05", "throughput": 1660.55, "total_tokens": 44154880} -{"current_steps": 5400, "total_steps": 20825, "loss": 0.8972, "learning_rate": 4.4165250893199176e-05, "epoch": 0.25930372148859543, "percentage": 25.93, "elapsed_time": "7:24:04", "remaining_time": "21:08:29", "throughput": 1660.27, "total_tokens": 44236800} -{"current_steps": 5410, "total_steps": 20825, "loss": 0.8574, "learning_rate": 4.413978853829342e-05, "epoch": 0.2597839135654262, "percentage": 25.98, "elapsed_time": "7:24:57", "remaining_time": "21:07:51", "throughput": 1660.01, "total_tokens": 44318720} -{"current_steps": 5420, "total_steps": 20825, "loss": 0.9521, "learning_rate": 4.411427812044049e-05, "epoch": 0.2602641056422569, "percentage": 26.03, "elapsed_time": "7:25:51", "remaining_time": "21:07:13", "throughput": 1659.77, "total_tokens": 44400640} -{"current_steps": 5430, "total_steps": 20825, "loss": 1.0423, "learning_rate": 4.408871970370096e-05, "epoch": 0.26074429771908764, "percentage": 26.07, "elapsed_time": "7:26:44", "remaining_time": "21:06:35", "throughput": 1659.52, "total_tokens": 44482560} -{"current_steps": 5440, "total_steps": 20825, "loss": 0.9938, "learning_rate": 4.406311335225595e-05, "epoch": 0.2612244897959184, "percentage": 26.12, "elapsed_time": "7:27:37", "remaining_time": "21:05:57", "throughput": 1659.26, "total_tokens": 44564480} -{"current_steps": 5450, "total_steps": 20825, "loss": 0.8559, "learning_rate": 4.4037459130406923e-05, "epoch": 0.2617046818727491, "percentage": 26.17, "elapsed_time": "7:28:31", "remaining_time": "21:05:20", "throughput": 1658.99, "total_tokens": 44646400} -{"current_steps": 5460, "total_steps": 20825, "loss": 0.9533, "learning_rate": 4.401175710257558e-05, "epoch": 0.26218487394957984, "percentage": 26.22, "elapsed_time": "7:29:25", "remaining_time": "21:04:43", "throughput": 1658.73, "total_tokens": 44728320} -{"current_steps": 5470, "total_steps": 20825, "loss": 0.8958, "learning_rate": 4.398600733330365e-05, "epoch": 0.26266506602641054, "percentage": 26.27, "elapsed_time": "7:30:18", "remaining_time": "21:04:04", "throughput": 1658.49, "total_tokens": 44810240} -{"current_steps": 5480, "total_steps": 20825, "loss": 1.1406, "learning_rate": 4.3960209887252766e-05, "epoch": 0.2631452581032413, "percentage": 26.31, "elapsed_time": "7:31:13", "remaining_time": "21:03:30", "throughput": 1658.17, "total_tokens": 44892160} -{"current_steps": 5490, "total_steps": 20825, "loss": 1.0363, "learning_rate": 4.3934364829204265e-05, "epoch": 0.26362545018007205, "percentage": 26.36, "elapsed_time": "7:32:06", "remaining_time": "21:02:51", "throughput": 1657.93, "total_tokens": 44974080} -{"current_steps": 5500, "total_steps": 20825, "loss": 0.876, "learning_rate": 4.3908472224059064e-05, "epoch": 0.26410564225690275, "percentage": 26.41, "elapsed_time": "7:32:59", "remaining_time": "21:02:12", "throughput": 1657.7, "total_tokens": 45056000} -{"current_steps": 5510, "total_steps": 20825, "loss": 0.8846, "learning_rate": 4.388253213683747e-05, "epoch": 0.2645858343337335, "percentage": 26.46, "elapsed_time": "7:33:52", "remaining_time": "21:01:33", "throughput": 1657.48, "total_tokens": 45137920} -{"current_steps": 5520, "total_steps": 20825, "loss": 0.841, "learning_rate": 4.385654463267901e-05, "epoch": 0.2650660264105642, "percentage": 26.51, "elapsed_time": "7:34:45", "remaining_time": "21:00:53", "throughput": 1657.26, "total_tokens": 45219840} -{"current_steps": 5530, "total_steps": 20825, "loss": 1.1015, "learning_rate": 4.383050977684231e-05, "epoch": 0.26554621848739496, "percentage": 26.55, "elapsed_time": "7:35:39", "remaining_time": "21:00:14", "throughput": 1657.04, "total_tokens": 45301760} -{"current_steps": 5540, "total_steps": 20825, "loss": 0.7614, "learning_rate": 4.3804427634704885e-05, "epoch": 0.2660264105642257, "percentage": 26.6, "elapsed_time": "7:36:31", "remaining_time": "20:59:35", "throughput": 1656.83, "total_tokens": 45383680} -{"current_steps": 5550, "total_steps": 20825, "loss": 0.8541, "learning_rate": 4.3778298271762995e-05, "epoch": 0.2665066026410564, "percentage": 26.65, "elapsed_time": "7:37:25", "remaining_time": "20:58:56", "throughput": 1656.59, "total_tokens": 45465600} -{"current_steps": 5560, "total_steps": 20825, "loss": 0.9464, "learning_rate": 4.375212175363149e-05, "epoch": 0.26698679471788717, "percentage": 26.7, "elapsed_time": "7:38:18", "remaining_time": "20:58:17", "throughput": 1656.36, "total_tokens": 45547520} -{"current_steps": 5570, "total_steps": 20825, "loss": 0.8231, "learning_rate": 4.372589814604362e-05, "epoch": 0.26746698679471786, "percentage": 26.75, "elapsed_time": "7:39:12", "remaining_time": "20:57:40", "throughput": 1656.09, "total_tokens": 45629440} -{"current_steps": 5580, "total_steps": 20825, "loss": 0.8247, "learning_rate": 4.369962751485089e-05, "epoch": 0.2679471788715486, "percentage": 26.79, "elapsed_time": "7:40:05", "remaining_time": "20:57:00", "throughput": 1655.87, "total_tokens": 45711360} -{"current_steps": 5590, "total_steps": 20825, "loss": 0.7793, "learning_rate": 4.367330992602289e-05, "epoch": 0.2684273709483794, "percentage": 26.84, "elapsed_time": "7:40:59", "remaining_time": "20:56:22", "throughput": 1655.62, "total_tokens": 45793280} -{"current_steps": 5600, "total_steps": 20825, "loss": 0.7808, "learning_rate": 4.3646945445647114e-05, "epoch": 0.2689075630252101, "percentage": 26.89, "elapsed_time": "7:41:52", "remaining_time": "20:55:44", "throughput": 1655.38, "total_tokens": 45875200} -{"current_steps": 5610, "total_steps": 20825, "loss": 1.023, "learning_rate": 4.362053413992883e-05, "epoch": 0.2693877551020408, "percentage": 26.94, "elapsed_time": "7:42:46", "remaining_time": "20:55:04", "throughput": 1655.16, "total_tokens": 45957120} -{"current_steps": 5620, "total_steps": 20825, "loss": 0.7344, "learning_rate": 4.359407607519088e-05, "epoch": 0.2698679471788715, "percentage": 26.99, "elapsed_time": "7:43:39", "remaining_time": "20:54:25", "throughput": 1654.92, "total_tokens": 46039040} -{"current_steps": 5630, "total_steps": 20825, "loss": 0.9653, "learning_rate": 4.356757131787353e-05, "epoch": 0.2703481392557023, "percentage": 27.03, "elapsed_time": "7:44:33", "remaining_time": "20:53:48", "throughput": 1654.66, "total_tokens": 46120960} -{"current_steps": 5640, "total_steps": 20825, "loss": 0.8851, "learning_rate": 4.354101993453429e-05, "epoch": 0.27082833133253303, "percentage": 27.08, "elapsed_time": "7:45:26", "remaining_time": "20:53:09", "throughput": 1654.44, "total_tokens": 46202880} -{"current_steps": 5650, "total_steps": 20825, "loss": 0.8417, "learning_rate": 4.3514421991847746e-05, "epoch": 0.27130852340936373, "percentage": 27.13, "elapsed_time": "7:46:20", "remaining_time": "20:52:30", "throughput": 1654.19, "total_tokens": 46284800} -{"current_steps": 5660, "total_steps": 20825, "loss": 0.8548, "learning_rate": 4.3487777556605446e-05, "epoch": 0.2717887154861945, "percentage": 27.18, "elapsed_time": "7:47:13", "remaining_time": "20:51:51", "throughput": 1653.95, "total_tokens": 46366720} -{"current_steps": 5670, "total_steps": 20825, "loss": 1.0355, "learning_rate": 4.3461086695715625e-05, "epoch": 0.2722689075630252, "percentage": 27.23, "elapsed_time": "7:48:07", "remaining_time": "20:51:13", "throughput": 1653.7, "total_tokens": 46448640} -{"current_steps": 5680, "total_steps": 20825, "loss": 0.799, "learning_rate": 4.343434947620315e-05, "epoch": 0.27274909963985594, "percentage": 27.27, "elapsed_time": "7:49:00", "remaining_time": "20:50:33", "throughput": 1653.5, "total_tokens": 46530560} -{"current_steps": 5690, "total_steps": 20825, "loss": 0.9427, "learning_rate": 4.340756596520929e-05, "epoch": 0.2732292917166867, "percentage": 27.32, "elapsed_time": "7:49:53", "remaining_time": "20:49:53", "throughput": 1653.29, "total_tokens": 46612480} -{"current_steps": 5700, "total_steps": 20825, "loss": 0.904, "learning_rate": 4.338073622999154e-05, "epoch": 0.2737094837935174, "percentage": 27.37, "elapsed_time": "7:50:46", "remaining_time": "20:49:13", "throughput": 1653.08, "total_tokens": 46694400} -{"current_steps": 5710, "total_steps": 20825, "loss": 1.2054, "learning_rate": 4.335386033792347e-05, "epoch": 0.27418967587034815, "percentage": 27.42, "elapsed_time": "7:51:40", "remaining_time": "20:48:34", "throughput": 1652.85, "total_tokens": 46776320} -{"current_steps": 5720, "total_steps": 20825, "loss": 0.8869, "learning_rate": 4.332693835649461e-05, "epoch": 0.27466986794717885, "percentage": 27.47, "elapsed_time": "7:52:33", "remaining_time": "20:47:55", "throughput": 1652.62, "total_tokens": 46858240} -{"current_steps": 5730, "total_steps": 20825, "loss": 0.9947, "learning_rate": 4.329997035331015e-05, "epoch": 0.2751500600240096, "percentage": 27.52, "elapsed_time": "7:53:27", "remaining_time": "20:47:15", "throughput": 1652.39, "total_tokens": 46940160} -{"current_steps": 5740, "total_steps": 20825, "loss": 0.8496, "learning_rate": 4.3272956396090906e-05, "epoch": 0.27563025210084036, "percentage": 27.56, "elapsed_time": "7:54:20", "remaining_time": "20:46:36", "throughput": 1652.17, "total_tokens": 47022080} -{"current_steps": 5750, "total_steps": 20825, "loss": 0.9618, "learning_rate": 4.324589655267306e-05, "epoch": 0.27611044417767105, "percentage": 27.61, "elapsed_time": "7:55:13", "remaining_time": "20:45:55", "throughput": 1651.97, "total_tokens": 47104000} -{"current_steps": 5760, "total_steps": 20825, "loss": 1.065, "learning_rate": 4.321879089100805e-05, "epoch": 0.2765906362545018, "percentage": 27.66, "elapsed_time": "7:56:06", "remaining_time": "20:45:15", "throughput": 1651.76, "total_tokens": 47185920} -{"current_steps": 5770, "total_steps": 20825, "loss": 0.9001, "learning_rate": 4.319163947916234e-05, "epoch": 0.2770708283313325, "percentage": 27.71, "elapsed_time": "7:57:00", "remaining_time": "20:44:35", "throughput": 1651.56, "total_tokens": 47267840} -{"current_steps": 5780, "total_steps": 20825, "loss": 0.9649, "learning_rate": 4.316444238531729e-05, "epoch": 0.27755102040816326, "percentage": 27.76, "elapsed_time": "7:57:53", "remaining_time": "20:43:55", "throughput": 1651.34, "total_tokens": 47349760} -{"current_steps": 5790, "total_steps": 20825, "loss": 0.9746, "learning_rate": 4.313719967776899e-05, "epoch": 0.278031212484994, "percentage": 27.8, "elapsed_time": "7:58:46", "remaining_time": "20:43:15", "throughput": 1651.13, "total_tokens": 47431680} -{"current_steps": 5800, "total_steps": 20825, "loss": 1.0193, "learning_rate": 4.310991142492805e-05, "epoch": 0.2785114045618247, "percentage": 27.85, "elapsed_time": "7:59:40", "remaining_time": "20:42:35", "throughput": 1650.91, "total_tokens": 47513600} -{"current_steps": 5810, "total_steps": 20825, "loss": 0.9313, "learning_rate": 4.308257769531947e-05, "epoch": 0.27899159663865547, "percentage": 27.9, "elapsed_time": "8:00:33", "remaining_time": "20:41:55", "throughput": 1650.7, "total_tokens": 47595520} -{"current_steps": 5820, "total_steps": 20825, "loss": 1.0058, "learning_rate": 4.3055198557582445e-05, "epoch": 0.27947178871548617, "percentage": 27.95, "elapsed_time": "8:01:26", "remaining_time": "20:41:15", "throughput": 1650.49, "total_tokens": 47677440} -{"current_steps": 5830, "total_steps": 20825, "loss": 1.1261, "learning_rate": 4.3027774080470174e-05, "epoch": 0.2799519807923169, "percentage": 28.0, "elapsed_time": "8:02:19", "remaining_time": "20:40:34", "throughput": 1650.29, "total_tokens": 47759360} -{"current_steps": 5840, "total_steps": 20825, "loss": 0.8111, "learning_rate": 4.300030433284974e-05, "epoch": 0.2804321728691477, "percentage": 28.04, "elapsed_time": "8:03:13", "remaining_time": "20:39:55", "throughput": 1650.06, "total_tokens": 47841280} -{"current_steps": 5850, "total_steps": 20825, "loss": 0.7262, "learning_rate": 4.29727893837019e-05, "epoch": 0.2809123649459784, "percentage": 28.09, "elapsed_time": "8:04:06", "remaining_time": "20:39:15", "throughput": 1649.85, "total_tokens": 47923200} -{"current_steps": 5860, "total_steps": 20825, "loss": 0.809, "learning_rate": 4.294522930212091e-05, "epoch": 0.28139255702280913, "percentage": 28.14, "elapsed_time": "8:05:00", "remaining_time": "20:38:34", "throughput": 1649.66, "total_tokens": 48005120} -{"current_steps": 5870, "total_steps": 20825, "loss": 0.9162, "learning_rate": 4.291762415731437e-05, "epoch": 0.28187274909963983, "percentage": 28.19, "elapsed_time": "8:05:53", "remaining_time": "20:37:53", "throughput": 1649.47, "total_tokens": 48087040} -{"current_steps": 5880, "total_steps": 20825, "loss": 1.0343, "learning_rate": 4.288997401860303e-05, "epoch": 0.2823529411764706, "percentage": 28.24, "elapsed_time": "8:06:47", "remaining_time": "20:37:15", "throughput": 1649.21, "total_tokens": 48168960} -{"current_steps": 5890, "total_steps": 20825, "loss": 1.36, "learning_rate": 4.286227895542064e-05, "epoch": 0.28283313325330134, "percentage": 28.28, "elapsed_time": "8:07:40", "remaining_time": "20:36:34", "throughput": 1649.01, "total_tokens": 48250880} -{"current_steps": 5900, "total_steps": 20825, "loss": 0.8472, "learning_rate": 4.283453903731375e-05, "epoch": 0.28331332533013204, "percentage": 28.33, "elapsed_time": "8:08:33", "remaining_time": "20:35:54", "throughput": 1648.8, "total_tokens": 48332800} -{"current_steps": 5910, "total_steps": 20825, "loss": 1.1295, "learning_rate": 4.2806754333941546e-05, "epoch": 0.2837935174069628, "percentage": 28.38, "elapsed_time": "8:09:27", "remaining_time": "20:35:13", "throughput": 1648.6, "total_tokens": 48414720} -{"current_steps": 5920, "total_steps": 20825, "loss": 0.9477, "learning_rate": 4.2778924915075704e-05, "epoch": 0.2842737094837935, "percentage": 28.43, "elapsed_time": "8:10:20", "remaining_time": "20:34:33", "throughput": 1648.39, "total_tokens": 48496640} -{"current_steps": 5930, "total_steps": 20825, "loss": 0.93, "learning_rate": 4.275105085060014e-05, "epoch": 0.28475390156062425, "percentage": 28.48, "elapsed_time": "8:11:13", "remaining_time": "20:33:51", "throughput": 1648.21, "total_tokens": 48578560} -{"current_steps": 5940, "total_steps": 20825, "loss": 1.0398, "learning_rate": 4.272313221051094e-05, "epoch": 0.285234093637455, "percentage": 28.52, "elapsed_time": "8:12:06", "remaining_time": "20:33:11", "throughput": 1648.0, "total_tokens": 48660480} -{"current_steps": 5950, "total_steps": 20825, "loss": 0.9514, "learning_rate": 4.269516906491607e-05, "epoch": 0.2857142857142857, "percentage": 28.57, "elapsed_time": "8:13:00", "remaining_time": "20:32:30", "throughput": 1647.8, "total_tokens": 48742400} -{"current_steps": 5960, "total_steps": 20825, "loss": 0.7283, "learning_rate": 4.266716148403529e-05, "epoch": 0.28619447779111645, "percentage": 28.62, "elapsed_time": "8:13:53", "remaining_time": "20:31:49", "throughput": 1647.61, "total_tokens": 48824320} -{"current_steps": 5970, "total_steps": 20825, "loss": 0.9808, "learning_rate": 4.263910953819993e-05, "epoch": 0.28667466986794715, "percentage": 28.67, "elapsed_time": "8:14:46", "remaining_time": "20:31:08", "throughput": 1647.42, "total_tokens": 48906240} -{"current_steps": 5980, "total_steps": 20825, "loss": 0.9758, "learning_rate": 4.2611013297852744e-05, "epoch": 0.2871548619447779, "percentage": 28.72, "elapsed_time": "8:15:40", "remaining_time": "20:30:27", "throughput": 1647.21, "total_tokens": 48988160} -{"current_steps": 5990, "total_steps": 20825, "loss": 0.9226, "learning_rate": 4.2582872833547693e-05, "epoch": 0.28763505402160866, "percentage": 28.76, "elapsed_time": "8:16:33", "remaining_time": "20:29:47", "throughput": 1647.0, "total_tokens": 49070080} -{"current_steps": 6000, "total_steps": 20825, "loss": 1.0878, "learning_rate": 4.255468821594981e-05, "epoch": 0.28811524609843936, "percentage": 28.81, "elapsed_time": "8:17:27", "remaining_time": "20:29:07", "throughput": 1646.79, "total_tokens": 49152000} -{"current_steps": 6010, "total_steps": 20825, "loss": 0.917, "learning_rate": 4.2526459515834996e-05, "epoch": 0.2885954381752701, "percentage": 28.86, "elapsed_time": "8:18:23", "remaining_time": "20:28:34", "throughput": 1646.41, "total_tokens": 49233920} -{"current_steps": 6020, "total_steps": 20825, "loss": 1.0098, "learning_rate": 4.249818680408984e-05, "epoch": 0.28907563025210087, "percentage": 28.91, "elapsed_time": "8:19:17", "remaining_time": "20:27:54", "throughput": 1646.19, "total_tokens": 49315840} -{"current_steps": 6030, "total_steps": 20825, "loss": 1.0573, "learning_rate": 4.246987015171148e-05, "epoch": 0.28955582232893157, "percentage": 28.96, "elapsed_time": "8:20:10", "remaining_time": "20:27:13", "throughput": 1646.0, "total_tokens": 49397760} -{"current_steps": 6040, "total_steps": 20825, "loss": 1.1285, "learning_rate": 4.244150962980735e-05, "epoch": 0.2900360144057623, "percentage": 29.0, "elapsed_time": "8:21:04", "remaining_time": "20:26:32", "throughput": 1645.81, "total_tokens": 49479680} -{"current_steps": 6050, "total_steps": 20825, "loss": 0.9014, "learning_rate": 4.2413105309595105e-05, "epoch": 0.290516206482593, "percentage": 29.05, "elapsed_time": "8:21:57", "remaining_time": "20:25:52", "throughput": 1645.59, "total_tokens": 49561600} -{"current_steps": 6060, "total_steps": 20825, "loss": 0.8398, "learning_rate": 4.238465726240233e-05, "epoch": 0.2909963985594238, "percentage": 29.1, "elapsed_time": "8:22:51", "remaining_time": "20:25:11", "throughput": 1645.38, "total_tokens": 49643520} -{"current_steps": 6070, "total_steps": 20825, "loss": 0.879, "learning_rate": 4.235616555966645e-05, "epoch": 0.29147659063625453, "percentage": 29.15, "elapsed_time": "8:23:44", "remaining_time": "20:24:30", "throughput": 1645.19, "total_tokens": 49725440} -{"current_steps": 6080, "total_steps": 20825, "loss": 0.7561, "learning_rate": 4.232763027293451e-05, "epoch": 0.29195678271308523, "percentage": 29.2, "elapsed_time": "8:24:38", "remaining_time": "20:23:49", "throughput": 1645.0, "total_tokens": 49807360} -{"current_steps": 6090, "total_steps": 20825, "loss": 1.0367, "learning_rate": 4.2299051473862976e-05, "epoch": 0.292436974789916, "percentage": 29.24, "elapsed_time": "8:25:31", "remaining_time": "20:23:07", "throughput": 1644.81, "total_tokens": 49889280} -{"current_steps": 6100, "total_steps": 20825, "loss": 0.979, "learning_rate": 4.227042923421762e-05, "epoch": 0.2929171668667467, "percentage": 29.29, "elapsed_time": "8:26:24", "remaining_time": "20:22:26", "throughput": 1644.62, "total_tokens": 49971200} -{"current_steps": 6110, "total_steps": 20825, "loss": 0.9951, "learning_rate": 4.224176362587326e-05, "epoch": 0.29339735894357744, "percentage": 29.34, "elapsed_time": "8:27:18", "remaining_time": "20:21:45", "throughput": 1644.42, "total_tokens": 50053120} -{"current_steps": 6120, "total_steps": 20825, "loss": 0.8707, "learning_rate": 4.221305472081365e-05, "epoch": 0.2938775510204082, "percentage": 29.39, "elapsed_time": "8:28:11", "remaining_time": "20:21:04", "throughput": 1644.23, "total_tokens": 50135040} -{"current_steps": 6130, "total_steps": 20825, "loss": 0.9571, "learning_rate": 4.2184302591131264e-05, "epoch": 0.2943577430972389, "percentage": 29.44, "elapsed_time": "8:29:04", "remaining_time": "20:20:21", "throughput": 1644.07, "total_tokens": 50216960} -{"current_steps": 6140, "total_steps": 20825, "loss": 1.0041, "learning_rate": 4.21555073090271e-05, "epoch": 0.29483793517406964, "percentage": 29.48, "elapsed_time": "8:29:57", "remaining_time": "20:19:40", "throughput": 1643.88, "total_tokens": 50298880} -{"current_steps": 6150, "total_steps": 20825, "loss": 1.1052, "learning_rate": 4.2126668946810545e-05, "epoch": 0.29531812725090034, "percentage": 29.53, "elapsed_time": "8:30:50", "remaining_time": "20:18:58", "throughput": 1643.7, "total_tokens": 50380800} -{"current_steps": 6160, "total_steps": 20825, "loss": 0.7878, "learning_rate": 4.2097787576899144e-05, "epoch": 0.2957983193277311, "percentage": 29.58, "elapsed_time": "8:31:44", "remaining_time": "20:18:16", "throughput": 1643.51, "total_tokens": 50462720} -{"current_steps": 6170, "total_steps": 20825, "loss": 0.8359, "learning_rate": 4.2068863271818455e-05, "epoch": 0.29627851140456185, "percentage": 29.63, "elapsed_time": "8:32:37", "remaining_time": "20:17:34", "throughput": 1643.34, "total_tokens": 50544640} -{"current_steps": 6180, "total_steps": 20825, "loss": 0.7906, "learning_rate": 4.2039896104201844e-05, "epoch": 0.29675870348139255, "percentage": 29.68, "elapsed_time": "8:33:30", "remaining_time": "20:16:53", "throughput": 1643.14, "total_tokens": 50626560} -{"current_steps": 6190, "total_steps": 20825, "loss": 0.8226, "learning_rate": 4.201088614679032e-05, "epoch": 0.2972388955582233, "percentage": 29.72, "elapsed_time": "8:34:24", "remaining_time": "20:16:12", "throughput": 1642.94, "total_tokens": 50708480} -{"current_steps": 6200, "total_steps": 20825, "loss": 0.922, "learning_rate": 4.198183347243233e-05, "epoch": 0.297719087635054, "percentage": 29.77, "elapsed_time": "8:35:17", "remaining_time": "20:15:31", "throughput": 1642.76, "total_tokens": 50790400} -{"current_steps": 6210, "total_steps": 20825, "loss": 0.8489, "learning_rate": 4.1952738154083614e-05, "epoch": 0.29819927971188476, "percentage": 29.82, "elapsed_time": "8:36:10", "remaining_time": "20:14:48", "throughput": 1642.58, "total_tokens": 50872320} -{"current_steps": 6220, "total_steps": 20825, "loss": 0.9279, "learning_rate": 4.1923600264806975e-05, "epoch": 0.2986794717887155, "percentage": 29.87, "elapsed_time": "8:37:04", "remaining_time": "20:14:06", "throughput": 1642.41, "total_tokens": 50954240} -{"current_steps": 6230, "total_steps": 20825, "loss": 0.8793, "learning_rate": 4.189441987777212e-05, "epoch": 0.2991596638655462, "percentage": 29.92, "elapsed_time": "8:37:57", "remaining_time": "20:13:24", "throughput": 1642.23, "total_tokens": 51036160} -{"current_steps": 6240, "total_steps": 20825, "loss": 0.8057, "learning_rate": 4.186519706625549e-05, "epoch": 0.29963985594237696, "percentage": 29.96, "elapsed_time": "8:38:51", "remaining_time": "20:12:44", "throughput": 1642.02, "total_tokens": 51118080} -{"current_steps": 6250, "total_steps": 20825, "loss": 1.0145, "learning_rate": 4.1835931903640046e-05, "epoch": 0.30012004801920766, "percentage": 30.01, "elapsed_time": "8:39:44", "remaining_time": "20:12:01", "throughput": 1641.85, "total_tokens": 51200000} -{"current_steps": 6260, "total_steps": 20825, "loss": 0.9712, "learning_rate": 4.180662446341511e-05, "epoch": 0.3006002400960384, "percentage": 30.06, "elapsed_time": "8:40:37", "remaining_time": "20:11:19", "throughput": 1641.68, "total_tokens": 51281920} -{"current_steps": 6270, "total_steps": 20825, "loss": 0.9031, "learning_rate": 4.1777274819176154e-05, "epoch": 0.3010804321728692, "percentage": 30.11, "elapsed_time": "8:41:30", "remaining_time": "20:10:36", "throughput": 1641.52, "total_tokens": 51363840} -{"current_steps": 6280, "total_steps": 20825, "loss": 0.9543, "learning_rate": 4.1747883044624644e-05, "epoch": 0.30156062424969987, "percentage": 30.16, "elapsed_time": "8:42:23", "remaining_time": "20:09:55", "throughput": 1641.33, "total_tokens": 51445760} -{"current_steps": 6290, "total_steps": 20825, "loss": 1.0411, "learning_rate": 4.171844921356784e-05, "epoch": 0.3020408163265306, "percentage": 30.2, "elapsed_time": "8:43:17", "remaining_time": "20:09:13", "throughput": 1641.15, "total_tokens": 51527680} -{"current_steps": 6300, "total_steps": 20825, "loss": 1.0103, "learning_rate": 4.168897339991861e-05, "epoch": 0.3025210084033613, "percentage": 30.25, "elapsed_time": "8:44:10", "remaining_time": "20:08:30", "throughput": 1640.98, "total_tokens": 51609600} -{"current_steps": 6310, "total_steps": 20825, "loss": 1.0368, "learning_rate": 4.1659455677695245e-05, "epoch": 0.3030012004801921, "percentage": 30.3, "elapsed_time": "8:45:03", "remaining_time": "20:07:48", "throughput": 1640.8, "total_tokens": 51691520} -{"current_steps": 6320, "total_steps": 20825, "loss": 0.6589, "learning_rate": 4.162989612102128e-05, "epoch": 0.30348139255702283, "percentage": 30.35, "elapsed_time": "8:45:57", "remaining_time": "20:07:08", "throughput": 1640.59, "total_tokens": 51773440} -{"current_steps": 6330, "total_steps": 20825, "loss": 0.9936, "learning_rate": 4.160029480412529e-05, "epoch": 0.30396158463385353, "percentage": 30.4, "elapsed_time": "8:46:50", "remaining_time": "20:06:25", "throughput": 1640.44, "total_tokens": 51855360} -{"current_steps": 6340, "total_steps": 20825, "loss": 0.8154, "learning_rate": 4.1570651801340735e-05, "epoch": 0.3044417767106843, "percentage": 30.44, "elapsed_time": "8:47:43", "remaining_time": "20:05:42", "throughput": 1640.27, "total_tokens": 51937280} -{"current_steps": 6350, "total_steps": 20825, "loss": 1.0798, "learning_rate": 4.1540967187105753e-05, "epoch": 0.304921968787515, "percentage": 30.49, "elapsed_time": "8:48:36", "remaining_time": "20:04:59", "throughput": 1640.11, "total_tokens": 52019200} -{"current_steps": 6360, "total_steps": 20825, "loss": 0.8155, "learning_rate": 4.151124103596295e-05, "epoch": 0.30540216086434574, "percentage": 30.54, "elapsed_time": "8:49:29", "remaining_time": "20:04:16", "throughput": 1639.95, "total_tokens": 52101120} -{"current_steps": 6370, "total_steps": 20825, "loss": 0.9705, "learning_rate": 4.148147342255926e-05, "epoch": 0.3058823529411765, "percentage": 30.59, "elapsed_time": "8:50:23", "remaining_time": "20:03:34", "throughput": 1639.77, "total_tokens": 52183040} -{"current_steps": 6380, "total_steps": 20825, "loss": 0.849, "learning_rate": 4.145166442164573e-05, "epoch": 0.3063625450180072, "percentage": 30.64, "elapsed_time": "8:51:16", "remaining_time": "20:02:52", "throughput": 1639.6, "total_tokens": 52264960} -{"current_steps": 6390, "total_steps": 20825, "loss": 0.9561, "learning_rate": 4.142181410807735e-05, "epoch": 0.30684273709483795, "percentage": 30.68, "elapsed_time": "8:52:09", "remaining_time": "20:02:09", "throughput": 1639.44, "total_tokens": 52346880} -{"current_steps": 6400, "total_steps": 20825, "loss": 0.9117, "learning_rate": 4.1391922556812815e-05, "epoch": 0.30732292917166865, "percentage": 30.73, "elapsed_time": "8:53:02", "remaining_time": "20:01:26", "throughput": 1639.27, "total_tokens": 52428800} -{"current_steps": 6410, "total_steps": 20825, "loss": 0.8657, "learning_rate": 4.136198984291442e-05, "epoch": 0.3078031212484994, "percentage": 30.78, "elapsed_time": "8:53:56", "remaining_time": "20:00:44", "throughput": 1639.1, "total_tokens": 52510720} -{"current_steps": 6420, "total_steps": 20825, "loss": 0.9356, "learning_rate": 4.133201604154779e-05, "epoch": 0.30828331332533015, "percentage": 30.83, "elapsed_time": "8:54:50", "remaining_time": "20:00:02", "throughput": 1638.91, "total_tokens": 52592640} -{"current_steps": 6430, "total_steps": 20825, "loss": 1.0838, "learning_rate": 4.1302001227981765e-05, "epoch": 0.30876350540216085, "percentage": 30.88, "elapsed_time": "8:55:43", "remaining_time": "19:59:20", "throughput": 1638.72, "total_tokens": 52674560} -{"current_steps": 6440, "total_steps": 20825, "loss": 0.7471, "learning_rate": 4.1271945477588126e-05, "epoch": 0.3092436974789916, "percentage": 30.92, "elapsed_time": "8:56:37", "remaining_time": "19:58:39", "throughput": 1638.53, "total_tokens": 52756480} -{"current_steps": 6450, "total_steps": 20825, "loss": 0.9374, "learning_rate": 4.124184886584148e-05, "epoch": 0.3097238895558223, "percentage": 30.97, "elapsed_time": "8:57:31", "remaining_time": "19:57:57", "throughput": 1638.35, "total_tokens": 52838400} -{"current_steps": 6460, "total_steps": 20825, "loss": 1.0186, "learning_rate": 4.121171146831905e-05, "epoch": 0.31020408163265306, "percentage": 31.02, "elapsed_time": "8:58:24", "remaining_time": "19:57:14", "throughput": 1638.17, "total_tokens": 52920320} -{"current_steps": 6470, "total_steps": 20825, "loss": 1.1422, "learning_rate": 4.118153336070045e-05, "epoch": 0.3106842737094838, "percentage": 31.07, "elapsed_time": "8:59:18", "remaining_time": "19:56:33", "throughput": 1637.97, "total_tokens": 53002240} -{"current_steps": 6480, "total_steps": 20825, "loss": 1.0219, "learning_rate": 4.115131461876756e-05, "epoch": 0.3111644657863145, "percentage": 31.12, "elapsed_time": "9:00:11", "remaining_time": "19:55:51", "throughput": 1637.8, "total_tokens": 53084160} -{"current_steps": 6490, "total_steps": 20825, "loss": 0.9806, "learning_rate": 4.1121055318404264e-05, "epoch": 0.31164465786314527, "percentage": 31.16, "elapsed_time": "9:01:05", "remaining_time": "19:55:08", "throughput": 1637.64, "total_tokens": 53166080} -{"current_steps": 6500, "total_steps": 20825, "loss": 1.1074, "learning_rate": 4.109075553559633e-05, "epoch": 0.31212484993997597, "percentage": 31.21, "elapsed_time": "9:01:58", "remaining_time": "19:54:25", "throughput": 1637.48, "total_tokens": 53248000} -{"current_steps": 6510, "total_steps": 20825, "loss": 0.93, "learning_rate": 4.1060415346431134e-05, "epoch": 0.3126050420168067, "percentage": 31.26, "elapsed_time": "9:02:51", "remaining_time": "19:53:42", "throughput": 1637.32, "total_tokens": 53329920} -{"current_steps": 6520, "total_steps": 20825, "loss": 0.9669, "learning_rate": 4.103003482709758e-05, "epoch": 0.3130852340936375, "percentage": 31.31, "elapsed_time": "9:03:44", "remaining_time": "19:52:59", "throughput": 1637.15, "total_tokens": 53411840} -{"current_steps": 6530, "total_steps": 20825, "loss": 0.7738, "learning_rate": 4.0999614053885795e-05, "epoch": 0.3135654261704682, "percentage": 31.36, "elapsed_time": "9:04:38", "remaining_time": "19:52:17", "throughput": 1636.97, "total_tokens": 53493760} -{"current_steps": 6540, "total_steps": 20825, "loss": 0.8493, "learning_rate": 4.096915310318702e-05, "epoch": 0.31404561824729893, "percentage": 31.4, "elapsed_time": "9:05:31", "remaining_time": "19:51:33", "throughput": 1636.82, "total_tokens": 53575680} -{"current_steps": 6550, "total_steps": 20825, "loss": 0.9464, "learning_rate": 4.093865205149337e-05, "epoch": 0.31452581032412963, "percentage": 31.45, "elapsed_time": "9:06:24", "remaining_time": "19:50:50", "throughput": 1636.67, "total_tokens": 53657600} -{"current_steps": 6560, "total_steps": 20825, "loss": 0.7853, "learning_rate": 4.090811097539768e-05, "epoch": 0.3150060024009604, "percentage": 31.5, "elapsed_time": "9:07:18", "remaining_time": "19:50:08", "throughput": 1636.49, "total_tokens": 53739520} -{"current_steps": 6570, "total_steps": 20825, "loss": 0.764, "learning_rate": 4.087752995159327e-05, "epoch": 0.31548619447779114, "percentage": 31.55, "elapsed_time": "9:08:11", "remaining_time": "19:49:25", "throughput": 1636.32, "total_tokens": 53821440} -{"current_steps": 6580, "total_steps": 20825, "loss": 0.9871, "learning_rate": 4.084690905687379e-05, "epoch": 0.31596638655462184, "percentage": 31.6, "elapsed_time": "9:09:04", "remaining_time": "19:48:42", "throughput": 1636.17, "total_tokens": 53903360} -{"current_steps": 6590, "total_steps": 20825, "loss": 1.1464, "learning_rate": 4.0816248368133016e-05, "epoch": 0.3164465786314526, "percentage": 31.64, "elapsed_time": "9:09:58", "remaining_time": "19:47:59", "throughput": 1635.99, "total_tokens": 53985280} -{"current_steps": 6600, "total_steps": 20825, "loss": 0.7681, "learning_rate": 4.078554796236462e-05, "epoch": 0.3169267707082833, "percentage": 31.69, "elapsed_time": "9:10:51", "remaining_time": "19:47:15", "throughput": 1635.86, "total_tokens": 54067200} -{"current_steps": 6610, "total_steps": 20825, "loss": 1.0146, "learning_rate": 4.0754807916662055e-05, "epoch": 0.31740696278511404, "percentage": 31.74, "elapsed_time": "9:11:44", "remaining_time": "19:46:32", "throughput": 1635.7, "total_tokens": 54149120} -{"current_steps": 6620, "total_steps": 20825, "loss": 0.9229, "learning_rate": 4.072402830821829e-05, "epoch": 0.3178871548619448, "percentage": 31.79, "elapsed_time": "9:12:38", "remaining_time": "19:45:50", "throughput": 1635.52, "total_tokens": 54231040} -{"current_steps": 6630, "total_steps": 20825, "loss": 0.9067, "learning_rate": 4.069320921432564e-05, "epoch": 0.3183673469387755, "percentage": 31.84, "elapsed_time": "9:13:31", "remaining_time": "19:45:06", "throughput": 1635.37, "total_tokens": 54312960} -{"current_steps": 6640, "total_steps": 20825, "loss": 0.8371, "learning_rate": 4.066235071237559e-05, "epoch": 0.31884753901560625, "percentage": 31.88, "elapsed_time": "9:14:24", "remaining_time": "19:44:22", "throughput": 1635.22, "total_tokens": 54394880} -{"current_steps": 6650, "total_steps": 20825, "loss": 0.9809, "learning_rate": 4.0631452879858565e-05, "epoch": 0.31932773109243695, "percentage": 31.93, "elapsed_time": "9:15:17", "remaining_time": "19:43:39", "throughput": 1635.07, "total_tokens": 54476800} -{"current_steps": 6660, "total_steps": 20825, "loss": 0.9101, "learning_rate": 4.0600515794363774e-05, "epoch": 0.3198079231692677, "percentage": 31.98, "elapsed_time": "9:16:10", "remaining_time": "19:42:55", "throughput": 1634.93, "total_tokens": 54558720} -{"current_steps": 6670, "total_steps": 20825, "loss": 0.9802, "learning_rate": 4.0569539533578985e-05, "epoch": 0.32028811524609846, "percentage": 32.03, "elapsed_time": "9:17:04", "remaining_time": "19:42:12", "throughput": 1634.77, "total_tokens": 54640640} -{"current_steps": 6680, "total_steps": 20825, "loss": 0.7294, "learning_rate": 4.053852417529035e-05, "epoch": 0.32076830732292916, "percentage": 32.08, "elapsed_time": "9:17:57", "remaining_time": "19:41:29", "throughput": 1634.59, "total_tokens": 54722560} -{"current_steps": 6690, "total_steps": 20825, "loss": 0.9096, "learning_rate": 4.050746979738218e-05, "epoch": 0.3212484993997599, "percentage": 32.12, "elapsed_time": "9:18:51", "remaining_time": "19:40:46", "throughput": 1634.44, "total_tokens": 54804480} -{"current_steps": 6700, "total_steps": 20825, "loss": 1.0167, "learning_rate": 4.047637647783681e-05, "epoch": 0.3217286914765906, "percentage": 32.17, "elapsed_time": "9:19:44", "remaining_time": "19:40:02", "throughput": 1634.28, "total_tokens": 54886400} -{"current_steps": 6710, "total_steps": 20825, "loss": 0.8882, "learning_rate": 4.044524429473431e-05, "epoch": 0.32220888355342137, "percentage": 32.22, "elapsed_time": "9:20:37", "remaining_time": "19:39:19", "throughput": 1634.12, "total_tokens": 54968320} -{"current_steps": 6720, "total_steps": 20825, "loss": 0.8349, "learning_rate": 4.041407332625238e-05, "epoch": 0.3226890756302521, "percentage": 32.27, "elapsed_time": "9:21:30", "remaining_time": "19:38:35", "throughput": 1633.98, "total_tokens": 55050240} -{"current_steps": 6730, "total_steps": 20825, "loss": 0.8427, "learning_rate": 4.038286365066613e-05, "epoch": 0.3231692677070828, "percentage": 32.32, "elapsed_time": "9:22:24", "remaining_time": "19:37:52", "throughput": 1633.82, "total_tokens": 55132160} -{"current_steps": 6740, "total_steps": 20825, "loss": 0.9561, "learning_rate": 4.0351615346347804e-05, "epoch": 0.3236494597839136, "percentage": 32.36, "elapsed_time": "9:23:17", "remaining_time": "19:37:09", "throughput": 1633.66, "total_tokens": 55214080} -{"current_steps": 6750, "total_steps": 20825, "loss": 0.9102, "learning_rate": 4.032032849176673e-05, "epoch": 0.3241296518607443, "percentage": 32.41, "elapsed_time": "9:24:10", "remaining_time": "19:36:25", "throughput": 1633.51, "total_tokens": 55296000} -{"current_steps": 6760, "total_steps": 20825, "loss": 0.8668, "learning_rate": 4.0289003165488976e-05, "epoch": 0.324609843937575, "percentage": 32.46, "elapsed_time": "9:25:03", "remaining_time": "19:35:41", "throughput": 1633.38, "total_tokens": 55377920} -{"current_steps": 6770, "total_steps": 20825, "loss": 0.9355, "learning_rate": 4.025763944617727e-05, "epoch": 0.3250900360144058, "percentage": 32.51, "elapsed_time": "9:25:57", "remaining_time": "19:34:57", "throughput": 1633.22, "total_tokens": 55459840} -{"current_steps": 6780, "total_steps": 20825, "loss": 0.9062, "learning_rate": 4.0226237412590696e-05, "epoch": 0.3255702280912365, "percentage": 32.56, "elapsed_time": "9:26:50", "remaining_time": "19:34:14", "throughput": 1633.07, "total_tokens": 55541760} -{"current_steps": 6790, "total_steps": 20825, "loss": 0.8195, "learning_rate": 4.019479714358461e-05, "epoch": 0.32605042016806723, "percentage": 32.61, "elapsed_time": "9:27:44", "remaining_time": "19:33:30", "throughput": 1632.92, "total_tokens": 55623680} -{"current_steps": 6800, "total_steps": 20825, "loss": 0.7515, "learning_rate": 4.016331871811033e-05, "epoch": 0.32653061224489793, "percentage": 32.65, "elapsed_time": "9:28:37", "remaining_time": "19:32:47", "throughput": 1632.76, "total_tokens": 55705600} -{"current_steps": 6810, "total_steps": 20825, "loss": 1.0522, "learning_rate": 4.0131802215215025e-05, "epoch": 0.3270108043217287, "percentage": 32.7, "elapsed_time": "9:29:30", "remaining_time": "19:32:03", "throughput": 1632.62, "total_tokens": 55787520} -{"current_steps": 6820, "total_steps": 20825, "loss": 0.9683, "learning_rate": 4.010024771404147e-05, "epoch": 0.32749099639855944, "percentage": 32.75, "elapsed_time": "9:30:23", "remaining_time": "19:31:18", "throughput": 1632.48, "total_tokens": 55869440} -{"current_steps": 6830, "total_steps": 20825, "loss": 0.8884, "learning_rate": 4.006865529382787e-05, "epoch": 0.32797118847539014, "percentage": 32.8, "elapsed_time": "9:31:17", "remaining_time": "19:30:36", "throughput": 1632.31, "total_tokens": 55951360} -{"current_steps": 6840, "total_steps": 20825, "loss": 0.9416, "learning_rate": 4.0037025033907635e-05, "epoch": 0.3284513805522209, "percentage": 32.85, "elapsed_time": "9:32:10", "remaining_time": "19:29:51", "throughput": 1632.17, "total_tokens": 56033280} -{"current_steps": 6850, "total_steps": 20825, "loss": 0.9646, "learning_rate": 4.000535701370921e-05, "epoch": 0.3289315726290516, "percentage": 32.89, "elapsed_time": "9:33:03", "remaining_time": "19:29:07", "throughput": 1632.03, "total_tokens": 56115200} -{"current_steps": 6860, "total_steps": 20825, "loss": 0.9449, "learning_rate": 3.997365131275584e-05, "epoch": 0.32941176470588235, "percentage": 32.94, "elapsed_time": "9:33:56", "remaining_time": "19:28:23", "throughput": 1631.88, "total_tokens": 56197120} -{"current_steps": 6870, "total_steps": 20825, "loss": 1.1115, "learning_rate": 3.994190801066542e-05, "epoch": 0.3298919567827131, "percentage": 32.99, "elapsed_time": "9:34:50", "remaining_time": "19:27:40", "throughput": 1631.72, "total_tokens": 56279040} -{"current_steps": 6880, "total_steps": 20825, "loss": 0.996, "learning_rate": 3.9910127187150246e-05, "epoch": 0.3303721488595438, "percentage": 33.04, "elapsed_time": "9:35:43", "remaining_time": "19:26:56", "throughput": 1631.58, "total_tokens": 56360960} -{"current_steps": 6890, "total_steps": 20825, "loss": 0.887, "learning_rate": 3.9878308922016846e-05, "epoch": 0.33085234093637456, "percentage": 33.09, "elapsed_time": "9:36:36", "remaining_time": "19:26:12", "throughput": 1631.44, "total_tokens": 56442880} -{"current_steps": 6900, "total_steps": 20825, "loss": 0.803, "learning_rate": 3.984645329516578e-05, "epoch": 0.33133253301320525, "percentage": 33.13, "elapsed_time": "9:37:30", "remaining_time": "19:25:28", "throughput": 1631.3, "total_tokens": 56524800} -{"current_steps": 6910, "total_steps": 20825, "loss": 0.9339, "learning_rate": 3.98145603865914e-05, "epoch": 0.331812725090036, "percentage": 33.18, "elapsed_time": "9:38:23", "remaining_time": "19:24:43", "throughput": 1631.17, "total_tokens": 56606720} -{"current_steps": 6920, "total_steps": 20825, "loss": 1.0942, "learning_rate": 3.978263027638171e-05, "epoch": 0.33229291716686676, "percentage": 33.23, "elapsed_time": "9:39:16", "remaining_time": "19:23:59", "throughput": 1631.02, "total_tokens": 56688640} -{"current_steps": 6930, "total_steps": 20825, "loss": 0.9728, "learning_rate": 3.975066304471811e-05, "epoch": 0.33277310924369746, "percentage": 33.28, "elapsed_time": "9:40:09", "remaining_time": "19:23:15", "throughput": 1630.88, "total_tokens": 56770560} -{"current_steps": 6940, "total_steps": 20825, "loss": 0.8131, "learning_rate": 3.971865877187523e-05, "epoch": 0.3332533013205282, "percentage": 33.33, "elapsed_time": "9:41:03", "remaining_time": "19:22:31", "throughput": 1630.73, "total_tokens": 56852480} -{"current_steps": 6950, "total_steps": 20825, "loss": 0.8142, "learning_rate": 3.968661753822071e-05, "epoch": 0.33373349339735897, "percentage": 33.37, "elapsed_time": "9:41:56", "remaining_time": "19:21:46", "throughput": 1630.6, "total_tokens": 56934400} -{"current_steps": 6960, "total_steps": 20825, "loss": 0.9086, "learning_rate": 3.9654539424214996e-05, "epoch": 0.33421368547418967, "percentage": 33.42, "elapsed_time": "9:42:49", "remaining_time": "19:21:02", "throughput": 1630.47, "total_tokens": 57016320} -{"current_steps": 6970, "total_steps": 20825, "loss": 0.8183, "learning_rate": 3.962242451041118e-05, "epoch": 0.3346938775510204, "percentage": 33.47, "elapsed_time": "9:43:42", "remaining_time": "19:20:18", "throughput": 1630.32, "total_tokens": 57098240} -{"current_steps": 6980, "total_steps": 20825, "loss": 0.9817, "learning_rate": 3.9590272877454714e-05, "epoch": 0.3351740696278511, "percentage": 33.52, "elapsed_time": "9:44:36", "remaining_time": "19:19:34", "throughput": 1630.18, "total_tokens": 57180160} -{"current_steps": 6990, "total_steps": 20825, "loss": 1.0946, "learning_rate": 3.955808460608331e-05, "epoch": 0.3356542617046819, "percentage": 33.57, "elapsed_time": "9:45:29", "remaining_time": "19:18:49", "throughput": 1630.04, "total_tokens": 57262080} -{"current_steps": 7000, "total_steps": 20825, "loss": 1.0473, "learning_rate": 3.952585977712664e-05, "epoch": 0.33613445378151263, "percentage": 33.61, "elapsed_time": "9:46:22", "remaining_time": "19:18:06", "throughput": 1629.88, "total_tokens": 57344000} -{"current_steps": 7010, "total_steps": 20825, "loss": 0.9402, "learning_rate": 3.94935984715062e-05, "epoch": 0.33661464585834333, "percentage": 33.66, "elapsed_time": "9:47:21", "remaining_time": "19:17:32", "throughput": 1629.49, "total_tokens": 57425920} -{"current_steps": 7020, "total_steps": 20825, "loss": 0.678, "learning_rate": 3.9461300770235093e-05, "epoch": 0.3370948379351741, "percentage": 33.71, "elapsed_time": "9:48:15", "remaining_time": "19:16:48", "throughput": 1629.34, "total_tokens": 57507840} -{"current_steps": 7030, "total_steps": 20825, "loss": 0.9907, "learning_rate": 3.942896675441779e-05, "epoch": 0.3375750300120048, "percentage": 33.76, "elapsed_time": "9:49:08", "remaining_time": "19:16:04", "throughput": 1629.2, "total_tokens": 57589760} -{"current_steps": 7040, "total_steps": 20825, "loss": 0.9791, "learning_rate": 3.939659650524997e-05, "epoch": 0.33805522208883554, "percentage": 33.81, "elapsed_time": "9:50:01", "remaining_time": "19:15:19", "throughput": 1629.07, "total_tokens": 57671680} -{"current_steps": 7050, "total_steps": 20825, "loss": 0.8087, "learning_rate": 3.9364190104018307e-05, "epoch": 0.3385354141656663, "percentage": 33.85, "elapsed_time": "9:50:54", "remaining_time": "19:14:35", "throughput": 1628.94, "total_tokens": 57753600} -{"current_steps": 7060, "total_steps": 20825, "loss": 0.9574, "learning_rate": 3.933174763210024e-05, "epoch": 0.339015606242497, "percentage": 33.9, "elapsed_time": "9:51:47", "remaining_time": "19:13:50", "throughput": 1628.8, "total_tokens": 57835520} -{"current_steps": 7070, "total_steps": 20825, "loss": 0.866, "learning_rate": 3.9299269170963795e-05, "epoch": 0.33949579831932775, "percentage": 33.95, "elapsed_time": "9:52:41", "remaining_time": "19:13:05", "throughput": 1628.67, "total_tokens": 57917440} -{"current_steps": 7080, "total_steps": 20825, "loss": 0.9768, "learning_rate": 3.926675480216738e-05, "epoch": 0.33997599039615845, "percentage": 34.0, "elapsed_time": "9:53:34", "remaining_time": "19:12:21", "throughput": 1628.53, "total_tokens": 57999360} -{"current_steps": 7090, "total_steps": 20825, "loss": 0.9659, "learning_rate": 3.923420460735957e-05, "epoch": 0.3404561824729892, "percentage": 34.05, "elapsed_time": "9:54:27", "remaining_time": "19:11:37", "throughput": 1628.39, "total_tokens": 58081280} -{"current_steps": 7100, "total_steps": 20825, "loss": 0.7939, "learning_rate": 3.920161866827889e-05, "epoch": 0.34093637454981995, "percentage": 34.09, "elapsed_time": "9:55:20", "remaining_time": "19:10:52", "throughput": 1628.27, "total_tokens": 58163200} -{"current_steps": 7110, "total_steps": 20825, "loss": 1.1513, "learning_rate": 3.916899706675365e-05, "epoch": 0.34141656662665065, "percentage": 34.14, "elapsed_time": "9:56:14", "remaining_time": "19:10:07", "throughput": 1628.13, "total_tokens": 58245120} -{"current_steps": 7120, "total_steps": 20825, "loss": 1.0614, "learning_rate": 3.913633988470169e-05, "epoch": 0.3418967587034814, "percentage": 34.19, "elapsed_time": "9:57:07", "remaining_time": "19:09:22", "throughput": 1628.0, "total_tokens": 58327040} -{"current_steps": 7130, "total_steps": 20825, "loss": 1.0288, "learning_rate": 3.91036472041302e-05, "epoch": 0.3423769507803121, "percentage": 34.24, "elapsed_time": "9:58:01", "remaining_time": "19:08:40", "throughput": 1627.82, "total_tokens": 58408960} -{"current_steps": 7140, "total_steps": 20825, "loss": 0.9384, "learning_rate": 3.907091910713553e-05, "epoch": 0.34285714285714286, "percentage": 34.29, "elapsed_time": "9:58:55", "remaining_time": "19:07:55", "throughput": 1627.68, "total_tokens": 58490880} -{"current_steps": 7150, "total_steps": 20825, "loss": 0.9873, "learning_rate": 3.9038155675902956e-05, "epoch": 0.3433373349339736, "percentage": 34.33, "elapsed_time": "9:59:48", "remaining_time": "19:07:11", "throughput": 1627.54, "total_tokens": 58572800} -{"current_steps": 7160, "total_steps": 20825, "loss": 0.9565, "learning_rate": 3.900535699270647e-05, "epoch": 0.3438175270108043, "percentage": 34.38, "elapsed_time": "10:00:41", "remaining_time": "19:06:26", "throughput": 1627.41, "total_tokens": 58654720} -{"current_steps": 7170, "total_steps": 20825, "loss": 0.9251, "learning_rate": 3.8972523139908616e-05, "epoch": 0.34429771908763507, "percentage": 34.43, "elapsed_time": "10:01:35", "remaining_time": "19:05:41", "throughput": 1627.27, "total_tokens": 58736640} -{"current_steps": 7180, "total_steps": 20825, "loss": 0.9024, "learning_rate": 3.8939654199960244e-05, "epoch": 0.34477791116446577, "percentage": 34.48, "elapsed_time": "10:02:28", "remaining_time": "19:04:56", "throughput": 1627.15, "total_tokens": 58818560} -{"current_steps": 7190, "total_steps": 20825, "loss": 0.8464, "learning_rate": 3.890675025540028e-05, "epoch": 0.3452581032412965, "percentage": 34.53, "elapsed_time": "10:03:21", "remaining_time": "19:04:12", "throughput": 1627.0, "total_tokens": 58900480} -{"current_steps": 7200, "total_steps": 20825, "loss": 0.909, "learning_rate": 3.8873811388855605e-05, "epoch": 0.3457382953181273, "percentage": 34.57, "elapsed_time": "10:04:15", "remaining_time": "19:03:28", "throughput": 1626.85, "total_tokens": 58982400} -{"current_steps": 7210, "total_steps": 20825, "loss": 1.0237, "learning_rate": 3.8840837683040766e-05, "epoch": 0.346218487394958, "percentage": 34.62, "elapsed_time": "10:05:08", "remaining_time": "19:02:43", "throughput": 1626.74, "total_tokens": 59064320} -{"current_steps": 7220, "total_steps": 20825, "loss": 0.8262, "learning_rate": 3.880782922075778e-05, "epoch": 0.34669867947178873, "percentage": 34.67, "elapsed_time": "10:06:01", "remaining_time": "19:01:57", "throughput": 1626.62, "total_tokens": 59146240} -{"current_steps": 7230, "total_steps": 20825, "loss": 0.9193, "learning_rate": 3.8774786084896e-05, "epoch": 0.3471788715486194, "percentage": 34.72, "elapsed_time": "10:06:54", "remaining_time": "19:01:12", "throughput": 1626.5, "total_tokens": 59228160} -{"current_steps": 7240, "total_steps": 20825, "loss": 0.8414, "learning_rate": 3.8741708358431774e-05, "epoch": 0.3476590636254502, "percentage": 34.77, "elapsed_time": "10:07:47", "remaining_time": "19:00:27", "throughput": 1626.36, "total_tokens": 59310080} -{"current_steps": 7250, "total_steps": 20825, "loss": 1.138, "learning_rate": 3.870859612442837e-05, "epoch": 0.34813925570228094, "percentage": 34.81, "elapsed_time": "10:08:41", "remaining_time": "18:59:42", "throughput": 1626.24, "total_tokens": 59392000} -{"current_steps": 7260, "total_steps": 20825, "loss": 0.8703, "learning_rate": 3.86754494660357e-05, "epoch": 0.34861944777911164, "percentage": 34.86, "elapsed_time": "10:09:34", "remaining_time": "18:58:58", "throughput": 1626.09, "total_tokens": 59473920} -{"current_steps": 7270, "total_steps": 20825, "loss": 0.8408, "learning_rate": 3.864226846649008e-05, "epoch": 0.3490996398559424, "percentage": 34.91, "elapsed_time": "10:10:28", "remaining_time": "18:58:13", "throughput": 1625.96, "total_tokens": 59555840} -{"current_steps": 7280, "total_steps": 20825, "loss": 0.9104, "learning_rate": 3.860905320911413e-05, "epoch": 0.3495798319327731, "percentage": 34.96, "elapsed_time": "10:11:21", "remaining_time": "18:57:28", "throughput": 1625.83, "total_tokens": 59637760} -{"current_steps": 7290, "total_steps": 20825, "loss": 0.7804, "learning_rate": 3.857580377731644e-05, "epoch": 0.35006002400960384, "percentage": 35.01, "elapsed_time": "10:12:14", "remaining_time": "18:56:43", "throughput": 1625.7, "total_tokens": 59719680} -{"current_steps": 7300, "total_steps": 20825, "loss": 0.868, "learning_rate": 3.854252025459144e-05, "epoch": 0.3505402160864346, "percentage": 35.05, "elapsed_time": "10:13:07", "remaining_time": "18:55:58", "throughput": 1625.58, "total_tokens": 59801600} -{"current_steps": 7310, "total_steps": 20825, "loss": 0.9105, "learning_rate": 3.8509202724519165e-05, "epoch": 0.3510204081632653, "percentage": 35.1, "elapsed_time": "10:14:01", "remaining_time": "18:55:13", "throughput": 1625.45, "total_tokens": 59883520} -{"current_steps": 7320, "total_steps": 20825, "loss": 0.8274, "learning_rate": 3.8475851270765054e-05, "epoch": 0.35150060024009605, "percentage": 35.15, "elapsed_time": "10:14:54", "remaining_time": "18:54:28", "throughput": 1625.31, "total_tokens": 59965440} -{"current_steps": 7330, "total_steps": 20825, "loss": 0.9016, "learning_rate": 3.844246597707972e-05, "epoch": 0.35198079231692675, "percentage": 35.2, "elapsed_time": "10:15:48", "remaining_time": "18:53:44", "throughput": 1625.16, "total_tokens": 60047360} -{"current_steps": 7340, "total_steps": 20825, "loss": 0.8791, "learning_rate": 3.8409046927298755e-05, "epoch": 0.3524609843937575, "percentage": 35.25, "elapsed_time": "10:16:41", "remaining_time": "18:52:59", "throughput": 1625.04, "total_tokens": 60129280} -{"current_steps": 7350, "total_steps": 20825, "loss": 1.1453, "learning_rate": 3.8375594205342534e-05, "epoch": 0.35294117647058826, "percentage": 35.29, "elapsed_time": "10:17:35", "remaining_time": "18:52:14", "throughput": 1624.9, "total_tokens": 60211200} -{"current_steps": 7360, "total_steps": 20825, "loss": 1.0104, "learning_rate": 3.834210789521598e-05, "epoch": 0.35342136854741896, "percentage": 35.34, "elapsed_time": "10:18:28", "remaining_time": "18:51:29", "throughput": 1624.78, "total_tokens": 60293120} -{"current_steps": 7370, "total_steps": 20825, "loss": 1.0196, "learning_rate": 3.830858808100834e-05, "epoch": 0.3539015606242497, "percentage": 35.39, "elapsed_time": "10:19:21", "remaining_time": "18:50:43", "throughput": 1624.67, "total_tokens": 60375040} -{"current_steps": 7380, "total_steps": 20825, "loss": 0.8126, "learning_rate": 3.8275034846893046e-05, "epoch": 0.3543817527010804, "percentage": 35.44, "elapsed_time": "10:20:14", "remaining_time": "18:49:58", "throughput": 1624.55, "total_tokens": 60456960} -{"current_steps": 7390, "total_steps": 20825, "loss": 1.3003, "learning_rate": 3.824144827712738e-05, "epoch": 0.35486194477791116, "percentage": 35.49, "elapsed_time": "10:21:08", "remaining_time": "18:49:13", "throughput": 1624.4, "total_tokens": 60538880} -{"current_steps": 7400, "total_steps": 20825, "loss": 1.0134, "learning_rate": 3.82078284560524e-05, "epoch": 0.3553421368547419, "percentage": 35.53, "elapsed_time": "10:22:01", "remaining_time": "18:48:28", "throughput": 1624.28, "total_tokens": 60620800} -{"current_steps": 7410, "total_steps": 20825, "loss": 0.9036, "learning_rate": 3.817417546809263e-05, "epoch": 0.3558223289315726, "percentage": 35.58, "elapsed_time": "10:22:54", "remaining_time": "18:47:43", "throughput": 1624.16, "total_tokens": 60702720} -{"current_steps": 7420, "total_steps": 20825, "loss": 1.0055, "learning_rate": 3.8140489397755886e-05, "epoch": 0.3563025210084034, "percentage": 35.63, "elapsed_time": "10:23:48", "remaining_time": "18:46:57", "throughput": 1624.03, "total_tokens": 60784640} -{"current_steps": 7430, "total_steps": 20825, "loss": 0.9698, "learning_rate": 3.810677032963307e-05, "epoch": 0.35678271308523407, "percentage": 35.68, "elapsed_time": "10:24:41", "remaining_time": "18:46:13", "throughput": 1623.9, "total_tokens": 60866560} -{"current_steps": 7440, "total_steps": 20825, "loss": 0.8928, "learning_rate": 3.807301834839793e-05, "epoch": 0.3572629051620648, "percentage": 35.73, "elapsed_time": "10:25:34", "remaining_time": "18:45:27", "throughput": 1623.79, "total_tokens": 60948480} -{"current_steps": 7450, "total_steps": 20825, "loss": 0.7671, "learning_rate": 3.803923353880687e-05, "epoch": 0.3577430972388956, "percentage": 35.77, "elapsed_time": "10:26:28", "remaining_time": "18:44:42", "throughput": 1623.66, "total_tokens": 61030400} -{"current_steps": 7460, "total_steps": 20825, "loss": 0.9805, "learning_rate": 3.8005415985698754e-05, "epoch": 0.3582232893157263, "percentage": 35.82, "elapsed_time": "10:27:21", "remaining_time": "18:43:56", "throughput": 1623.55, "total_tokens": 61112320} -{"current_steps": 7470, "total_steps": 20825, "loss": 0.9943, "learning_rate": 3.797156577399462e-05, "epoch": 0.35870348139255703, "percentage": 35.87, "elapsed_time": "10:28:14", "remaining_time": "18:43:10", "throughput": 1623.44, "total_tokens": 61194240} -{"current_steps": 7480, "total_steps": 20825, "loss": 0.8656, "learning_rate": 3.7937682988697566e-05, "epoch": 0.35918367346938773, "percentage": 35.92, "elapsed_time": "10:29:07", "remaining_time": "18:42:24", "throughput": 1623.33, "total_tokens": 61276160} -{"current_steps": 7490, "total_steps": 20825, "loss": 1.0121, "learning_rate": 3.790376771489247e-05, "epoch": 0.3596638655462185, "percentage": 35.97, "elapsed_time": "10:30:00", "remaining_time": "18:41:39", "throughput": 1623.2, "total_tokens": 61358080} -{"current_steps": 7500, "total_steps": 20825, "loss": 0.8441, "learning_rate": 3.7869820037745776e-05, "epoch": 0.36014405762304924, "percentage": 36.01, "elapsed_time": "10:30:53", "remaining_time": "18:40:53", "throughput": 1623.09, "total_tokens": 61440000} -{"current_steps": 7510, "total_steps": 20825, "loss": 0.7604, "learning_rate": 3.783584004250531e-05, "epoch": 0.36062424969987994, "percentage": 36.06, "elapsed_time": "10:31:47", "remaining_time": "18:40:08", "throughput": 1622.97, "total_tokens": 61521920} -{"current_steps": 7520, "total_steps": 20825, "loss": 0.8183, "learning_rate": 3.7801827814500074e-05, "epoch": 0.3611044417767107, "percentage": 36.11, "elapsed_time": "10:32:40", "remaining_time": "18:39:22", "throughput": 1622.85, "total_tokens": 61603840} -{"current_steps": 7530, "total_steps": 20825, "loss": 0.8522, "learning_rate": 3.7767783439139984e-05, "epoch": 0.3615846338535414, "percentage": 36.16, "elapsed_time": "10:33:33", "remaining_time": "18:38:37", "throughput": 1622.73, "total_tokens": 61685760} -{"current_steps": 7540, "total_steps": 20825, "loss": 0.8296, "learning_rate": 3.77337070019157e-05, "epoch": 0.36206482593037215, "percentage": 36.21, "elapsed_time": "10:34:26", "remaining_time": "18:37:51", "throughput": 1622.61, "total_tokens": 61767680} -{"current_steps": 7550, "total_steps": 20825, "loss": 0.9405, "learning_rate": 3.7699598588398364e-05, "epoch": 0.3625450180072029, "percentage": 36.25, "elapsed_time": "10:35:20", "remaining_time": "18:37:05", "throughput": 1622.49, "total_tokens": 61849600} -{"current_steps": 7560, "total_steps": 20825, "loss": 0.9701, "learning_rate": 3.766545828423946e-05, "epoch": 0.3630252100840336, "percentage": 36.3, "elapsed_time": "10:36:13", "remaining_time": "18:36:20", "throughput": 1622.37, "total_tokens": 61931520} -{"current_steps": 7570, "total_steps": 20825, "loss": 0.8598, "learning_rate": 3.7631286175170535e-05, "epoch": 0.36350540216086435, "percentage": 36.35, "elapsed_time": "10:37:06", "remaining_time": "18:35:35", "throughput": 1622.24, "total_tokens": 62013440} -{"current_steps": 7580, "total_steps": 20825, "loss": 1.0999, "learning_rate": 3.7597082347003e-05, "epoch": 0.36398559423769505, "percentage": 36.4, "elapsed_time": "10:38:00", "remaining_time": "18:34:49", "throughput": 1622.11, "total_tokens": 62095360} -{"current_steps": 7590, "total_steps": 20825, "loss": 0.8699, "learning_rate": 3.75628468856279e-05, "epoch": 0.3644657863145258, "percentage": 36.45, "elapsed_time": "10:38:53", "remaining_time": "18:34:04", "throughput": 1622.0, "total_tokens": 62177280} -{"current_steps": 7600, "total_steps": 20825, "loss": 0.8688, "learning_rate": 3.7528579877015746e-05, "epoch": 0.36494597839135656, "percentage": 36.49, "elapsed_time": "10:39:47", "remaining_time": "18:33:18", "throughput": 1621.87, "total_tokens": 62259200} -{"current_steps": 7610, "total_steps": 20825, "loss": 1.0697, "learning_rate": 3.749428140721626e-05, "epoch": 0.36542617046818726, "percentage": 36.54, "elapsed_time": "10:40:40", "remaining_time": "18:32:33", "throughput": 1621.75, "total_tokens": 62341120} -{"current_steps": 7620, "total_steps": 20825, "loss": 0.8349, "learning_rate": 3.745995156235815e-05, "epoch": 0.365906362545018, "percentage": 36.59, "elapsed_time": "10:41:33", "remaining_time": "18:31:47", "throughput": 1621.63, "total_tokens": 62423040} -{"current_steps": 7630, "total_steps": 20825, "loss": 0.9453, "learning_rate": 3.742559042864895e-05, "epoch": 0.3663865546218487, "percentage": 36.64, "elapsed_time": "10:42:27", "remaining_time": "18:31:02", "throughput": 1621.5, "total_tokens": 62504960} -{"current_steps": 7640, "total_steps": 20825, "loss": 1.0237, "learning_rate": 3.7391198092374726e-05, "epoch": 0.36686674669867947, "percentage": 36.69, "elapsed_time": "10:43:20", "remaining_time": "18:30:16", "throughput": 1621.39, "total_tokens": 62586880} -{"current_steps": 7650, "total_steps": 20825, "loss": 0.8499, "learning_rate": 3.7356774639899914e-05, "epoch": 0.3673469387755102, "percentage": 36.73, "elapsed_time": "10:44:13", "remaining_time": "18:29:30", "throughput": 1621.29, "total_tokens": 62668800} -{"current_steps": 7660, "total_steps": 20825, "loss": 0.8653, "learning_rate": 3.7322320157667094e-05, "epoch": 0.3678271308523409, "percentage": 36.78, "elapsed_time": "10:45:06", "remaining_time": "18:28:44", "throughput": 1621.18, "total_tokens": 62750720} -{"current_steps": 7670, "total_steps": 20825, "loss": 0.7981, "learning_rate": 3.728783473219676e-05, "epoch": 0.3683073229291717, "percentage": 36.83, "elapsed_time": "10:46:00", "remaining_time": "18:27:58", "throughput": 1621.06, "total_tokens": 62832640} -{"current_steps": 7680, "total_steps": 20825, "loss": 0.7632, "learning_rate": 3.72533184500871e-05, "epoch": 0.3687875150060024, "percentage": 36.88, "elapsed_time": "10:46:53", "remaining_time": "18:27:12", "throughput": 1620.95, "total_tokens": 62914560} -{"current_steps": 7690, "total_steps": 20825, "loss": 0.9014, "learning_rate": 3.7218771398013807e-05, "epoch": 0.36926770708283313, "percentage": 36.93, "elapsed_time": "10:47:46", "remaining_time": "18:26:27", "throughput": 1620.83, "total_tokens": 62996480} -{"current_steps": 7700, "total_steps": 20825, "loss": 0.828, "learning_rate": 3.718419366272982e-05, "epoch": 0.3697478991596639, "percentage": 36.97, "elapsed_time": "10:48:40", "remaining_time": "18:25:41", "throughput": 1620.72, "total_tokens": 63078400} -{"current_steps": 7710, "total_steps": 20825, "loss": 0.7715, "learning_rate": 3.714958533106515e-05, "epoch": 0.3702280912364946, "percentage": 37.02, "elapsed_time": "10:49:33", "remaining_time": "18:24:55", "throughput": 1620.6, "total_tokens": 63160320} -{"current_steps": 7720, "total_steps": 20825, "loss": 0.9035, "learning_rate": 3.7114946489926633e-05, "epoch": 0.37070828331332534, "percentage": 37.07, "elapsed_time": "10:50:26", "remaining_time": "18:24:09", "throughput": 1620.49, "total_tokens": 63242240} -{"current_steps": 7730, "total_steps": 20825, "loss": 1.0931, "learning_rate": 3.708027722629772e-05, "epoch": 0.37118847539015604, "percentage": 37.12, "elapsed_time": "10:51:20", "remaining_time": "18:23:23", "throughput": 1620.36, "total_tokens": 63324160} -{"current_steps": 7740, "total_steps": 20825, "loss": 0.8443, "learning_rate": 3.704557762723823e-05, "epoch": 0.3716686674669868, "percentage": 37.17, "elapsed_time": "10:52:13", "remaining_time": "18:22:37", "throughput": 1620.26, "total_tokens": 63406080} -{"current_steps": 7750, "total_steps": 20825, "loss": 0.9003, "learning_rate": 3.7010847779884204e-05, "epoch": 0.37214885954381755, "percentage": 37.21, "elapsed_time": "10:53:06", "remaining_time": "18:21:51", "throughput": 1620.14, "total_tokens": 63488000} -{"current_steps": 7760, "total_steps": 20825, "loss": 0.9216, "learning_rate": 3.697608777144762e-05, "epoch": 0.37262905162064824, "percentage": 37.26, "elapsed_time": "10:54:00", "remaining_time": "18:21:05", "throughput": 1620.02, "total_tokens": 63569920} -{"current_steps": 7770, "total_steps": 20825, "loss": 0.966, "learning_rate": 3.694129768921619e-05, "epoch": 0.373109243697479, "percentage": 37.31, "elapsed_time": "10:54:53", "remaining_time": "18:20:20", "throughput": 1619.89, "total_tokens": 63651840} -{"current_steps": 7780, "total_steps": 20825, "loss": 0.947, "learning_rate": 3.6906477620553156e-05, "epoch": 0.3735894357743097, "percentage": 37.36, "elapsed_time": "10:55:47", "remaining_time": "18:19:35", "throughput": 1619.77, "total_tokens": 63733760} -{"current_steps": 7790, "total_steps": 20825, "loss": 0.9151, "learning_rate": 3.687162765289704e-05, "epoch": 0.37406962785114045, "percentage": 37.41, "elapsed_time": "10:56:40", "remaining_time": "18:18:49", "throughput": 1619.66, "total_tokens": 63815680} -{"current_steps": 7800, "total_steps": 20825, "loss": 0.8509, "learning_rate": 3.683674787376148e-05, "epoch": 0.3745498199279712, "percentage": 37.45, "elapsed_time": "10:57:33", "remaining_time": "18:18:02", "throughput": 1619.55, "total_tokens": 63897600} -{"current_steps": 7810, "total_steps": 20825, "loss": 0.7108, "learning_rate": 3.6801838370734945e-05, "epoch": 0.3750300120048019, "percentage": 37.5, "elapsed_time": "10:58:27", "remaining_time": "18:17:17", "throughput": 1619.44, "total_tokens": 63979520} -{"current_steps": 7820, "total_steps": 20825, "loss": 0.8534, "learning_rate": 3.676689923148056e-05, "epoch": 0.37551020408163266, "percentage": 37.55, "elapsed_time": "10:59:20", "remaining_time": "18:16:31", "throughput": 1619.32, "total_tokens": 64061440} -{"current_steps": 7830, "total_steps": 20825, "loss": 0.9249, "learning_rate": 3.673193054373587e-05, "epoch": 0.37599039615846336, "percentage": 37.6, "elapsed_time": "11:00:14", "remaining_time": "18:15:45", "throughput": 1619.2, "total_tokens": 64143360} -{"current_steps": 7840, "total_steps": 20825, "loss": 0.945, "learning_rate": 3.6696932395312606e-05, "epoch": 0.3764705882352941, "percentage": 37.65, "elapsed_time": "11:01:07", "remaining_time": "18:14:59", "throughput": 1619.08, "total_tokens": 64225280} -{"current_steps": 7850, "total_steps": 20825, "loss": 0.8673, "learning_rate": 3.6661904874096503e-05, "epoch": 0.37695078031212487, "percentage": 37.7, "elapsed_time": "11:02:01", "remaining_time": "18:14:13", "throughput": 1618.97, "total_tokens": 64307200} -{"current_steps": 7860, "total_steps": 20825, "loss": 0.817, "learning_rate": 3.662684806804704e-05, "epoch": 0.37743097238895557, "percentage": 37.74, "elapsed_time": "11:02:54", "remaining_time": "18:13:27", "throughput": 1618.86, "total_tokens": 64389120} -{"current_steps": 7870, "total_steps": 20825, "loss": 0.9525, "learning_rate": 3.659176206519724e-05, "epoch": 0.3779111644657863, "percentage": 37.79, "elapsed_time": "11:03:47", "remaining_time": "18:12:41", "throughput": 1618.76, "total_tokens": 64471040} -{"current_steps": 7880, "total_steps": 20825, "loss": 0.8771, "learning_rate": 3.655664695365344e-05, "epoch": 0.3783913565426171, "percentage": 37.84, "elapsed_time": "11:04:40", "remaining_time": "18:11:54", "throughput": 1618.66, "total_tokens": 64552960} -{"current_steps": 7890, "total_steps": 20825, "loss": 0.895, "learning_rate": 3.652150282159507e-05, "epoch": 0.3788715486194478, "percentage": 37.89, "elapsed_time": "11:05:33", "remaining_time": "18:11:08", "throughput": 1618.55, "total_tokens": 64634880} -{"current_steps": 7900, "total_steps": 20825, "loss": 0.8366, "learning_rate": 3.6486329757274454e-05, "epoch": 0.3793517406962785, "percentage": 37.94, "elapsed_time": "11:06:27", "remaining_time": "18:10:22", "throughput": 1618.43, "total_tokens": 64716800} -{"current_steps": 7910, "total_steps": 20825, "loss": 0.9177, "learning_rate": 3.645112784901655e-05, "epoch": 0.3798319327731092, "percentage": 37.98, "elapsed_time": "11:07:20", "remaining_time": "18:09:36", "throughput": 1618.32, "total_tokens": 64798720} -{"current_steps": 7920, "total_steps": 20825, "loss": 0.8592, "learning_rate": 3.641589718521875e-05, "epoch": 0.38031212484994, "percentage": 38.03, "elapsed_time": "11:08:14", "remaining_time": "18:08:50", "throughput": 1618.2, "total_tokens": 64880640} -{"current_steps": 7930, "total_steps": 20825, "loss": 0.9027, "learning_rate": 3.6380637854350665e-05, "epoch": 0.38079231692677074, "percentage": 38.08, "elapsed_time": "11:09:07", "remaining_time": "18:08:04", "throughput": 1618.08, "total_tokens": 64962560} -{"current_steps": 7940, "total_steps": 20825, "loss": 0.8225, "learning_rate": 3.634534994495387e-05, "epoch": 0.38127250900360143, "percentage": 38.13, "elapsed_time": "11:10:01", "remaining_time": "18:07:19", "throughput": 1617.95, "total_tokens": 65044480} -{"current_steps": 7950, "total_steps": 20825, "loss": 0.8546, "learning_rate": 3.631003354564175e-05, "epoch": 0.3817527010804322, "percentage": 38.18, "elapsed_time": "11:10:54", "remaining_time": "18:06:32", "throughput": 1617.85, "total_tokens": 65126400} -{"current_steps": 7960, "total_steps": 20825, "loss": 1.0001, "learning_rate": 3.6274688745099194e-05, "epoch": 0.3822328931572629, "percentage": 38.22, "elapsed_time": "11:11:48", "remaining_time": "18:05:46", "throughput": 1617.73, "total_tokens": 65208320} -{"current_steps": 7970, "total_steps": 20825, "loss": 0.9504, "learning_rate": 3.623931563208241e-05, "epoch": 0.38271308523409364, "percentage": 38.27, "elapsed_time": "11:12:41", "remaining_time": "18:05:00", "throughput": 1617.62, "total_tokens": 65290240} -{"current_steps": 7980, "total_steps": 20825, "loss": 0.8261, "learning_rate": 3.620391429541873e-05, "epoch": 0.3831932773109244, "percentage": 38.32, "elapsed_time": "11:13:34", "remaining_time": "18:04:13", "throughput": 1617.52, "total_tokens": 65372160} -{"current_steps": 7990, "total_steps": 20825, "loss": 0.9785, "learning_rate": 3.616848482400634e-05, "epoch": 0.3836734693877551, "percentage": 38.37, "elapsed_time": "11:14:28", "remaining_time": "18:03:27", "throughput": 1617.42, "total_tokens": 65454080} -{"current_steps": 8000, "total_steps": 20825, "loss": 0.9941, "learning_rate": 3.6133027306814085e-05, "epoch": 0.38415366146458585, "percentage": 38.42, "elapsed_time": "11:15:21", "remaining_time": "18:02:40", "throughput": 1617.32, "total_tokens": 65536000} -{"current_steps": 8010, "total_steps": 20825, "loss": 1.0458, "learning_rate": 3.609754183288122e-05, "epoch": 0.38463385354141655, "percentage": 38.46, "elapsed_time": "11:16:19", "remaining_time": "18:02:01", "throughput": 1617.03, "total_tokens": 65617920} -{"current_steps": 8020, "total_steps": 20825, "loss": 0.9985, "learning_rate": 3.606202849131723e-05, "epoch": 0.3851140456182473, "percentage": 38.51, "elapsed_time": "11:17:12", "remaining_time": "18:01:14", "throughput": 1616.94, "total_tokens": 65699840} -{"current_steps": 8030, "total_steps": 20825, "loss": 0.9213, "learning_rate": 3.6026487371301564e-05, "epoch": 0.38559423769507806, "percentage": 38.56, "elapsed_time": "11:18:05", "remaining_time": "18:00:27", "throughput": 1616.84, "total_tokens": 65781760} -{"current_steps": 8040, "total_steps": 20825, "loss": 0.8843, "learning_rate": 3.599091856208343e-05, "epoch": 0.38607442977190876, "percentage": 38.61, "elapsed_time": "11:18:58", "remaining_time": "17:59:40", "throughput": 1616.75, "total_tokens": 65863680} -{"current_steps": 8050, "total_steps": 20825, "loss": 0.9195, "learning_rate": 3.5955322152981575e-05, "epoch": 0.3865546218487395, "percentage": 38.66, "elapsed_time": "11:19:51", "remaining_time": "17:58:54", "throughput": 1616.64, "total_tokens": 65945600} -{"current_steps": 8060, "total_steps": 20825, "loss": 1.0418, "learning_rate": 3.5919698233384034e-05, "epoch": 0.3870348139255702, "percentage": 38.7, "elapsed_time": "11:20:45", "remaining_time": "17:58:08", "throughput": 1616.53, "total_tokens": 66027520} -{"current_steps": 8070, "total_steps": 20825, "loss": 0.8457, "learning_rate": 3.588404689274795e-05, "epoch": 0.38751500600240096, "percentage": 38.75, "elapsed_time": "11:21:38", "remaining_time": "17:57:22", "throughput": 1616.41, "total_tokens": 66109440} -{"current_steps": 8080, "total_steps": 20825, "loss": 0.7761, "learning_rate": 3.58483682205993e-05, "epoch": 0.3879951980792317, "percentage": 38.8, "elapsed_time": "11:22:32", "remaining_time": "17:56:35", "throughput": 1616.31, "total_tokens": 66191360} -{"current_steps": 8090, "total_steps": 20825, "loss": 0.86, "learning_rate": 3.581266230653271e-05, "epoch": 0.3884753901560624, "percentage": 38.85, "elapsed_time": "11:23:25", "remaining_time": "17:55:49", "throughput": 1616.21, "total_tokens": 66273280} -{"current_steps": 8100, "total_steps": 20825, "loss": 0.8299, "learning_rate": 3.5776929240211224e-05, "epoch": 0.38895558223289317, "percentage": 38.9, "elapsed_time": "11:24:18", "remaining_time": "17:55:02", "throughput": 1616.11, "total_tokens": 66355200} -{"current_steps": 8110, "total_steps": 20825, "loss": 1.0024, "learning_rate": 3.5741169111366047e-05, "epoch": 0.38943577430972387, "percentage": 38.94, "elapsed_time": "11:25:11", "remaining_time": "17:54:15", "throughput": 1616.01, "total_tokens": 66437120} -{"current_steps": 8120, "total_steps": 20825, "loss": 1.0171, "learning_rate": 3.570538200979635e-05, "epoch": 0.3899159663865546, "percentage": 38.99, "elapsed_time": "11:26:05", "remaining_time": "17:53:29", "throughput": 1615.9, "total_tokens": 66519040} -{"current_steps": 8130, "total_steps": 20825, "loss": 0.9044, "learning_rate": 3.566956802536904e-05, "epoch": 0.3903961584633854, "percentage": 39.04, "elapsed_time": "11:26:58", "remaining_time": "17:52:42", "throughput": 1615.8, "total_tokens": 66600960} -{"current_steps": 8140, "total_steps": 20825, "loss": 0.9338, "learning_rate": 3.5633727248018536e-05, "epoch": 0.3908763505402161, "percentage": 39.09, "elapsed_time": "11:27:51", "remaining_time": "17:51:55", "throughput": 1615.71, "total_tokens": 66682880} -{"current_steps": 8150, "total_steps": 20825, "loss": 0.8946, "learning_rate": 3.5597859767746524e-05, "epoch": 0.39135654261704683, "percentage": 39.14, "elapsed_time": "11:28:44", "remaining_time": "17:51:09", "throughput": 1615.61, "total_tokens": 66764800} -{"current_steps": 8160, "total_steps": 20825, "loss": 0.8835, "learning_rate": 3.556196567462175e-05, "epoch": 0.39183673469387753, "percentage": 39.18, "elapsed_time": "11:29:38", "remaining_time": "17:50:22", "throughput": 1615.51, "total_tokens": 66846720} -{"current_steps": 8170, "total_steps": 20825, "loss": 0.9559, "learning_rate": 3.5526045058779805e-05, "epoch": 0.3923169267707083, "percentage": 39.23, "elapsed_time": "11:30:32", "remaining_time": "17:49:36", "throughput": 1615.38, "total_tokens": 66928640} -{"current_steps": 8180, "total_steps": 20825, "loss": 0.8609, "learning_rate": 3.549009801042286e-05, "epoch": 0.39279711884753904, "percentage": 39.28, "elapsed_time": "11:31:25", "remaining_time": "17:48:50", "throughput": 1615.27, "total_tokens": 67010560} -{"current_steps": 8190, "total_steps": 20825, "loss": 0.9237, "learning_rate": 3.545412461981947e-05, "epoch": 0.39327731092436974, "percentage": 39.33, "elapsed_time": "11:32:19", "remaining_time": "17:48:03", "throughput": 1615.16, "total_tokens": 67092480} -{"current_steps": 8200, "total_steps": 20825, "loss": 0.992, "learning_rate": 3.541812497730435e-05, "epoch": 0.3937575030012005, "percentage": 39.38, "elapsed_time": "11:33:12", "remaining_time": "17:47:16", "throughput": 1615.07, "total_tokens": 67174400} -{"current_steps": 8210, "total_steps": 20825, "loss": 0.9067, "learning_rate": 3.5382099173278125e-05, "epoch": 0.3942376950780312, "percentage": 39.42, "elapsed_time": "11:34:05", "remaining_time": "17:46:29", "throughput": 1614.98, "total_tokens": 67256320} -{"current_steps": 8220, "total_steps": 20825, "loss": 0.891, "learning_rate": 3.5346047298207116e-05, "epoch": 0.39471788715486195, "percentage": 39.47, "elapsed_time": "11:34:58", "remaining_time": "17:45:43", "throughput": 1614.87, "total_tokens": 67338240} -{"current_steps": 8230, "total_steps": 20825, "loss": 0.7989, "learning_rate": 3.530996944262312e-05, "epoch": 0.3951980792316927, "percentage": 39.52, "elapsed_time": "11:35:52", "remaining_time": "17:44:56", "throughput": 1614.76, "total_tokens": 67420160} -{"current_steps": 8240, "total_steps": 20825, "loss": 0.8951, "learning_rate": 3.5273865697123164e-05, "epoch": 0.3956782713085234, "percentage": 39.57, "elapsed_time": "11:36:45", "remaining_time": "17:44:09", "throughput": 1614.68, "total_tokens": 67502080} -{"current_steps": 8250, "total_steps": 20825, "loss": 1.0857, "learning_rate": 3.52377361523693e-05, "epoch": 0.39615846338535415, "percentage": 39.62, "elapsed_time": "11:37:38", "remaining_time": "17:43:22", "throughput": 1614.57, "total_tokens": 67584000} -{"current_steps": 8260, "total_steps": 20825, "loss": 1.0151, "learning_rate": 3.520158089908836e-05, "epoch": 0.39663865546218485, "percentage": 39.66, "elapsed_time": "11:38:31", "remaining_time": "17:42:35", "throughput": 1614.48, "total_tokens": 67665920} -{"current_steps": 8270, "total_steps": 20825, "loss": 0.765, "learning_rate": 3.516540002807174e-05, "epoch": 0.3971188475390156, "percentage": 39.71, "elapsed_time": "11:39:25", "remaining_time": "17:41:48", "throughput": 1614.39, "total_tokens": 67747840} -{"current_steps": 8280, "total_steps": 20825, "loss": 0.881, "learning_rate": 3.512919363017516e-05, "epoch": 0.39759903961584636, "percentage": 39.76, "elapsed_time": "11:40:18", "remaining_time": "17:41:01", "throughput": 1614.29, "total_tokens": 67829760} -{"current_steps": 8290, "total_steps": 20825, "loss": 0.8293, "learning_rate": 3.509296179631843e-05, "epoch": 0.39807923169267706, "percentage": 39.81, "elapsed_time": "11:41:11", "remaining_time": "17:40:15", "throughput": 1614.19, "total_tokens": 67911680} -{"current_steps": 8300, "total_steps": 20825, "loss": 0.8953, "learning_rate": 3.505670461748527e-05, "epoch": 0.3985594237695078, "percentage": 39.86, "elapsed_time": "11:42:04", "remaining_time": "17:39:28", "throughput": 1614.09, "total_tokens": 67993600} -{"current_steps": 8310, "total_steps": 20825, "loss": 1.19, "learning_rate": 3.5020422184723e-05, "epoch": 0.3990396158463385, "percentage": 39.9, "elapsed_time": "11:42:58", "remaining_time": "17:38:41", "throughput": 1613.99, "total_tokens": 68075520} -{"current_steps": 8320, "total_steps": 20825, "loss": 0.8479, "learning_rate": 3.498411458914238e-05, "epoch": 0.39951980792316927, "percentage": 39.95, "elapsed_time": "11:43:51", "remaining_time": "17:37:54", "throughput": 1613.9, "total_tokens": 68157440} -{"current_steps": 8330, "total_steps": 20825, "loss": 0.8593, "learning_rate": 3.494778192191739e-05, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "11:44:44", "remaining_time": "17:37:06", "throughput": 1613.81, "total_tokens": 68239360} -{"current_steps": 8340, "total_steps": 20825, "loss": 0.771, "learning_rate": 3.4911424274284886e-05, "epoch": 0.4004801920768307, "percentage": 40.05, "elapsed_time": "11:45:38", "remaining_time": "17:36:21", "throughput": 1613.68, "total_tokens": 68321280} -{"current_steps": 8350, "total_steps": 20825, "loss": 0.9203, "learning_rate": 3.4875041737544526e-05, "epoch": 0.4009603841536615, "percentage": 40.1, "elapsed_time": "11:46:33", "remaining_time": "17:35:36", "throughput": 1613.54, "total_tokens": 68403200} -{"current_steps": 8360, "total_steps": 20825, "loss": 0.8853, "learning_rate": 3.483863440305845e-05, "epoch": 0.4014405762304922, "percentage": 40.14, "elapsed_time": "11:47:26", "remaining_time": "17:34:49", "throughput": 1613.43, "total_tokens": 68485120} -{"current_steps": 8370, "total_steps": 20825, "loss": 0.9757, "learning_rate": 3.480220236225106e-05, "epoch": 0.40192076830732293, "percentage": 40.19, "elapsed_time": "11:48:20", "remaining_time": "17:34:02", "throughput": 1613.33, "total_tokens": 68567040} -{"current_steps": 8380, "total_steps": 20825, "loss": 0.8719, "learning_rate": 3.476574570660879e-05, "epoch": 0.4024009603841537, "percentage": 40.24, "elapsed_time": "11:49:13", "remaining_time": "17:33:14", "throughput": 1613.25, "total_tokens": 68648960} -{"current_steps": 8390, "total_steps": 20825, "loss": 0.7306, "learning_rate": 3.472926452767992e-05, "epoch": 0.4028811524609844, "percentage": 40.29, "elapsed_time": "11:50:06", "remaining_time": "17:32:27", "throughput": 1613.17, "total_tokens": 68730880} -{"current_steps": 8400, "total_steps": 20825, "loss": 0.8629, "learning_rate": 3.469275891707428e-05, "epoch": 0.40336134453781514, "percentage": 40.34, "elapsed_time": "11:50:59", "remaining_time": "17:31:40", "throughput": 1613.07, "total_tokens": 68812800} -{"current_steps": 8410, "total_steps": 20825, "loss": 0.8746, "learning_rate": 3.465622896646305e-05, "epoch": 0.40384153661464584, "percentage": 40.38, "elapsed_time": "11:51:52", "remaining_time": "17:30:52", "throughput": 1612.99, "total_tokens": 68894720} -{"current_steps": 8420, "total_steps": 20825, "loss": 0.8477, "learning_rate": 3.461967476757857e-05, "epoch": 0.4043217286914766, "percentage": 40.43, "elapsed_time": "11:52:45", "remaining_time": "17:30:05", "throughput": 1612.91, "total_tokens": 68976640} -{"current_steps": 8430, "total_steps": 20825, "loss": 1.0445, "learning_rate": 3.4583096412214025e-05, "epoch": 0.40480192076830734, "percentage": 40.48, "elapsed_time": "11:53:38", "remaining_time": "17:29:18", "throughput": 1612.81, "total_tokens": 69058560} -{"current_steps": 8440, "total_steps": 20825, "loss": 0.846, "learning_rate": 3.454649399222328e-05, "epoch": 0.40528211284513804, "percentage": 40.53, "elapsed_time": "11:54:32", "remaining_time": "17:28:31", "throughput": 1612.71, "total_tokens": 69140480} -{"current_steps": 8450, "total_steps": 20825, "loss": 0.8504, "learning_rate": 3.450986759952064e-05, "epoch": 0.4057623049219688, "percentage": 40.58, "elapsed_time": "11:55:25", "remaining_time": "17:27:43", "throughput": 1612.63, "total_tokens": 69222400} -{"current_steps": 8460, "total_steps": 20825, "loss": 0.8774, "learning_rate": 3.44732173260806e-05, "epoch": 0.4062424969987995, "percentage": 40.62, "elapsed_time": "11:56:18", "remaining_time": "17:26:56", "throughput": 1612.54, "total_tokens": 69304320} -{"current_steps": 8470, "total_steps": 20825, "loss": 0.9147, "learning_rate": 3.4436543263937613e-05, "epoch": 0.40672268907563025, "percentage": 40.67, "elapsed_time": "11:57:11", "remaining_time": "17:26:09", "throughput": 1612.44, "total_tokens": 69386240} -{"current_steps": 8480, "total_steps": 20825, "loss": 0.8726, "learning_rate": 3.439984550518589e-05, "epoch": 0.407202881152461, "percentage": 40.72, "elapsed_time": "11:58:05", "remaining_time": "17:25:22", "throughput": 1612.35, "total_tokens": 69468160} -{"current_steps": 8490, "total_steps": 20825, "loss": 0.9237, "learning_rate": 3.436312414197913e-05, "epoch": 0.4076830732292917, "percentage": 40.77, "elapsed_time": "11:58:58", "remaining_time": "17:24:34", "throughput": 1612.26, "total_tokens": 69550080} -{"current_steps": 8500, "total_steps": 20825, "loss": 1.0674, "learning_rate": 3.4326379266530314e-05, "epoch": 0.40816326530612246, "percentage": 40.82, "elapsed_time": "11:59:51", "remaining_time": "17:23:47", "throughput": 1612.17, "total_tokens": 69632000} -{"current_steps": 8510, "total_steps": 20825, "loss": 0.8397, "learning_rate": 3.428961097111146e-05, "epoch": 0.40864345738295316, "percentage": 40.86, "elapsed_time": "12:00:44", "remaining_time": "17:23:00", "throughput": 1612.07, "total_tokens": 69713920} -{"current_steps": 8520, "total_steps": 20825, "loss": 0.909, "learning_rate": 3.4252819348053424e-05, "epoch": 0.4091236494597839, "percentage": 40.91, "elapsed_time": "12:01:38", "remaining_time": "17:22:13", "throughput": 1611.97, "total_tokens": 69795840} -{"current_steps": 8530, "total_steps": 20825, "loss": 0.9302, "learning_rate": 3.421600448974559e-05, "epoch": 0.40960384153661467, "percentage": 40.96, "elapsed_time": "12:02:31", "remaining_time": "17:21:25", "throughput": 1611.89, "total_tokens": 69877760} -{"current_steps": 8540, "total_steps": 20825, "loss": 0.9918, "learning_rate": 3.4179166488635736e-05, "epoch": 0.41008403361344536, "percentage": 41.01, "elapsed_time": "12:03:24", "remaining_time": "17:20:38", "throughput": 1611.8, "total_tokens": 69959680} -{"current_steps": 8550, "total_steps": 20825, "loss": 0.9864, "learning_rate": 3.414230543722973e-05, "epoch": 0.4105642256902761, "percentage": 41.06, "elapsed_time": "12:04:17", "remaining_time": "17:19:51", "throughput": 1611.71, "total_tokens": 70041600} -{"current_steps": 8560, "total_steps": 20825, "loss": 0.872, "learning_rate": 3.410542142809134e-05, "epoch": 0.4110444177671068, "percentage": 41.1, "elapsed_time": "12:05:11", "remaining_time": "17:19:03", "throughput": 1611.62, "total_tokens": 70123520} -{"current_steps": 8570, "total_steps": 20825, "loss": 1.0904, "learning_rate": 3.4068514553841965e-05, "epoch": 0.41152460984393757, "percentage": 41.15, "elapsed_time": "12:06:04", "remaining_time": "17:18:16", "throughput": 1611.53, "total_tokens": 70205440} -{"current_steps": 8580, "total_steps": 20825, "loss": 0.8943, "learning_rate": 3.403158490716043e-05, "epoch": 0.4120048019207683, "percentage": 41.2, "elapsed_time": "12:06:57", "remaining_time": "17:17:29", "throughput": 1611.45, "total_tokens": 70287360} -{"current_steps": 8590, "total_steps": 20825, "loss": 0.8691, "learning_rate": 3.3994632580782766e-05, "epoch": 0.412484993997599, "percentage": 41.25, "elapsed_time": "12:07:50", "remaining_time": "17:16:41", "throughput": 1611.36, "total_tokens": 70369280} -{"current_steps": 8600, "total_steps": 20825, "loss": 0.8594, "learning_rate": 3.395765766750192e-05, "epoch": 0.4129651860744298, "percentage": 41.3, "elapsed_time": "12:08:44", "remaining_time": "17:15:54", "throughput": 1611.27, "total_tokens": 70451200} -{"current_steps": 8610, "total_steps": 20825, "loss": 0.8132, "learning_rate": 3.392066026016757e-05, "epoch": 0.4134453781512605, "percentage": 41.34, "elapsed_time": "12:09:37", "remaining_time": "17:15:06", "throughput": 1611.18, "total_tokens": 70533120} -{"current_steps": 8620, "total_steps": 20825, "loss": 0.8289, "learning_rate": 3.388364045168591e-05, "epoch": 0.41392557022809123, "percentage": 41.39, "elapsed_time": "12:10:30", "remaining_time": "17:14:19", "throughput": 1611.1, "total_tokens": 70615040} -{"current_steps": 8630, "total_steps": 20825, "loss": 0.8435, "learning_rate": 3.3846598335019335e-05, "epoch": 0.414405762304922, "percentage": 41.44, "elapsed_time": "12:11:23", "remaining_time": "17:13:31", "throughput": 1611.01, "total_tokens": 70696960} -{"current_steps": 8640, "total_steps": 20825, "loss": 0.9588, "learning_rate": 3.38095340031863e-05, "epoch": 0.4148859543817527, "percentage": 41.49, "elapsed_time": "12:12:16", "remaining_time": "17:12:44", "throughput": 1610.92, "total_tokens": 70778880} -{"current_steps": 8650, "total_steps": 20825, "loss": 1.0117, "learning_rate": 3.377244754926104e-05, "epoch": 0.41536614645858344, "percentage": 41.54, "elapsed_time": "12:13:10", "remaining_time": "17:11:56", "throughput": 1610.84, "total_tokens": 70860800} -{"current_steps": 8660, "total_steps": 20825, "loss": 0.8984, "learning_rate": 3.3735339066373314e-05, "epoch": 0.41584633853541414, "percentage": 41.58, "elapsed_time": "12:14:03", "remaining_time": "17:11:09", "throughput": 1610.74, "total_tokens": 70942720} -{"current_steps": 8670, "total_steps": 20825, "loss": 0.852, "learning_rate": 3.369820864770822e-05, "epoch": 0.4163265306122449, "percentage": 41.63, "elapsed_time": "12:14:56", "remaining_time": "17:10:22", "throughput": 1610.65, "total_tokens": 71024640} -{"current_steps": 8680, "total_steps": 20825, "loss": 0.8927, "learning_rate": 3.366105638650596e-05, "epoch": 0.41680672268907565, "percentage": 41.68, "elapsed_time": "12:15:50", "remaining_time": "17:09:34", "throughput": 1610.57, "total_tokens": 71106560} -{"current_steps": 8690, "total_steps": 20825, "loss": 0.8245, "learning_rate": 3.3623882376061554e-05, "epoch": 0.41728691476590635, "percentage": 41.73, "elapsed_time": "12:16:43", "remaining_time": "17:08:46", "throughput": 1610.48, "total_tokens": 71188480} -{"current_steps": 8700, "total_steps": 20825, "loss": 0.8433, "learning_rate": 3.358668670972465e-05, "epoch": 0.4177671068427371, "percentage": 41.78, "elapsed_time": "12:17:37", "remaining_time": "17:08:00", "throughput": 1610.37, "total_tokens": 71270400} -{"current_steps": 8710, "total_steps": 20825, "loss": 0.9426, "learning_rate": 3.354946948089927e-05, "epoch": 0.4182472989195678, "percentage": 41.82, "elapsed_time": "12:18:30", "remaining_time": "17:07:12", "throughput": 1610.28, "total_tokens": 71352320} -{"current_steps": 8720, "total_steps": 20825, "loss": 0.8831, "learning_rate": 3.351223078304359e-05, "epoch": 0.41872749099639855, "percentage": 41.87, "elapsed_time": "12:19:23", "remaining_time": "17:06:24", "throughput": 1610.2, "total_tokens": 71434240} -{"current_steps": 8730, "total_steps": 20825, "loss": 0.9697, "learning_rate": 3.34749707096697e-05, "epoch": 0.4192076830732293, "percentage": 41.92, "elapsed_time": "12:20:16", "remaining_time": "17:05:36", "throughput": 1610.13, "total_tokens": 71516160} -{"current_steps": 8740, "total_steps": 20825, "loss": 0.8492, "learning_rate": 3.343768935434337e-05, "epoch": 0.41968787515006, "percentage": 41.97, "elapsed_time": "12:21:09", "remaining_time": "17:04:49", "throughput": 1610.03, "total_tokens": 71598080} -{"current_steps": 8750, "total_steps": 20825, "loss": 0.9056, "learning_rate": 3.34003868106838e-05, "epoch": 0.42016806722689076, "percentage": 42.02, "elapsed_time": "12:22:03", "remaining_time": "17:04:02", "throughput": 1609.94, "total_tokens": 71680000} -{"current_steps": 8760, "total_steps": 20825, "loss": 0.9732, "learning_rate": 3.3363063172363396e-05, "epoch": 0.42064825930372146, "percentage": 42.06, "elapsed_time": "12:22:56", "remaining_time": "17:03:14", "throughput": 1609.85, "total_tokens": 71761920} -{"current_steps": 8770, "total_steps": 20825, "loss": 1.1805, "learning_rate": 3.3325718533107556e-05, "epoch": 0.4211284513805522, "percentage": 42.11, "elapsed_time": "12:23:49", "remaining_time": "17:02:27", "throughput": 1609.77, "total_tokens": 71843840} -{"current_steps": 8780, "total_steps": 20825, "loss": 0.9309, "learning_rate": 3.3288352986694396e-05, "epoch": 0.42160864345738297, "percentage": 42.16, "elapsed_time": "12:24:43", "remaining_time": "17:01:39", "throughput": 1609.69, "total_tokens": 71925760} -{"current_steps": 8790, "total_steps": 20825, "loss": 1.0555, "learning_rate": 3.325096662695454e-05, "epoch": 0.42208883553421367, "percentage": 42.21, "elapsed_time": "12:25:36", "remaining_time": "17:00:51", "throughput": 1609.6, "total_tokens": 72007680} -{"current_steps": 8800, "total_steps": 20825, "loss": 0.831, "learning_rate": 3.321355954777087e-05, "epoch": 0.4225690276110444, "percentage": 42.26, "elapsed_time": "12:26:29", "remaining_time": "17:00:04", "throughput": 1609.51, "total_tokens": 72089600} -{"current_steps": 8810, "total_steps": 20825, "loss": 0.9081, "learning_rate": 3.317613184307832e-05, "epoch": 0.4230492196878752, "percentage": 42.3, "elapsed_time": "12:27:23", "remaining_time": "16:59:17", "throughput": 1609.4, "total_tokens": 72171520} -{"current_steps": 8820, "total_steps": 20825, "loss": 0.9385, "learning_rate": 3.313868360686359e-05, "epoch": 0.4235294117647059, "percentage": 42.35, "elapsed_time": "12:28:16", "remaining_time": "16:58:29", "throughput": 1609.32, "total_tokens": 72253440} -{"current_steps": 8830, "total_steps": 20825, "loss": 0.8992, "learning_rate": 3.310121493316495e-05, "epoch": 0.42400960384153663, "percentage": 42.4, "elapsed_time": "12:29:10", "remaining_time": "16:57:41", "throughput": 1609.23, "total_tokens": 72335360} -{"current_steps": 8840, "total_steps": 20825, "loss": 0.8763, "learning_rate": 3.306372591607199e-05, "epoch": 0.42448979591836733, "percentage": 42.45, "elapsed_time": "12:30:03", "remaining_time": "16:56:54", "throughput": 1609.15, "total_tokens": 72417280} -{"current_steps": 8850, "total_steps": 20825, "loss": 0.8636, "learning_rate": 3.30262166497254e-05, "epoch": 0.4249699879951981, "percentage": 42.5, "elapsed_time": "12:30:57", "remaining_time": "16:56:07", "throughput": 1609.04, "total_tokens": 72499200} -{"current_steps": 8860, "total_steps": 20825, "loss": 1.1187, "learning_rate": 3.29886872283167e-05, "epoch": 0.42545018007202884, "percentage": 42.55, "elapsed_time": "12:31:51", "remaining_time": "16:55:20", "throughput": 1608.94, "total_tokens": 72581120} -{"current_steps": 8870, "total_steps": 20825, "loss": 0.9403, "learning_rate": 3.2951137746088004e-05, "epoch": 0.42593037214885954, "percentage": 42.59, "elapsed_time": "12:32:44", "remaining_time": "16:54:32", "throughput": 1608.86, "total_tokens": 72663040} -{"current_steps": 8880, "total_steps": 20825, "loss": 0.8392, "learning_rate": 3.291356829733186e-05, "epoch": 0.4264105642256903, "percentage": 42.64, "elapsed_time": "12:33:37", "remaining_time": "16:53:44", "throughput": 1608.79, "total_tokens": 72744960} -{"current_steps": 8890, "total_steps": 20825, "loss": 1.0537, "learning_rate": 3.287597897639092e-05, "epoch": 0.426890756302521, "percentage": 42.69, "elapsed_time": "12:34:30", "remaining_time": "16:52:56", "throughput": 1608.7, "total_tokens": 72826880} -{"current_steps": 8900, "total_steps": 20825, "loss": 0.8691, "learning_rate": 3.283836987765771e-05, "epoch": 0.42737094837935174, "percentage": 42.74, "elapsed_time": "12:35:23", "remaining_time": "16:52:08", "throughput": 1608.63, "total_tokens": 72908800} -{"current_steps": 8910, "total_steps": 20825, "loss": 0.8148, "learning_rate": 3.280074109557447e-05, "epoch": 0.4278511404561825, "percentage": 42.79, "elapsed_time": "12:36:17", "remaining_time": "16:51:21", "throughput": 1608.54, "total_tokens": 72990720} -{"current_steps": 8920, "total_steps": 20825, "loss": 0.8026, "learning_rate": 3.2763092724632854e-05, "epoch": 0.4283313325330132, "percentage": 42.83, "elapsed_time": "12:37:11", "remaining_time": "16:50:34", "throughput": 1608.43, "total_tokens": 73072640} -{"current_steps": 8930, "total_steps": 20825, "loss": 0.9775, "learning_rate": 3.272542485937369e-05, "epoch": 0.42881152460984395, "percentage": 42.88, "elapsed_time": "12:38:04", "remaining_time": "16:49:46", "throughput": 1608.35, "total_tokens": 73154560} -{"current_steps": 8940, "total_steps": 20825, "loss": 0.7946, "learning_rate": 3.2687737594386766e-05, "epoch": 0.42929171668667465, "percentage": 42.93, "elapsed_time": "12:38:57", "remaining_time": "16:48:58", "throughput": 1608.25, "total_tokens": 73236480} -{"current_steps": 8950, "total_steps": 20825, "loss": 1.0062, "learning_rate": 3.2650031024310603e-05, "epoch": 0.4297719087635054, "percentage": 42.98, "elapsed_time": "12:39:51", "remaining_time": "16:48:11", "throughput": 1608.16, "total_tokens": 73318400} -{"current_steps": 8960, "total_steps": 20825, "loss": 1.0847, "learning_rate": 3.2612305243832176e-05, "epoch": 0.43025210084033616, "percentage": 43.03, "elapsed_time": "12:40:45", "remaining_time": "16:47:24", "throughput": 1608.05, "total_tokens": 73400320} -{"current_steps": 8970, "total_steps": 20825, "loss": 0.9699, "learning_rate": 3.2574560347686725e-05, "epoch": 0.43073229291716686, "percentage": 43.07, "elapsed_time": "12:41:38", "remaining_time": "16:46:36", "throughput": 1607.97, "total_tokens": 73482240} -{"current_steps": 8980, "total_steps": 20825, "loss": 0.9454, "learning_rate": 3.253679643065747e-05, "epoch": 0.4312124849939976, "percentage": 43.12, "elapsed_time": "12:42:32", "remaining_time": "16:45:49", "throughput": 1607.88, "total_tokens": 73564160} -{"current_steps": 8990, "total_steps": 20825, "loss": 0.9417, "learning_rate": 3.249901358757538e-05, "epoch": 0.4316926770708283, "percentage": 43.17, "elapsed_time": "12:43:25", "remaining_time": "16:45:01", "throughput": 1607.8, "total_tokens": 73646080} -{"current_steps": 9000, "total_steps": 20825, "loss": 0.9839, "learning_rate": 3.246121191331902e-05, "epoch": 0.43217286914765907, "percentage": 43.22, "elapsed_time": "12:44:18", "remaining_time": "16:44:12", "throughput": 1607.73, "total_tokens": 73728000} -{"current_steps": 9010, "total_steps": 20825, "loss": 0.8661, "learning_rate": 3.242339150281417e-05, "epoch": 0.4326530612244898, "percentage": 43.27, "elapsed_time": "12:45:14", "remaining_time": "16:43:28", "throughput": 1607.55, "total_tokens": 73809920} -{"current_steps": 9020, "total_steps": 20825, "loss": 0.8686, "learning_rate": 3.238555245103368e-05, "epoch": 0.4331332533013205, "percentage": 43.31, "elapsed_time": "12:46:07", "remaining_time": "16:42:40", "throughput": 1607.47, "total_tokens": 73891840} -{"current_steps": 9030, "total_steps": 20825, "loss": 0.8504, "learning_rate": 3.234769485299724e-05, "epoch": 0.4336134453781513, "percentage": 43.36, "elapsed_time": "12:47:01", "remaining_time": "16:41:52", "throughput": 1607.38, "total_tokens": 73973760} -{"current_steps": 9040, "total_steps": 20825, "loss": 1.0346, "learning_rate": 3.230981880377107e-05, "epoch": 0.434093637454982, "percentage": 43.41, "elapsed_time": "12:47:54", "remaining_time": "16:41:05", "throughput": 1607.3, "total_tokens": 74055680} -{"current_steps": 9050, "total_steps": 20825, "loss": 0.9299, "learning_rate": 3.227192439846775e-05, "epoch": 0.4345738295318127, "percentage": 43.46, "elapsed_time": "12:48:47", "remaining_time": "16:40:17", "throughput": 1607.22, "total_tokens": 74137600} -{"current_steps": 9060, "total_steps": 20825, "loss": 0.9369, "learning_rate": 3.223401173224595e-05, "epoch": 0.4350540216086435, "percentage": 43.51, "elapsed_time": "12:49:40", "remaining_time": "16:39:28", "throughput": 1607.15, "total_tokens": 74219520} -{"current_steps": 9070, "total_steps": 20825, "loss": 0.8562, "learning_rate": 3.219608090031021e-05, "epoch": 0.4355342136854742, "percentage": 43.55, "elapsed_time": "12:50:34", "remaining_time": "16:38:41", "throughput": 1607.06, "total_tokens": 74301440} -{"current_steps": 9080, "total_steps": 20825, "loss": 1.0076, "learning_rate": 3.215813199791065e-05, "epoch": 0.43601440576230494, "percentage": 43.6, "elapsed_time": "12:51:27", "remaining_time": "16:37:53", "throughput": 1606.98, "total_tokens": 74383360} -{"current_steps": 9090, "total_steps": 20825, "loss": 0.8394, "learning_rate": 3.212016512034279e-05, "epoch": 0.43649459783913563, "percentage": 43.65, "elapsed_time": "12:52:21", "remaining_time": "16:37:05", "throughput": 1606.89, "total_tokens": 74465280} -{"current_steps": 9100, "total_steps": 20825, "loss": 0.9406, "learning_rate": 3.2082180362947304e-05, "epoch": 0.4369747899159664, "percentage": 43.7, "elapsed_time": "12:53:14", "remaining_time": "16:36:17", "throughput": 1606.81, "total_tokens": 74547200} -{"current_steps": 9110, "total_steps": 20825, "loss": 1.0131, "learning_rate": 3.204417782110974e-05, "epoch": 0.43745498199279714, "percentage": 43.75, "elapsed_time": "12:54:07", "remaining_time": "16:35:28", "throughput": 1606.75, "total_tokens": 74629120} -{"current_steps": 9120, "total_steps": 20825, "loss": 1.0524, "learning_rate": 3.200615759026031e-05, "epoch": 0.43793517406962784, "percentage": 43.79, "elapsed_time": "12:55:00", "remaining_time": "16:34:40", "throughput": 1606.67, "total_tokens": 74711040} -{"current_steps": 9130, "total_steps": 20825, "loss": 0.8463, "learning_rate": 3.1968119765873654e-05, "epoch": 0.4384153661464586, "percentage": 43.84, "elapsed_time": "12:55:53", "remaining_time": "16:33:52", "throughput": 1606.59, "total_tokens": 74792960} -{"current_steps": 9140, "total_steps": 20825, "loss": 0.8177, "learning_rate": 3.193006444346859e-05, "epoch": 0.4388955582232893, "percentage": 43.89, "elapsed_time": "12:56:47", "remaining_time": "16:33:04", "throughput": 1606.51, "total_tokens": 74874880} -{"current_steps": 9150, "total_steps": 20825, "loss": 1.1675, "learning_rate": 3.189199171860787e-05, "epoch": 0.43937575030012005, "percentage": 43.94, "elapsed_time": "12:57:40", "remaining_time": "16:32:17", "throughput": 1606.41, "total_tokens": 74956800} -{"current_steps": 9160, "total_steps": 20825, "loss": 0.7782, "learning_rate": 3.185390168689796e-05, "epoch": 0.4398559423769508, "percentage": 43.99, "elapsed_time": "12:58:33", "remaining_time": "16:31:28", "throughput": 1606.34, "total_tokens": 75038720} -{"current_steps": 9170, "total_steps": 20825, "loss": 0.74, "learning_rate": 3.1815794443988763e-05, "epoch": 0.4403361344537815, "percentage": 44.03, "elapsed_time": "12:59:27", "remaining_time": "16:30:40", "throughput": 1606.27, "total_tokens": 75120640} -{"current_steps": 9180, "total_steps": 20825, "loss": 0.9299, "learning_rate": 3.177767008557343e-05, "epoch": 0.44081632653061226, "percentage": 44.08, "elapsed_time": "13:00:20", "remaining_time": "16:29:52", "throughput": 1606.2, "total_tokens": 75202560} -{"current_steps": 9190, "total_steps": 20825, "loss": 0.8375, "learning_rate": 3.1739528707388066e-05, "epoch": 0.44129651860744296, "percentage": 44.13, "elapsed_time": "13:01:13", "remaining_time": "16:29:04", "throughput": 1606.12, "total_tokens": 75284480} -{"current_steps": 9200, "total_steps": 20825, "loss": 0.8294, "learning_rate": 3.1701370405211535e-05, "epoch": 0.4417767106842737, "percentage": 44.18, "elapsed_time": "13:02:07", "remaining_time": "16:28:16", "throughput": 1606.03, "total_tokens": 75366400} -{"current_steps": 9210, "total_steps": 20825, "loss": 0.965, "learning_rate": 3.166319527486519e-05, "epoch": 0.44225690276110446, "percentage": 44.23, "elapsed_time": "13:03:00", "remaining_time": "16:27:28", "throughput": 1605.95, "total_tokens": 75448320} -{"current_steps": 9220, "total_steps": 20825, "loss": 0.9839, "learning_rate": 3.162500341221264e-05, "epoch": 0.44273709483793516, "percentage": 44.27, "elapsed_time": "13:03:53", "remaining_time": "16:26:40", "throughput": 1605.87, "total_tokens": 75530240} -{"current_steps": 9230, "total_steps": 20825, "loss": 0.9622, "learning_rate": 3.158679491315951e-05, "epoch": 0.4432172869147659, "percentage": 44.32, "elapsed_time": "13:04:47", "remaining_time": "16:25:52", "throughput": 1605.8, "total_tokens": 75612160} -{"current_steps": 9240, "total_steps": 20825, "loss": 0.9561, "learning_rate": 3.154856987365322e-05, "epoch": 0.4436974789915966, "percentage": 44.37, "elapsed_time": "13:05:40", "remaining_time": "16:25:04", "throughput": 1605.7, "total_tokens": 75694080} -{"current_steps": 9250, "total_steps": 20825, "loss": 0.794, "learning_rate": 3.151032838968271e-05, "epoch": 0.44417767106842737, "percentage": 44.42, "elapsed_time": "13:06:34", "remaining_time": "16:24:16", "throughput": 1605.62, "total_tokens": 75776000} -{"current_steps": 9260, "total_steps": 20825, "loss": 1.0292, "learning_rate": 3.14720705572782e-05, "epoch": 0.4446578631452581, "percentage": 44.47, "elapsed_time": "13:07:27", "remaining_time": "16:23:28", "throughput": 1605.53, "total_tokens": 75857920} -{"current_steps": 9270, "total_steps": 20825, "loss": 0.865, "learning_rate": 3.1433796472511e-05, "epoch": 0.4451380552220888, "percentage": 44.51, "elapsed_time": "13:08:21", "remaining_time": "16:22:40", "throughput": 1605.46, "total_tokens": 75939840} -{"current_steps": 9280, "total_steps": 20825, "loss": 1.0853, "learning_rate": 3.13955062314932e-05, "epoch": 0.4456182472989196, "percentage": 44.56, "elapsed_time": "13:09:14", "remaining_time": "16:21:52", "throughput": 1605.38, "total_tokens": 76021760} -{"current_steps": 9290, "total_steps": 20825, "loss": 0.9558, "learning_rate": 3.135719993037748e-05, "epoch": 0.4460984393757503, "percentage": 44.61, "elapsed_time": "13:10:07", "remaining_time": "16:21:03", "throughput": 1605.31, "total_tokens": 76103680} -{"current_steps": 9300, "total_steps": 20825, "loss": 0.9276, "learning_rate": 3.131887766535684e-05, "epoch": 0.44657863145258103, "percentage": 44.66, "elapsed_time": "13:11:00", "remaining_time": "16:20:15", "throughput": 1605.23, "total_tokens": 76185600} -{"current_steps": 9310, "total_steps": 20825, "loss": 0.8235, "learning_rate": 3.1280539532664366e-05, "epoch": 0.4470588235294118, "percentage": 44.71, "elapsed_time": "13:11:54", "remaining_time": "16:19:27", "throughput": 1605.14, "total_tokens": 76267520} -{"current_steps": 9320, "total_steps": 20825, "loss": 0.8764, "learning_rate": 3.1242185628573e-05, "epoch": 0.4475390156062425, "percentage": 44.75, "elapsed_time": "13:12:47", "remaining_time": "16:18:39", "throughput": 1605.07, "total_tokens": 76349440} -{"current_steps": 9330, "total_steps": 20825, "loss": 0.8174, "learning_rate": 3.120381604939529e-05, "epoch": 0.44801920768307324, "percentage": 44.8, "elapsed_time": "13:13:40", "remaining_time": "16:17:51", "throughput": 1605.0, "total_tokens": 76431360} -{"current_steps": 9340, "total_steps": 20825, "loss": 0.9815, "learning_rate": 3.116543089148312e-05, "epoch": 0.44849939975990394, "percentage": 44.85, "elapsed_time": "13:14:33", "remaining_time": "16:17:02", "throughput": 1604.93, "total_tokens": 76513280} -{"current_steps": 9350, "total_steps": 20825, "loss": 0.7665, "learning_rate": 3.112703025122754e-05, "epoch": 0.4489795918367347, "percentage": 44.9, "elapsed_time": "13:15:27", "remaining_time": "16:16:14", "throughput": 1604.84, "total_tokens": 76595200} -{"current_steps": 9360, "total_steps": 20825, "loss": 0.7452, "learning_rate": 3.108861422505842e-05, "epoch": 0.44945978391356545, "percentage": 44.95, "elapsed_time": "13:16:20", "remaining_time": "16:15:26", "throughput": 1604.77, "total_tokens": 76677120} -{"current_steps": 9370, "total_steps": 20825, "loss": 0.9044, "learning_rate": 3.105018290944432e-05, "epoch": 0.44993997599039615, "percentage": 44.99, "elapsed_time": "13:17:13", "remaining_time": "16:14:37", "throughput": 1604.7, "total_tokens": 76759040} -{"current_steps": 9380, "total_steps": 20825, "loss": 0.8608, "learning_rate": 3.1011736400892175e-05, "epoch": 0.4504201680672269, "percentage": 45.04, "elapsed_time": "13:18:07", "remaining_time": "16:13:49", "throughput": 1604.63, "total_tokens": 76840960} -{"current_steps": 9390, "total_steps": 20825, "loss": 0.7893, "learning_rate": 3.097327479594707e-05, "epoch": 0.4509003601440576, "percentage": 45.09, "elapsed_time": "13:19:01", "remaining_time": "16:13:01", "throughput": 1604.53, "total_tokens": 76922880} -{"current_steps": 9400, "total_steps": 20825, "loss": 0.935, "learning_rate": 3.093479819119198e-05, "epoch": 0.45138055222088835, "percentage": 45.14, "elapsed_time": "13:19:54", "remaining_time": "16:12:14", "throughput": 1604.44, "total_tokens": 77004800} -{"current_steps": 9410, "total_steps": 20825, "loss": 0.92, "learning_rate": 3.089630668324759e-05, "epoch": 0.4518607442977191, "percentage": 45.19, "elapsed_time": "13:20:48", "remaining_time": "16:11:26", "throughput": 1604.36, "total_tokens": 77086720} -{"current_steps": 9420, "total_steps": 20825, "loss": 0.8323, "learning_rate": 3.085780036877197e-05, "epoch": 0.4523409363745498, "percentage": 45.23, "elapsed_time": "13:21:41", "remaining_time": "16:10:37", "throughput": 1604.29, "total_tokens": 77168640} -{"current_steps": 9430, "total_steps": 20825, "loss": 0.8059, "learning_rate": 3.0819279344460396e-05, "epoch": 0.45282112845138056, "percentage": 45.28, "elapsed_time": "13:22:35", "remaining_time": "16:09:50", "throughput": 1604.19, "total_tokens": 77250560} -{"current_steps": 9440, "total_steps": 20825, "loss": 0.9285, "learning_rate": 3.078074370704507e-05, "epoch": 0.45330132052821126, "percentage": 45.33, "elapsed_time": "13:23:28", "remaining_time": "16:09:01", "throughput": 1604.12, "total_tokens": 77332480} -{"current_steps": 9450, "total_steps": 20825, "loss": 0.8807, "learning_rate": 3.07421935532949e-05, "epoch": 0.453781512605042, "percentage": 45.38, "elapsed_time": "13:24:21", "remaining_time": "16:08:13", "throughput": 1604.05, "total_tokens": 77414400} -{"current_steps": 9460, "total_steps": 20825, "loss": 0.9211, "learning_rate": 3.0703628980015214e-05, "epoch": 0.45426170468187277, "percentage": 45.43, "elapsed_time": "13:25:15", "remaining_time": "16:07:24", "throughput": 1603.97, "total_tokens": 77496320} -{"current_steps": 9470, "total_steps": 20825, "loss": 0.8221, "learning_rate": 3.0665050084047605e-05, "epoch": 0.45474189675870347, "percentage": 45.47, "elapsed_time": "13:26:08", "remaining_time": "16:06:36", "throughput": 1603.89, "total_tokens": 77578240} -{"current_steps": 9480, "total_steps": 20825, "loss": 0.7467, "learning_rate": 3.062645696226959e-05, "epoch": 0.4552220888355342, "percentage": 45.52, "elapsed_time": "13:27:02", "remaining_time": "16:05:48", "throughput": 1603.82, "total_tokens": 77660160} -{"current_steps": 9490, "total_steps": 20825, "loss": 0.982, "learning_rate": 3.0587849711594425e-05, "epoch": 0.4557022809123649, "percentage": 45.57, "elapsed_time": "13:27:55", "remaining_time": "16:05:00", "throughput": 1603.73, "total_tokens": 77742080} -{"current_steps": 9500, "total_steps": 20825, "loss": 0.863, "learning_rate": 3.054922842897084e-05, "epoch": 0.4561824729891957, "percentage": 45.62, "elapsed_time": "13:28:48", "remaining_time": "16:04:11", "throughput": 1603.66, "total_tokens": 77824000} -{"current_steps": 9510, "total_steps": 20825, "loss": 1.0322, "learning_rate": 3.051059321138281e-05, "epoch": 0.45666266506602643, "percentage": 45.67, "elapsed_time": "13:29:42", "remaining_time": "16:03:23", "throughput": 1603.59, "total_tokens": 77905920} -{"current_steps": 9520, "total_steps": 20825, "loss": 0.9702, "learning_rate": 3.047194415584929e-05, "epoch": 0.45714285714285713, "percentage": 45.71, "elapsed_time": "13:30:35", "remaining_time": "16:02:34", "throughput": 1603.51, "total_tokens": 77987840} -{"current_steps": 9530, "total_steps": 20825, "loss": 0.9051, "learning_rate": 3.0433281359424008e-05, "epoch": 0.4576230492196879, "percentage": 45.76, "elapsed_time": "13:31:29", "remaining_time": "16:01:46", "throughput": 1603.42, "total_tokens": 78069760} -{"current_steps": 9540, "total_steps": 20825, "loss": 0.785, "learning_rate": 3.0394604919195156e-05, "epoch": 0.4581032412965186, "percentage": 45.81, "elapsed_time": "13:32:22", "remaining_time": "16:00:58", "throughput": 1603.36, "total_tokens": 78151680} -{"current_steps": 9550, "total_steps": 20825, "loss": 0.9501, "learning_rate": 3.0355914932285228e-05, "epoch": 0.45858343337334934, "percentage": 45.86, "elapsed_time": "13:33:15", "remaining_time": "16:00:09", "throughput": 1603.28, "total_tokens": 78233600} -{"current_steps": 9560, "total_steps": 20825, "loss": 0.8565, "learning_rate": 3.0317211495850717e-05, "epoch": 0.4590636254501801, "percentage": 45.91, "elapsed_time": "13:34:09", "remaining_time": "15:59:21", "throughput": 1603.21, "total_tokens": 78315520} -{"current_steps": 9570, "total_steps": 20825, "loss": 0.7823, "learning_rate": 3.02784947070819e-05, "epoch": 0.4595438175270108, "percentage": 45.95, "elapsed_time": "13:35:02", "remaining_time": "15:58:32", "throughput": 1603.14, "total_tokens": 78397440} -{"current_steps": 9580, "total_steps": 20825, "loss": 0.9049, "learning_rate": 3.0239764663202562e-05, "epoch": 0.46002400960384154, "percentage": 46.0, "elapsed_time": "13:35:55", "remaining_time": "15:57:44", "throughput": 1603.07, "total_tokens": 78479360} -{"current_steps": 9590, "total_steps": 20825, "loss": 0.9584, "learning_rate": 3.0201021461469803e-05, "epoch": 0.46050420168067224, "percentage": 46.05, "elapsed_time": "13:36:49", "remaining_time": "15:56:55", "throughput": 1602.99, "total_tokens": 78561280} -{"current_steps": 9600, "total_steps": 20825, "loss": 0.8946, "learning_rate": 3.0162265199173738e-05, "epoch": 0.460984393757503, "percentage": 46.1, "elapsed_time": "13:37:42", "remaining_time": "15:56:07", "throughput": 1602.91, "total_tokens": 78643200} -{"current_steps": 9610, "total_steps": 20825, "loss": 0.973, "learning_rate": 3.0123495973637305e-05, "epoch": 0.46146458583433375, "percentage": 46.15, "elapsed_time": "13:38:36", "remaining_time": "15:55:19", "throughput": 1602.84, "total_tokens": 78725120} -{"current_steps": 9620, "total_steps": 20825, "loss": 0.8953, "learning_rate": 3.008471388221597e-05, "epoch": 0.46194477791116445, "percentage": 46.19, "elapsed_time": "13:39:29", "remaining_time": "15:54:30", "throughput": 1602.77, "total_tokens": 78807040} -{"current_steps": 9630, "total_steps": 20825, "loss": 0.7189, "learning_rate": 3.0045919022297524e-05, "epoch": 0.4624249699879952, "percentage": 46.24, "elapsed_time": "13:40:22", "remaining_time": "15:53:41", "throughput": 1602.7, "total_tokens": 78888960} -{"current_steps": 9640, "total_steps": 20825, "loss": 0.8521, "learning_rate": 3.0007111491301816e-05, "epoch": 0.4629051620648259, "percentage": 46.29, "elapsed_time": "13:41:15", "remaining_time": "15:52:53", "throughput": 1602.63, "total_tokens": 78970880} -{"current_steps": 9650, "total_steps": 20825, "loss": 0.941, "learning_rate": 2.9968291386680503e-05, "epoch": 0.46338535414165666, "percentage": 46.34, "elapsed_time": "13:42:09", "remaining_time": "15:52:04", "throughput": 1602.56, "total_tokens": 79052800} -{"current_steps": 9660, "total_steps": 20825, "loss": 1.0642, "learning_rate": 2.9929458805916837e-05, "epoch": 0.4638655462184874, "percentage": 46.39, "elapsed_time": "13:43:02", "remaining_time": "15:51:16", "throughput": 1602.47, "total_tokens": 79134720} -{"current_steps": 9670, "total_steps": 20825, "loss": 0.7306, "learning_rate": 2.9890613846525395e-05, "epoch": 0.4643457382953181, "percentage": 46.43, "elapsed_time": "13:43:56", "remaining_time": "15:50:27", "throughput": 1602.41, "total_tokens": 79216640} -{"current_steps": 9680, "total_steps": 20825, "loss": 0.8926, "learning_rate": 2.9851756606051817e-05, "epoch": 0.46482593037214887, "percentage": 46.48, "elapsed_time": "13:44:49", "remaining_time": "15:49:39", "throughput": 1602.34, "total_tokens": 79298560} -{"current_steps": 9690, "total_steps": 20825, "loss": 0.9238, "learning_rate": 2.9812887182072607e-05, "epoch": 0.46530612244897956, "percentage": 46.53, "elapsed_time": "13:45:42", "remaining_time": "15:48:50", "throughput": 1602.27, "total_tokens": 79380480} -{"current_steps": 9700, "total_steps": 20825, "loss": 0.8351, "learning_rate": 2.9774005672194854e-05, "epoch": 0.4657863145258103, "percentage": 46.58, "elapsed_time": "13:46:35", "remaining_time": "15:48:01", "throughput": 1602.2, "total_tokens": 79462400} -{"current_steps": 9710, "total_steps": 20825, "loss": 0.8861, "learning_rate": 2.9735112174056006e-05, "epoch": 0.4662665066026411, "percentage": 46.63, "elapsed_time": "13:47:28", "remaining_time": "15:47:12", "throughput": 1602.14, "total_tokens": 79544320} -{"current_steps": 9720, "total_steps": 20825, "loss": 0.8593, "learning_rate": 2.96962067853236e-05, "epoch": 0.46674669867947177, "percentage": 46.67, "elapsed_time": "13:48:21", "remaining_time": "15:46:23", "throughput": 1602.08, "total_tokens": 79626240} -{"current_steps": 9730, "total_steps": 20825, "loss": 0.8369, "learning_rate": 2.9657289603695037e-05, "epoch": 0.4672268907563025, "percentage": 46.72, "elapsed_time": "13:49:15", "remaining_time": "15:45:35", "throughput": 1602.01, "total_tokens": 79708160} -{"current_steps": 9740, "total_steps": 20825, "loss": 1.3, "learning_rate": 2.9618360726897344e-05, "epoch": 0.4677070828331333, "percentage": 46.77, "elapsed_time": "13:50:08", "remaining_time": "15:44:46", "throughput": 1601.94, "total_tokens": 79790080} -{"current_steps": 9750, "total_steps": 20825, "loss": 0.9522, "learning_rate": 2.957942025268689e-05, "epoch": 0.468187274909964, "percentage": 46.82, "elapsed_time": "13:51:02", "remaining_time": "15:43:58", "throughput": 1601.85, "total_tokens": 79872000} -{"current_steps": 9760, "total_steps": 20825, "loss": 0.8728, "learning_rate": 2.9540468278849208e-05, "epoch": 0.46866746698679473, "percentage": 46.87, "elapsed_time": "13:51:55", "remaining_time": "15:43:09", "throughput": 1601.79, "total_tokens": 79953920} -{"current_steps": 9770, "total_steps": 20825, "loss": 0.8798, "learning_rate": 2.950150490319866e-05, "epoch": 0.46914765906362543, "percentage": 46.91, "elapsed_time": "13:52:48", "remaining_time": "15:42:21", "throughput": 1601.71, "total_tokens": 80035840} -{"current_steps": 9780, "total_steps": 20825, "loss": 0.9698, "learning_rate": 2.9462530223578273e-05, "epoch": 0.4696278511404562, "percentage": 46.96, "elapsed_time": "13:53:42", "remaining_time": "15:41:32", "throughput": 1601.63, "total_tokens": 80117760} -{"current_steps": 9790, "total_steps": 20825, "loss": 0.8272, "learning_rate": 2.9423544337859454e-05, "epoch": 0.47010804321728694, "percentage": 47.01, "elapsed_time": "13:54:36", "remaining_time": "15:40:44", "throughput": 1601.56, "total_tokens": 80199680} -{"current_steps": 9800, "total_steps": 20825, "loss": 0.8527, "learning_rate": 2.938454734394174e-05, "epoch": 0.47058823529411764, "percentage": 47.06, "elapsed_time": "13:55:29", "remaining_time": "15:39:55", "throughput": 1601.49, "total_tokens": 80281600} -{"current_steps": 9810, "total_steps": 20825, "loss": 0.9777, "learning_rate": 2.9345539339752575e-05, "epoch": 0.4710684273709484, "percentage": 47.11, "elapsed_time": "13:56:22", "remaining_time": "15:39:06", "throughput": 1601.42, "total_tokens": 80363520} -{"current_steps": 9820, "total_steps": 20825, "loss": 0.8295, "learning_rate": 2.9306520423247045e-05, "epoch": 0.4715486194477791, "percentage": 47.15, "elapsed_time": "13:57:16", "remaining_time": "15:38:18", "throughput": 1601.34, "total_tokens": 80445440} -{"current_steps": 9830, "total_steps": 20825, "loss": 0.9394, "learning_rate": 2.9267490692407635e-05, "epoch": 0.47202881152460985, "percentage": 47.2, "elapsed_time": "13:58:10", "remaining_time": "15:37:30", "throughput": 1601.26, "total_tokens": 80527360} -{"current_steps": 9840, "total_steps": 20825, "loss": 0.9649, "learning_rate": 2.9228450245243993e-05, "epoch": 0.4725090036014406, "percentage": 47.25, "elapsed_time": "13:59:03", "remaining_time": "15:36:41", "throughput": 1601.2, "total_tokens": 80609280} -{"current_steps": 9850, "total_steps": 20825, "loss": 1.1218, "learning_rate": 2.9189399179792676e-05, "epoch": 0.4729891956782713, "percentage": 47.3, "elapsed_time": "13:59:56", "remaining_time": "15:35:52", "throughput": 1601.12, "total_tokens": 80691200} -{"current_steps": 9860, "total_steps": 20825, "loss": 0.9087, "learning_rate": 2.9150337594116904e-05, "epoch": 0.47346938775510206, "percentage": 47.35, "elapsed_time": "14:00:50", "remaining_time": "15:35:04", "throughput": 1601.04, "total_tokens": 80773120} -{"current_steps": 9870, "total_steps": 20825, "loss": 0.849, "learning_rate": 2.9111265586306314e-05, "epoch": 0.47394957983193275, "percentage": 47.39, "elapsed_time": "14:01:43", "remaining_time": "15:34:15", "throughput": 1600.97, "total_tokens": 80855040} -{"current_steps": 9880, "total_steps": 20825, "loss": 0.8285, "learning_rate": 2.9072183254476713e-05, "epoch": 0.4744297719087635, "percentage": 47.44, "elapsed_time": "14:02:36", "remaining_time": "15:33:26", "throughput": 1600.91, "total_tokens": 80936960} -{"current_steps": 9890, "total_steps": 20825, "loss": 0.9502, "learning_rate": 2.903309069676984e-05, "epoch": 0.47490996398559426, "percentage": 47.49, "elapsed_time": "14:03:30", "remaining_time": "15:32:37", "throughput": 1600.84, "total_tokens": 81018880} -{"current_steps": 9900, "total_steps": 20825, "loss": 0.8596, "learning_rate": 2.8993988011353112e-05, "epoch": 0.47539015606242496, "percentage": 47.54, "elapsed_time": "14:04:23", "remaining_time": "15:31:48", "throughput": 1600.78, "total_tokens": 81100800} -{"current_steps": 9910, "total_steps": 20825, "loss": 0.8992, "learning_rate": 2.8954875296419364e-05, "epoch": 0.4758703481392557, "percentage": 47.59, "elapsed_time": "14:05:16", "remaining_time": "15:30:59", "throughput": 1600.72, "total_tokens": 81182720} -{"current_steps": 9920, "total_steps": 20825, "loss": 0.9792, "learning_rate": 2.8915752650186635e-05, "epoch": 0.4763505402160864, "percentage": 47.64, "elapsed_time": "14:06:10", "remaining_time": "15:30:11", "throughput": 1600.63, "total_tokens": 81264640} -{"current_steps": 9930, "total_steps": 20825, "loss": 0.7938, "learning_rate": 2.8876620170897895e-05, "epoch": 0.47683073229291717, "percentage": 47.68, "elapsed_time": "14:07:03", "remaining_time": "15:29:22", "throughput": 1600.56, "total_tokens": 81346560} -{"current_steps": 9940, "total_steps": 20825, "loss": 0.8632, "learning_rate": 2.88374779568208e-05, "epoch": 0.4773109243697479, "percentage": 47.73, "elapsed_time": "14:07:57", "remaining_time": "15:28:34", "throughput": 1600.49, "total_tokens": 81428480} -{"current_steps": 9950, "total_steps": 20825, "loss": 0.8698, "learning_rate": 2.879832610624747e-05, "epoch": 0.4777911164465786, "percentage": 47.78, "elapsed_time": "14:08:50", "remaining_time": "15:27:45", "throughput": 1600.43, "total_tokens": 81510400} -{"current_steps": 9960, "total_steps": 20825, "loss": 0.8159, "learning_rate": 2.8759164717494202e-05, "epoch": 0.4782713085234094, "percentage": 47.83, "elapsed_time": "14:09:43", "remaining_time": "15:26:56", "throughput": 1600.36, "total_tokens": 81592320} -{"current_steps": 9970, "total_steps": 20825, "loss": 1.0499, "learning_rate": 2.8719993888901258e-05, "epoch": 0.4787515006002401, "percentage": 47.88, "elapsed_time": "14:10:36", "remaining_time": "15:26:07", "throughput": 1600.3, "total_tokens": 81674240} -{"current_steps": 9980, "total_steps": 20825, "loss": 0.8724, "learning_rate": 2.86808137188326e-05, "epoch": 0.47923169267707083, "percentage": 47.92, "elapsed_time": "14:11:30", "remaining_time": "15:25:18", "throughput": 1600.23, "total_tokens": 81756160} -{"current_steps": 9990, "total_steps": 20825, "loss": 0.9881, "learning_rate": 2.8641624305675657e-05, "epoch": 0.4797118847539016, "percentage": 47.97, "elapsed_time": "14:12:23", "remaining_time": "15:24:29", "throughput": 1600.18, "total_tokens": 81838080} -{"current_steps": 10000, "total_steps": 20825, "loss": 0.7335, "learning_rate": 2.8602425747841057e-05, "epoch": 0.4801920768307323, "percentage": 48.02, "elapsed_time": "14:13:16", "remaining_time": "15:23:40", "throughput": 1600.11, "total_tokens": 81920000} -{"current_steps": 10010, "total_steps": 20825, "loss": 0.8356, "learning_rate": 2.8563218143762383e-05, "epoch": 0.48067226890756304, "percentage": 48.07, "elapsed_time": "14:14:12", "remaining_time": "15:22:54", "throughput": 1599.95, "total_tokens": 82001920} -{"current_steps": 10020, "total_steps": 20825, "loss": 0.8458, "learning_rate": 2.852400159189597e-05, "epoch": 0.48115246098439374, "percentage": 48.12, "elapsed_time": "14:15:06", "remaining_time": "15:22:05", "throughput": 1599.88, "total_tokens": 82083840} -{"current_steps": 10030, "total_steps": 20825, "loss": 0.995, "learning_rate": 2.848477619072059e-05, "epoch": 0.4816326530612245, "percentage": 48.16, "elapsed_time": "14:15:59", "remaining_time": "15:21:16", "throughput": 1599.81, "total_tokens": 82165760} -{"current_steps": 10040, "total_steps": 20825, "loss": 1.0218, "learning_rate": 2.8445542038737245e-05, "epoch": 0.48211284513805525, "percentage": 48.21, "elapsed_time": "14:16:52", "remaining_time": "15:20:28", "throughput": 1599.74, "total_tokens": 82247680} -{"current_steps": 10050, "total_steps": 20825, "loss": 0.9613, "learning_rate": 2.8406299234468915e-05, "epoch": 0.48259303721488594, "percentage": 48.26, "elapsed_time": "14:17:46", "remaining_time": "15:19:39", "throughput": 1599.67, "total_tokens": 82329600} -{"current_steps": 10060, "total_steps": 20825, "loss": 1.0402, "learning_rate": 2.8367047876460305e-05, "epoch": 0.4830732292917167, "percentage": 48.31, "elapsed_time": "14:18:40", "remaining_time": "15:18:50", "throughput": 1599.59, "total_tokens": 82411520} -{"current_steps": 10070, "total_steps": 20825, "loss": 0.9294, "learning_rate": 2.8327788063277594e-05, "epoch": 0.4835534213685474, "percentage": 48.36, "elapsed_time": "14:19:33", "remaining_time": "15:18:01", "throughput": 1599.53, "total_tokens": 82493440} -{"current_steps": 10080, "total_steps": 20825, "loss": 0.8672, "learning_rate": 2.8288519893508212e-05, "epoch": 0.48403361344537815, "percentage": 48.4, "elapsed_time": "14:20:26", "remaining_time": "15:17:12", "throughput": 1599.47, "total_tokens": 82575360} -{"current_steps": 10090, "total_steps": 20825, "loss": 0.8052, "learning_rate": 2.8249243465760566e-05, "epoch": 0.4845138055222089, "percentage": 48.45, "elapsed_time": "14:21:20", "remaining_time": "15:16:24", "throughput": 1599.39, "total_tokens": 82657280} -{"current_steps": 10100, "total_steps": 20825, "loss": 0.8885, "learning_rate": 2.8209958878663778e-05, "epoch": 0.4849939975990396, "percentage": 48.5, "elapsed_time": "14:22:13", "remaining_time": "15:15:35", "throughput": 1599.33, "total_tokens": 82739200} -{"current_steps": 10110, "total_steps": 20825, "loss": 0.8561, "learning_rate": 2.817066623086748e-05, "epoch": 0.48547418967587036, "percentage": 48.55, "elapsed_time": "14:23:07", "remaining_time": "15:14:46", "throughput": 1599.26, "total_tokens": 82821120} -{"current_steps": 10120, "total_steps": 20825, "loss": 0.8841, "learning_rate": 2.813136562104155e-05, "epoch": 0.48595438175270106, "percentage": 48.6, "elapsed_time": "14:23:59", "remaining_time": "15:13:56", "throughput": 1599.21, "total_tokens": 82903040} -{"current_steps": 10130, "total_steps": 20825, "loss": 0.9224, "learning_rate": 2.8092057147875856e-05, "epoch": 0.4864345738295318, "percentage": 48.64, "elapsed_time": "14:24:52", "remaining_time": "15:13:07", "throughput": 1599.16, "total_tokens": 82984960} -{"current_steps": 10140, "total_steps": 20825, "loss": 0.9768, "learning_rate": 2.8052740910079994e-05, "epoch": 0.48691476590636257, "percentage": 48.69, "elapsed_time": "14:25:45", "remaining_time": "15:12:17", "throughput": 1599.1, "total_tokens": 83066880} -{"current_steps": 10150, "total_steps": 20825, "loss": 0.9255, "learning_rate": 2.8013417006383076e-05, "epoch": 0.48739495798319327, "percentage": 48.74, "elapsed_time": "14:26:39", "remaining_time": "15:11:29", "throughput": 1599.03, "total_tokens": 83148800} -{"current_steps": 10160, "total_steps": 20825, "loss": 0.8565, "learning_rate": 2.7974085535533473e-05, "epoch": 0.487875150060024, "percentage": 48.79, "elapsed_time": "14:27:33", "remaining_time": "15:10:40", "throughput": 1598.96, "total_tokens": 83230720} -{"current_steps": 10170, "total_steps": 20825, "loss": 1.0491, "learning_rate": 2.7934746596298535e-05, "epoch": 0.4883553421368547, "percentage": 48.84, "elapsed_time": "14:28:26", "remaining_time": "15:09:51", "throughput": 1598.9, "total_tokens": 83312640} -{"current_steps": 10180, "total_steps": 20825, "loss": 0.8835, "learning_rate": 2.789540028746438e-05, "epoch": 0.4888355342136855, "percentage": 48.88, "elapsed_time": "14:29:19", "remaining_time": "15:09:02", "throughput": 1598.84, "total_tokens": 83394560} -{"current_steps": 10190, "total_steps": 20825, "loss": 0.9588, "learning_rate": 2.785604670783563e-05, "epoch": 0.48931572629051623, "percentage": 48.93, "elapsed_time": "14:30:12", "remaining_time": "15:08:12", "throughput": 1598.77, "total_tokens": 83476480} -{"current_steps": 10200, "total_steps": 20825, "loss": 0.7832, "learning_rate": 2.7816685956235165e-05, "epoch": 0.4897959183673469, "percentage": 48.98, "elapsed_time": "14:31:06", "remaining_time": "15:07:23", "throughput": 1598.71, "total_tokens": 83558400} -{"current_steps": 10210, "total_steps": 20825, "loss": 0.9374, "learning_rate": 2.7777318131503873e-05, "epoch": 0.4902761104441777, "percentage": 49.03, "elapsed_time": "14:31:59", "remaining_time": "15:06:35", "throughput": 1598.63, "total_tokens": 83640320} -{"current_steps": 10220, "total_steps": 20825, "loss": 0.767, "learning_rate": 2.773794333250041e-05, "epoch": 0.4907563025210084, "percentage": 49.08, "elapsed_time": "14:32:53", "remaining_time": "15:05:46", "throughput": 1598.57, "total_tokens": 83722240} -{"current_steps": 10230, "total_steps": 20825, "loss": 0.9588, "learning_rate": 2.769856165810093e-05, "epoch": 0.49123649459783914, "percentage": 49.12, "elapsed_time": "14:33:46", "remaining_time": "15:04:57", "throughput": 1598.5, "total_tokens": 83804160} -{"current_steps": 10240, "total_steps": 20825, "loss": 0.929, "learning_rate": 2.765917320719887e-05, "epoch": 0.4917166866746699, "percentage": 49.17, "elapsed_time": "14:34:40", "remaining_time": "15:04:08", "throughput": 1598.44, "total_tokens": 83886080} -{"current_steps": 10250, "total_steps": 20825, "loss": 0.8619, "learning_rate": 2.7619778078704685e-05, "epoch": 0.4921968787515006, "percentage": 49.22, "elapsed_time": "14:35:33", "remaining_time": "15:03:18", "throughput": 1598.38, "total_tokens": 83968000} -{"current_steps": 10260, "total_steps": 20825, "loss": 0.7223, "learning_rate": 2.7580376371545573e-05, "epoch": 0.49267707082833134, "percentage": 49.27, "elapsed_time": "14:36:26", "remaining_time": "15:02:29", "throughput": 1598.32, "total_tokens": 84049920} -{"current_steps": 10270, "total_steps": 20825, "loss": 0.8415, "learning_rate": 2.7540968184665283e-05, "epoch": 0.49315726290516204, "percentage": 49.32, "elapsed_time": "14:37:19", "remaining_time": "15:01:40", "throughput": 1598.26, "total_tokens": 84131840} -{"current_steps": 10280, "total_steps": 20825, "loss": 0.9001, "learning_rate": 2.7501553617023816e-05, "epoch": 0.4936374549819928, "percentage": 49.36, "elapsed_time": "14:38:12", "remaining_time": "15:00:51", "throughput": 1598.2, "total_tokens": 84213760} -{"current_steps": 10290, "total_steps": 20825, "loss": 0.8124, "learning_rate": 2.7462132767597205e-05, "epoch": 0.49411764705882355, "percentage": 49.41, "elapsed_time": "14:39:05", "remaining_time": "15:00:01", "throughput": 1598.14, "total_tokens": 84295680} -{"current_steps": 10300, "total_steps": 20825, "loss": 0.8611, "learning_rate": 2.742270573537724e-05, "epoch": 0.49459783913565425, "percentage": 49.46, "elapsed_time": "14:39:58", "remaining_time": "14:59:12", "throughput": 1598.09, "total_tokens": 84377600} -{"current_steps": 10310, "total_steps": 20825, "loss": 0.9993, "learning_rate": 2.7383272619371276e-05, "epoch": 0.495078031212485, "percentage": 49.51, "elapsed_time": "14:40:52", "remaining_time": "14:58:23", "throughput": 1598.01, "total_tokens": 84459520} -{"current_steps": 10320, "total_steps": 20825, "loss": 0.8757, "learning_rate": 2.7343833518601913e-05, "epoch": 0.4955582232893157, "percentage": 49.56, "elapsed_time": "14:41:46", "remaining_time": "14:57:34", "throughput": 1597.95, "total_tokens": 84541440} -{"current_steps": 10330, "total_steps": 20825, "loss": 1.1208, "learning_rate": 2.7304388532106768e-05, "epoch": 0.49603841536614646, "percentage": 49.6, "elapsed_time": "14:42:39", "remaining_time": "14:56:45", "throughput": 1597.89, "total_tokens": 84623360} -{"current_steps": 10340, "total_steps": 20825, "loss": 0.7873, "learning_rate": 2.726493775893828e-05, "epoch": 0.4965186074429772, "percentage": 49.65, "elapsed_time": "14:43:32", "remaining_time": "14:55:56", "throughput": 1597.82, "total_tokens": 84705280} -{"current_steps": 10350, "total_steps": 20825, "loss": 0.9001, "learning_rate": 2.7225481298163387e-05, "epoch": 0.4969987995198079, "percentage": 49.7, "elapsed_time": "14:44:26", "remaining_time": "14:55:06", "throughput": 1597.77, "total_tokens": 84787200} -{"current_steps": 10360, "total_steps": 20825, "loss": 1.0793, "learning_rate": 2.718601924886332e-05, "epoch": 0.49747899159663866, "percentage": 49.75, "elapsed_time": "14:45:19", "remaining_time": "14:54:17", "throughput": 1597.71, "total_tokens": 84869120} -{"current_steps": 10370, "total_steps": 20825, "loss": 0.8888, "learning_rate": 2.7146551710133346e-05, "epoch": 0.49795918367346936, "percentage": 49.8, "elapsed_time": "14:46:12", "remaining_time": "14:53:28", "throughput": 1597.65, "total_tokens": 84951040} -{"current_steps": 10380, "total_steps": 20825, "loss": 0.8732, "learning_rate": 2.7107078781082508e-05, "epoch": 0.4984393757503001, "percentage": 49.84, "elapsed_time": "14:47:06", "remaining_time": "14:52:39", "throughput": 1597.57, "total_tokens": 85032960} -{"current_steps": 10390, "total_steps": 20825, "loss": 0.9422, "learning_rate": 2.7067600560833384e-05, "epoch": 0.49891956782713087, "percentage": 49.89, "elapsed_time": "14:47:59", "remaining_time": "14:51:50", "throughput": 1597.51, "total_tokens": 85114880} -{"current_steps": 10400, "total_steps": 20825, "loss": 0.8577, "learning_rate": 2.7028117148521863e-05, "epoch": 0.49939975990396157, "percentage": 49.94, "elapsed_time": "14:48:53", "remaining_time": "14:51:01", "throughput": 1597.44, "total_tokens": 85196800} -{"current_steps": 10410, "total_steps": 20825, "loss": 0.9081, "learning_rate": 2.698862864329685e-05, "epoch": 0.4998799519807923, "percentage": 49.99, "elapsed_time": "14:49:46", "remaining_time": "14:50:12", "throughput": 1597.37, "total_tokens": 85278720} -{"current_steps": 10420, "total_steps": 20825, "loss": 0.9876, "learning_rate": 2.6949135144320026e-05, "epoch": 0.5003601440576231, "percentage": 50.04, "elapsed_time": "14:50:40", "remaining_time": "14:49:23", "throughput": 1597.32, "total_tokens": 85360640} -{"current_steps": 10430, "total_steps": 20825, "loss": 0.8621, "learning_rate": 2.6909636750765653e-05, "epoch": 0.5008403361344538, "percentage": 50.08, "elapsed_time": "14:51:33", "remaining_time": "14:48:34", "throughput": 1597.25, "total_tokens": 85442560} -{"current_steps": 10440, "total_steps": 20825, "loss": 0.9355, "learning_rate": 2.6870133561820243e-05, "epoch": 0.5013205282112845, "percentage": 50.13, "elapsed_time": "14:52:27", "remaining_time": "14:47:45", "throughput": 1597.18, "total_tokens": 85524480} -{"current_steps": 10450, "total_steps": 20825, "loss": 1.0307, "learning_rate": 2.683062567668238e-05, "epoch": 0.5018007202881153, "percentage": 50.18, "elapsed_time": "14:53:21", "remaining_time": "14:46:56", "throughput": 1597.1, "total_tokens": 85606400} -{"current_steps": 10460, "total_steps": 20825, "loss": 0.8886, "learning_rate": 2.679111319456242e-05, "epoch": 0.502280912364946, "percentage": 50.23, "elapsed_time": "14:54:14", "remaining_time": "14:46:06", "throughput": 1597.05, "total_tokens": 85688320} -{"current_steps": 10470, "total_steps": 20825, "loss": 0.6568, "learning_rate": 2.6751596214682278e-05, "epoch": 0.5027611044417767, "percentage": 50.28, "elapsed_time": "14:55:07", "remaining_time": "14:45:17", "throughput": 1596.99, "total_tokens": 85770240} -{"current_steps": 10480, "total_steps": 20825, "loss": 0.9178, "learning_rate": 2.671207483627515e-05, "epoch": 0.5032412965186075, "percentage": 50.32, "elapsed_time": "14:56:00", "remaining_time": "14:44:28", "throughput": 1596.93, "total_tokens": 85852160} -{"current_steps": 10490, "total_steps": 20825, "loss": 0.832, "learning_rate": 2.6672549158585293e-05, "epoch": 0.5037214885954382, "percentage": 50.37, "elapsed_time": "14:56:54", "remaining_time": "14:43:38", "throughput": 1596.87, "total_tokens": 85934080} -{"current_steps": 10500, "total_steps": 20825, "loss": 0.7443, "learning_rate": 2.663301928086774e-05, "epoch": 0.5042016806722689, "percentage": 50.42, "elapsed_time": "14:57:47", "remaining_time": "14:42:50", "throughput": 1596.8, "total_tokens": 86016000} -{"current_steps": 10510, "total_steps": 20825, "loss": 0.8535, "learning_rate": 2.6593485302388087e-05, "epoch": 0.5046818727490996, "percentage": 50.47, "elapsed_time": "14:58:40", "remaining_time": "14:42:00", "throughput": 1596.74, "total_tokens": 86097920} -{"current_steps": 10520, "total_steps": 20825, "loss": 0.9447, "learning_rate": 2.6553947322422223e-05, "epoch": 0.5051620648259304, "percentage": 50.52, "elapsed_time": "14:59:34", "remaining_time": "14:41:10", "throughput": 1596.69, "total_tokens": 86179840} -{"current_steps": 10530, "total_steps": 20825, "loss": 0.8657, "learning_rate": 2.6514405440256086e-05, "epoch": 0.5056422569027611, "percentage": 50.56, "elapsed_time": "15:00:27", "remaining_time": "14:40:21", "throughput": 1596.64, "total_tokens": 86261760} -{"current_steps": 10540, "total_steps": 20825, "loss": 0.9218, "learning_rate": 2.6474859755185415e-05, "epoch": 0.5061224489795918, "percentage": 50.61, "elapsed_time": "15:01:20", "remaining_time": "14:39:31", "throughput": 1596.59, "total_tokens": 86343680} -{"current_steps": 10550, "total_steps": 20825, "loss": 0.9897, "learning_rate": 2.6435310366515498e-05, "epoch": 0.5066026410564226, "percentage": 50.66, "elapsed_time": "15:02:13", "remaining_time": "14:38:42", "throughput": 1596.53, "total_tokens": 86425600} -{"current_steps": 10560, "total_steps": 20825, "loss": 1.0327, "learning_rate": 2.6395757373560904e-05, "epoch": 0.5070828331332533, "percentage": 50.71, "elapsed_time": "15:03:07", "remaining_time": "14:37:53", "throughput": 1596.45, "total_tokens": 86507520} -{"current_steps": 10570, "total_steps": 20825, "loss": 0.9704, "learning_rate": 2.6356200875645287e-05, "epoch": 0.507563025210084, "percentage": 50.76, "elapsed_time": "15:04:00", "remaining_time": "14:37:04", "throughput": 1596.39, "total_tokens": 86589440} -{"current_steps": 10580, "total_steps": 20825, "loss": 0.7818, "learning_rate": 2.631664097210108e-05, "epoch": 0.5080432172869148, "percentage": 50.8, "elapsed_time": "15:04:54", "remaining_time": "14:36:14", "throughput": 1596.33, "total_tokens": 86671360} -{"current_steps": 10590, "total_steps": 20825, "loss": 0.717, "learning_rate": 2.6277077762269276e-05, "epoch": 0.5085234093637455, "percentage": 50.85, "elapsed_time": "15:05:47", "remaining_time": "14:35:25", "throughput": 1596.26, "total_tokens": 86753280} -{"current_steps": 10600, "total_steps": 20825, "loss": 0.8514, "learning_rate": 2.6237511345499167e-05, "epoch": 0.5090036014405762, "percentage": 50.9, "elapsed_time": "15:06:40", "remaining_time": "14:34:36", "throughput": 1596.21, "total_tokens": 86835200} -{"current_steps": 10610, "total_steps": 20825, "loss": 0.8897, "learning_rate": 2.61979418211481e-05, "epoch": 0.5094837935174069, "percentage": 50.95, "elapsed_time": "15:07:33", "remaining_time": "14:33:46", "throughput": 1596.16, "total_tokens": 86917120} -{"current_steps": 10620, "total_steps": 20825, "loss": 0.9499, "learning_rate": 2.615836928858122e-05, "epoch": 0.5099639855942377, "percentage": 51.0, "elapsed_time": "15:08:27", "remaining_time": "14:32:57", "throughput": 1596.1, "total_tokens": 86999040} -{"current_steps": 10630, "total_steps": 20825, "loss": 0.7749, "learning_rate": 2.6118793847171236e-05, "epoch": 0.5104441776710684, "percentage": 51.04, "elapsed_time": "15:09:20", "remaining_time": "14:32:07", "throughput": 1596.05, "total_tokens": 87080960} -{"current_steps": 10640, "total_steps": 20825, "loss": 1.0117, "learning_rate": 2.607921559629816e-05, "epoch": 0.5109243697478991, "percentage": 51.09, "elapsed_time": "15:10:13", "remaining_time": "14:31:18", "throughput": 1595.99, "total_tokens": 87162880} -{"current_steps": 10650, "total_steps": 20825, "loss": 0.9039, "learning_rate": 2.6039634635349043e-05, "epoch": 0.5114045618247299, "percentage": 51.14, "elapsed_time": "15:11:06", "remaining_time": "14:30:28", "throughput": 1595.94, "total_tokens": 87244800} -{"current_steps": 10660, "total_steps": 20825, "loss": 0.8813, "learning_rate": 2.6000051063717767e-05, "epoch": 0.5118847539015606, "percentage": 51.19, "elapsed_time": "15:11:59", "remaining_time": "14:29:38", "throughput": 1595.89, "total_tokens": 87326720} -{"current_steps": 10670, "total_steps": 20825, "loss": 0.856, "learning_rate": 2.596046498080475e-05, "epoch": 0.5123649459783913, "percentage": 51.24, "elapsed_time": "15:12:53", "remaining_time": "14:28:49", "throughput": 1595.83, "total_tokens": 87408640} -{"current_steps": 10680, "total_steps": 20825, "loss": 0.9129, "learning_rate": 2.5920876486016726e-05, "epoch": 0.5128451380552221, "percentage": 51.28, "elapsed_time": "15:13:46", "remaining_time": "14:27:59", "throughput": 1595.78, "total_tokens": 87490560} -{"current_steps": 10690, "total_steps": 20825, "loss": 0.8935, "learning_rate": 2.5881285678766482e-05, "epoch": 0.5133253301320528, "percentage": 51.33, "elapsed_time": "15:14:39", "remaining_time": "14:27:09", "throughput": 1595.74, "total_tokens": 87572480} -{"current_steps": 10700, "total_steps": 20825, "loss": 0.8172, "learning_rate": 2.5841692658472617e-05, "epoch": 0.5138055222088835, "percentage": 51.38, "elapsed_time": "15:15:32", "remaining_time": "14:26:20", "throughput": 1595.68, "total_tokens": 87654400} -{"current_steps": 10710, "total_steps": 20825, "loss": 1.0935, "learning_rate": 2.5802097524559264e-05, "epoch": 0.5142857142857142, "percentage": 51.43, "elapsed_time": "15:16:25", "remaining_time": "14:25:30", "throughput": 1595.62, "total_tokens": 87736320} -{"current_steps": 10720, "total_steps": 20825, "loss": 0.8728, "learning_rate": 2.5762500376455912e-05, "epoch": 0.514765906362545, "percentage": 51.48, "elapsed_time": "15:17:18", "remaining_time": "14:24:41", "throughput": 1595.57, "total_tokens": 87818240} -{"current_steps": 10730, "total_steps": 20825, "loss": 0.8416, "learning_rate": 2.5722901313597052e-05, "epoch": 0.5152460984393757, "percentage": 51.52, "elapsed_time": "15:18:11", "remaining_time": "14:23:51", "throughput": 1595.52, "total_tokens": 87900160} -{"current_steps": 10740, "total_steps": 20825, "loss": 0.8828, "learning_rate": 2.5683300435422032e-05, "epoch": 0.5157262905162064, "percentage": 51.57, "elapsed_time": "15:19:05", "remaining_time": "14:23:02", "throughput": 1595.45, "total_tokens": 87982080} -{"current_steps": 10750, "total_steps": 20825, "loss": 0.8147, "learning_rate": 2.564369784137472e-05, "epoch": 0.5162064825930373, "percentage": 51.62, "elapsed_time": "15:19:58", "remaining_time": "14:22:12", "throughput": 1595.39, "total_tokens": 88064000} -{"current_steps": 10760, "total_steps": 20825, "loss": 0.8245, "learning_rate": 2.5604093630903307e-05, "epoch": 0.516686674669868, "percentage": 51.67, "elapsed_time": "15:20:51", "remaining_time": "14:21:23", "throughput": 1595.35, "total_tokens": 88145920} -{"current_steps": 10770, "total_steps": 20825, "loss": 0.7478, "learning_rate": 2.556448790346006e-05, "epoch": 0.5171668667466987, "percentage": 51.72, "elapsed_time": "15:21:45", "remaining_time": "14:20:33", "throughput": 1595.29, "total_tokens": 88227840} -{"current_steps": 10780, "total_steps": 20825, "loss": 1.0129, "learning_rate": 2.5524880758501035e-05, "epoch": 0.5176470588235295, "percentage": 51.76, "elapsed_time": "15:22:38", "remaining_time": "14:19:44", "throughput": 1595.23, "total_tokens": 88309760} -{"current_steps": 10790, "total_steps": 20825, "loss": 0.9362, "learning_rate": 2.5485272295485846e-05, "epoch": 0.5181272509003602, "percentage": 51.81, "elapsed_time": "15:23:32", "remaining_time": "14:18:54", "throughput": 1595.16, "total_tokens": 88391680} -{"current_steps": 10800, "total_steps": 20825, "loss": 0.756, "learning_rate": 2.544566261387743e-05, "epoch": 0.5186074429771909, "percentage": 51.86, "elapsed_time": "15:24:25", "remaining_time": "14:18:05", "throughput": 1595.11, "total_tokens": 88473600} -{"current_steps": 10810, "total_steps": 20825, "loss": 0.843, "learning_rate": 2.5406051813141773e-05, "epoch": 0.5190876350540216, "percentage": 51.91, "elapsed_time": "15:25:18", "remaining_time": "14:17:15", "throughput": 1595.06, "total_tokens": 88555520} -{"current_steps": 10820, "total_steps": 20825, "loss": 0.8411, "learning_rate": 2.5366439992747688e-05, "epoch": 0.5195678271308524, "percentage": 51.96, "elapsed_time": "15:26:12", "remaining_time": "14:16:26", "throughput": 1595.0, "total_tokens": 88637440} -{"current_steps": 10830, "total_steps": 20825, "loss": 0.8732, "learning_rate": 2.5326827252166523e-05, "epoch": 0.5200480192076831, "percentage": 52.0, "elapsed_time": "15:27:05", "remaining_time": "14:15:37", "throughput": 1594.93, "total_tokens": 88719360} -{"current_steps": 10840, "total_steps": 20825, "loss": 0.8446, "learning_rate": 2.5287213690871957e-05, "epoch": 0.5205282112845138, "percentage": 52.05, "elapsed_time": "15:27:58", "remaining_time": "14:14:47", "throughput": 1594.88, "total_tokens": 88801280} -{"current_steps": 10850, "total_steps": 20825, "loss": 0.8941, "learning_rate": 2.5247599408339723e-05, "epoch": 0.5210084033613446, "percentage": 52.1, "elapsed_time": "15:28:52", "remaining_time": "14:13:57", "throughput": 1594.82, "total_tokens": 88883200} -{"current_steps": 10860, "total_steps": 20825, "loss": 0.8391, "learning_rate": 2.5207984504047365e-05, "epoch": 0.5214885954381753, "percentage": 52.15, "elapsed_time": "15:29:45", "remaining_time": "14:13:08", "throughput": 1594.77, "total_tokens": 88965120} -{"current_steps": 10870, "total_steps": 20825, "loss": 0.7663, "learning_rate": 2.5168369077474004e-05, "epoch": 0.521968787515006, "percentage": 52.2, "elapsed_time": "15:30:38", "remaining_time": "14:12:18", "throughput": 1594.72, "total_tokens": 89047040} -{"current_steps": 10880, "total_steps": 20825, "loss": 0.9436, "learning_rate": 2.512875322810002e-05, "epoch": 0.5224489795918368, "percentage": 52.24, "elapsed_time": "15:31:31", "remaining_time": "14:11:28", "throughput": 1594.67, "total_tokens": 89128960} -{"current_steps": 10890, "total_steps": 20825, "loss": 0.8914, "learning_rate": 2.508913705540693e-05, "epoch": 0.5229291716686675, "percentage": 52.29, "elapsed_time": "15:32:25", "remaining_time": "14:10:38", "throughput": 1594.62, "total_tokens": 89210880} -{"current_steps": 10900, "total_steps": 20825, "loss": 0.8412, "learning_rate": 2.504952065887701e-05, "epoch": 0.5234093637454982, "percentage": 52.34, "elapsed_time": "15:33:18", "remaining_time": "14:09:49", "throughput": 1594.55, "total_tokens": 89292800} -{"current_steps": 10910, "total_steps": 20825, "loss": 0.9038, "learning_rate": 2.5009904137993106e-05, "epoch": 0.5238895558223289, "percentage": 52.39, "elapsed_time": "15:34:12", "remaining_time": "14:09:00", "throughput": 1594.49, "total_tokens": 89374720} -{"current_steps": 10920, "total_steps": 20825, "loss": 1.0436, "learning_rate": 2.497028759223839e-05, "epoch": 0.5243697478991597, "percentage": 52.44, "elapsed_time": "15:35:06", "remaining_time": "14:08:11", "throughput": 1594.42, "total_tokens": 89456640} -{"current_steps": 10930, "total_steps": 20825, "loss": 0.9828, "learning_rate": 2.4930671121096105e-05, "epoch": 0.5248499399759904, "percentage": 52.48, "elapsed_time": "15:35:59", "remaining_time": "14:07:21", "throughput": 1594.38, "total_tokens": 89538560} -{"current_steps": 10940, "total_steps": 20825, "loss": 0.7117, "learning_rate": 2.4891054824049264e-05, "epoch": 0.5253301320528211, "percentage": 52.53, "elapsed_time": "15:36:52", "remaining_time": "14:06:31", "throughput": 1594.32, "total_tokens": 89620480} -{"current_steps": 10950, "total_steps": 20825, "loss": 0.8639, "learning_rate": 2.485143880058049e-05, "epoch": 0.5258103241296519, "percentage": 52.58, "elapsed_time": "15:37:45", "remaining_time": "14:05:41", "throughput": 1594.27, "total_tokens": 89702400} -{"current_steps": 10960, "total_steps": 20825, "loss": 0.8927, "learning_rate": 2.4811823150171692e-05, "epoch": 0.5262905162064826, "percentage": 52.63, "elapsed_time": "15:38:38", "remaining_time": "14:04:51", "throughput": 1594.22, "total_tokens": 89784320} -{"current_steps": 10970, "total_steps": 20825, "loss": 1.0442, "learning_rate": 2.477220797230385e-05, "epoch": 0.5267707082833133, "percentage": 52.68, "elapsed_time": "15:39:31", "remaining_time": "14:04:02", "throughput": 1594.16, "total_tokens": 89866240} -{"current_steps": 10980, "total_steps": 20825, "loss": 1.1357, "learning_rate": 2.4732593366456755e-05, "epoch": 0.5272509003601441, "percentage": 52.73, "elapsed_time": "15:40:26", "remaining_time": "14:03:13", "throughput": 1594.08, "total_tokens": 89948160} -{"current_steps": 10990, "total_steps": 20825, "loss": 0.9067, "learning_rate": 2.4692979432108777e-05, "epoch": 0.5277310924369748, "percentage": 52.77, "elapsed_time": "15:41:20", "remaining_time": "14:02:24", "throughput": 1594.01, "total_tokens": 90030080} -{"current_steps": 11000, "total_steps": 20825, "loss": 1.0397, "learning_rate": 2.4653366268736565e-05, "epoch": 0.5282112845138055, "percentage": 52.82, "elapsed_time": "15:42:13", "remaining_time": "14:01:34", "throughput": 1593.95, "total_tokens": 90112000} -{"current_steps": 11010, "total_steps": 20825, "loss": 0.7986, "learning_rate": 2.461375397581487e-05, "epoch": 0.5286914765906362, "percentage": 52.87, "elapsed_time": "15:43:10", "remaining_time": "14:00:48", "throughput": 1593.8, "total_tokens": 90193920} -{"current_steps": 11020, "total_steps": 20825, "loss": 0.8494, "learning_rate": 2.4574142652816238e-05, "epoch": 0.529171668667467, "percentage": 52.92, "elapsed_time": "15:44:03", "remaining_time": "13:59:58", "throughput": 1593.74, "total_tokens": 90275840} -{"current_steps": 11030, "total_steps": 20825, "loss": 0.75, "learning_rate": 2.453453239921077e-05, "epoch": 0.5296518607442977, "percentage": 52.97, "elapsed_time": "15:44:57", "remaining_time": "13:59:09", "throughput": 1593.68, "total_tokens": 90357760} -{"current_steps": 11040, "total_steps": 20825, "loss": 0.7564, "learning_rate": 2.44949233144659e-05, "epoch": 0.5301320528211284, "percentage": 53.01, "elapsed_time": "15:45:50", "remaining_time": "13:58:19", "throughput": 1593.63, "total_tokens": 90439680} -{"current_steps": 11050, "total_steps": 20825, "loss": 0.8193, "learning_rate": 2.4455315498046134e-05, "epoch": 0.5306122448979592, "percentage": 53.06, "elapsed_time": "15:46:44", "remaining_time": "13:57:29", "throughput": 1593.58, "total_tokens": 90521600} -{"current_steps": 11060, "total_steps": 20825, "loss": 0.8752, "learning_rate": 2.4415709049412757e-05, "epoch": 0.5310924369747899, "percentage": 53.11, "elapsed_time": "15:47:37", "remaining_time": "13:56:40", "throughput": 1593.52, "total_tokens": 90603520} -{"current_steps": 11070, "total_steps": 20825, "loss": 0.8828, "learning_rate": 2.437610406802365e-05, "epoch": 0.5315726290516206, "percentage": 53.16, "elapsed_time": "15:48:30", "remaining_time": "13:55:50", "throughput": 1593.47, "total_tokens": 90685440} -{"current_steps": 11080, "total_steps": 20825, "loss": 0.9908, "learning_rate": 2.4336500653333012e-05, "epoch": 0.5320528211284514, "percentage": 53.21, "elapsed_time": "15:49:24", "remaining_time": "13:55:00", "throughput": 1593.41, "total_tokens": 90767360} -{"current_steps": 11090, "total_steps": 20825, "loss": 0.9681, "learning_rate": 2.4296898904791076e-05, "epoch": 0.5325330132052821, "percentage": 53.25, "elapsed_time": "15:50:17", "remaining_time": "13:54:11", "throughput": 1593.35, "total_tokens": 90849280} -{"current_steps": 11100, "total_steps": 20825, "loss": 0.8629, "learning_rate": 2.425729892184393e-05, "epoch": 0.5330132052821128, "percentage": 53.3, "elapsed_time": "15:51:10", "remaining_time": "13:53:21", "throughput": 1593.3, "total_tokens": 90931200} -{"current_steps": 11110, "total_steps": 20825, "loss": 1.1662, "learning_rate": 2.421770080393321e-05, "epoch": 0.5334933973589436, "percentage": 53.35, "elapsed_time": "15:52:04", "remaining_time": "13:52:31", "throughput": 1593.25, "total_tokens": 91013120} -{"current_steps": 11120, "total_steps": 20825, "loss": 0.9811, "learning_rate": 2.417810465049585e-05, "epoch": 0.5339735894357743, "percentage": 53.4, "elapsed_time": "15:52:57", "remaining_time": "13:51:41", "throughput": 1593.2, "total_tokens": 91095040} -{"current_steps": 11130, "total_steps": 20825, "loss": 0.7801, "learning_rate": 2.413851056096388e-05, "epoch": 0.534453781512605, "percentage": 53.45, "elapsed_time": "15:53:51", "remaining_time": "13:50:52", "throughput": 1593.13, "total_tokens": 91176960} -{"current_steps": 11140, "total_steps": 20825, "loss": 0.8704, "learning_rate": 2.4098918634764153e-05, "epoch": 0.5349339735894357, "percentage": 53.49, "elapsed_time": "15:54:44", "remaining_time": "13:50:02", "throughput": 1593.09, "total_tokens": 91258880} -{"current_steps": 11150, "total_steps": 20825, "loss": 1.0149, "learning_rate": 2.4059328971318053e-05, "epoch": 0.5354141656662665, "percentage": 53.54, "elapsed_time": "15:55:37", "remaining_time": "13:49:12", "throughput": 1593.03, "total_tokens": 91340800} -{"current_steps": 11160, "total_steps": 20825, "loss": 0.9053, "learning_rate": 2.4019741670041305e-05, "epoch": 0.5358943577430972, "percentage": 53.59, "elapsed_time": "15:56:31", "remaining_time": "13:48:22", "throughput": 1592.98, "total_tokens": 91422720} -{"current_steps": 11170, "total_steps": 20825, "loss": 0.966, "learning_rate": 2.398015683034371e-05, "epoch": 0.5363745498199279, "percentage": 53.64, "elapsed_time": "15:57:24", "remaining_time": "13:47:33", "throughput": 1592.92, "total_tokens": 91504640} -{"current_steps": 11180, "total_steps": 20825, "loss": 0.696, "learning_rate": 2.394057455162886e-05, "epoch": 0.5368547418967587, "percentage": 53.69, "elapsed_time": "15:58:18", "remaining_time": "13:46:43", "throughput": 1592.86, "total_tokens": 91586560} -{"current_steps": 11190, "total_steps": 20825, "loss": 0.7898, "learning_rate": 2.3900994933293953e-05, "epoch": 0.5373349339735894, "percentage": 53.73, "elapsed_time": "15:59:11", "remaining_time": "13:45:53", "throughput": 1592.81, "total_tokens": 91668480} -{"current_steps": 11200, "total_steps": 20825, "loss": 0.9175, "learning_rate": 2.3861418074729476e-05, "epoch": 0.5378151260504201, "percentage": 53.78, "elapsed_time": "16:00:04", "remaining_time": "13:45:04", "throughput": 1592.76, "total_tokens": 91750400} -{"current_steps": 11210, "total_steps": 20825, "loss": 0.8275, "learning_rate": 2.3821844075318993e-05, "epoch": 0.538295318127251, "percentage": 53.83, "elapsed_time": "16:00:57", "remaining_time": "13:44:14", "throughput": 1592.71, "total_tokens": 91832320} -{"current_steps": 11220, "total_steps": 20825, "loss": 0.9653, "learning_rate": 2.378227303443889e-05, "epoch": 0.5387755102040817, "percentage": 53.88, "elapsed_time": "16:01:51", "remaining_time": "13:43:24", "throughput": 1592.65, "total_tokens": 91914240} -{"current_steps": 11230, "total_steps": 20825, "loss": 0.8119, "learning_rate": 2.3742705051458145e-05, "epoch": 0.5392557022809124, "percentage": 53.93, "elapsed_time": "16:02:44", "remaining_time": "13:42:34", "throughput": 1592.61, "total_tokens": 91996160} -{"current_steps": 11240, "total_steps": 20825, "loss": 0.9283, "learning_rate": 2.3703140225738017e-05, "epoch": 0.539735894357743, "percentage": 53.97, "elapsed_time": "16:03:37", "remaining_time": "13:41:44", "throughput": 1592.56, "total_tokens": 92078080} -{"current_steps": 11250, "total_steps": 20825, "loss": 0.8144, "learning_rate": 2.3663578656631858e-05, "epoch": 0.5402160864345739, "percentage": 54.02, "elapsed_time": "16:04:30", "remaining_time": "13:40:54", "throughput": 1592.51, "total_tokens": 92160000} -{"current_steps": 11260, "total_steps": 20825, "loss": 0.8041, "learning_rate": 2.362402044348486e-05, "epoch": 0.5406962785114046, "percentage": 54.07, "elapsed_time": "16:05:24", "remaining_time": "13:40:04", "throughput": 1592.46, "total_tokens": 92241920} -{"current_steps": 11270, "total_steps": 20825, "loss": 0.877, "learning_rate": 2.3584465685633738e-05, "epoch": 0.5411764705882353, "percentage": 54.12, "elapsed_time": "16:06:17", "remaining_time": "13:39:14", "throughput": 1592.41, "total_tokens": 92323840} -{"current_steps": 11280, "total_steps": 20825, "loss": 0.8796, "learning_rate": 2.3544914482406592e-05, "epoch": 0.5416566626650661, "percentage": 54.17, "elapsed_time": "16:07:10", "remaining_time": "13:38:24", "throughput": 1592.36, "total_tokens": 92405760} -{"current_steps": 11290, "total_steps": 20825, "loss": 0.8823, "learning_rate": 2.350536693312255e-05, "epoch": 0.5421368547418968, "percentage": 54.21, "elapsed_time": "16:08:04", "remaining_time": "13:37:35", "throughput": 1592.3, "total_tokens": 92487680} -{"current_steps": 11300, "total_steps": 20825, "loss": 0.8294, "learning_rate": 2.3465823137091572e-05, "epoch": 0.5426170468187275, "percentage": 54.26, "elapsed_time": "16:08:57", "remaining_time": "13:36:45", "throughput": 1592.25, "total_tokens": 92569600} -{"current_steps": 11310, "total_steps": 20825, "loss": 0.8574, "learning_rate": 2.3426283193614208e-05, "epoch": 0.5430972388955583, "percentage": 54.31, "elapsed_time": "16:09:51", "remaining_time": "13:35:55", "throughput": 1592.2, "total_tokens": 92651520} -{"current_steps": 11320, "total_steps": 20825, "loss": 1.143, "learning_rate": 2.3386747201981338e-05, "epoch": 0.543577430972389, "percentage": 54.36, "elapsed_time": "16:10:44", "remaining_time": "13:35:05", "throughput": 1592.15, "total_tokens": 92733440} -{"current_steps": 11330, "total_steps": 20825, "loss": 0.8502, "learning_rate": 2.3347215261473887e-05, "epoch": 0.5440576230492197, "percentage": 54.41, "elapsed_time": "16:11:37", "remaining_time": "13:34:15", "throughput": 1592.1, "total_tokens": 92815360} -{"current_steps": 11340, "total_steps": 20825, "loss": 0.9998, "learning_rate": 2.330768747136263e-05, "epoch": 0.5445378151260504, "percentage": 54.45, "elapsed_time": "16:12:31", "remaining_time": "13:33:26", "throughput": 1592.04, "total_tokens": 92897280} -{"current_steps": 11350, "total_steps": 20825, "loss": 0.8627, "learning_rate": 2.3268163930907933e-05, "epoch": 0.5450180072028812, "percentage": 54.5, "elapsed_time": "16:13:24", "remaining_time": "13:32:36", "throughput": 1591.98, "total_tokens": 92979200} -{"current_steps": 11360, "total_steps": 20825, "loss": 0.8115, "learning_rate": 2.3228644739359444e-05, "epoch": 0.5454981992797119, "percentage": 54.55, "elapsed_time": "16:14:18", "remaining_time": "13:31:47", "throughput": 1591.91, "total_tokens": 93061120} -{"current_steps": 11370, "total_steps": 20825, "loss": 0.9262, "learning_rate": 2.3189129995955943e-05, "epoch": 0.5459783913565426, "percentage": 54.6, "elapsed_time": "16:15:12", "remaining_time": "13:30:57", "throughput": 1591.86, "total_tokens": 93143040} -{"current_steps": 11380, "total_steps": 20825, "loss": 0.9588, "learning_rate": 2.314961979992501e-05, "epoch": 0.5464585834333734, "percentage": 54.65, "elapsed_time": "16:16:05", "remaining_time": "13:30:07", "throughput": 1591.8, "total_tokens": 93224960} -{"current_steps": 11390, "total_steps": 20825, "loss": 1.0475, "learning_rate": 2.311011425048281e-05, "epoch": 0.5469387755102041, "percentage": 54.69, "elapsed_time": "16:16:59", "remaining_time": "13:29:18", "throughput": 1591.73, "total_tokens": 93306880} -{"current_steps": 11400, "total_steps": 20825, "loss": 0.9962, "learning_rate": 2.3070613446833842e-05, "epoch": 0.5474189675870348, "percentage": 54.74, "elapsed_time": "16:17:52", "remaining_time": "13:28:27", "throughput": 1591.69, "total_tokens": 93388800} -{"current_steps": 11410, "total_steps": 20825, "loss": 0.9423, "learning_rate": 2.30311174881707e-05, "epoch": 0.5478991596638656, "percentage": 54.79, "elapsed_time": "16:18:46", "remaining_time": "13:27:38", "throughput": 1591.64, "total_tokens": 93470720} -{"current_steps": 11420, "total_steps": 20825, "loss": 0.78, "learning_rate": 2.2991626473673773e-05, "epoch": 0.5483793517406963, "percentage": 54.84, "elapsed_time": "16:19:39", "remaining_time": "13:26:48", "throughput": 1591.58, "total_tokens": 93552640} -{"current_steps": 11430, "total_steps": 20825, "loss": 0.9205, "learning_rate": 2.295214050251108e-05, "epoch": 0.548859543817527, "percentage": 54.89, "elapsed_time": "16:20:32", "remaining_time": "13:25:58", "throughput": 1591.54, "total_tokens": 93634560} -{"current_steps": 11440, "total_steps": 20825, "loss": 0.7834, "learning_rate": 2.2912659673837965e-05, "epoch": 0.5493397358943577, "percentage": 54.93, "elapsed_time": "16:21:26", "remaining_time": "13:25:08", "throughput": 1591.49, "total_tokens": 93716480} -{"current_steps": 11450, "total_steps": 20825, "loss": 0.8649, "learning_rate": 2.2873184086796824e-05, "epoch": 0.5498199279711885, "percentage": 54.98, "elapsed_time": "16:22:19", "remaining_time": "13:24:18", "throughput": 1591.43, "total_tokens": 93798400} -{"current_steps": 11460, "total_steps": 20825, "loss": 1.2097, "learning_rate": 2.283371384051693e-05, "epoch": 0.5503001200480192, "percentage": 55.03, "elapsed_time": "16:23:12", "remaining_time": "13:23:28", "throughput": 1591.38, "total_tokens": 93880320} -{"current_steps": 11470, "total_steps": 20825, "loss": 0.9085, "learning_rate": 2.2794249034114137e-05, "epoch": 0.5507803121248499, "percentage": 55.08, "elapsed_time": "16:24:05", "remaining_time": "13:22:38", "throughput": 1591.34, "total_tokens": 93962240} -{"current_steps": 11480, "total_steps": 20825, "loss": 1.0061, "learning_rate": 2.275478976669062e-05, "epoch": 0.5512605042016807, "percentage": 55.13, "elapsed_time": "16:24:59", "remaining_time": "13:21:48", "throughput": 1591.29, "total_tokens": 94044160} -{"current_steps": 11490, "total_steps": 20825, "loss": 0.9816, "learning_rate": 2.2715336137334657e-05, "epoch": 0.5517406962785114, "percentage": 55.17, "elapsed_time": "16:25:52", "remaining_time": "13:20:58", "throughput": 1591.25, "total_tokens": 94126080} -{"current_steps": 11500, "total_steps": 20825, "loss": 1.0597, "learning_rate": 2.2675888245120382e-05, "epoch": 0.5522208883553421, "percentage": 55.22, "elapsed_time": "16:26:45", "remaining_time": "13:20:07", "throughput": 1591.2, "total_tokens": 94208000} -{"current_steps": 11510, "total_steps": 20825, "loss": 0.9222, "learning_rate": 2.263644618910749e-05, "epoch": 0.5527010804321729, "percentage": 55.27, "elapsed_time": "16:27:38", "remaining_time": "13:19:17", "throughput": 1591.16, "total_tokens": 94289920} -{"current_steps": 11520, "total_steps": 20825, "loss": 0.6929, "learning_rate": 2.2597010068341052e-05, "epoch": 0.5531812725090036, "percentage": 55.32, "elapsed_time": "16:28:32", "remaining_time": "13:18:27", "throughput": 1591.1, "total_tokens": 94371840} -{"current_steps": 11530, "total_steps": 20825, "loss": 0.943, "learning_rate": 2.255757998185122e-05, "epoch": 0.5536614645858343, "percentage": 55.37, "elapsed_time": "16:29:25", "remaining_time": "13:17:38", "throughput": 1591.05, "total_tokens": 94453760} -{"current_steps": 11540, "total_steps": 20825, "loss": 0.9255, "learning_rate": 2.2518156028652977e-05, "epoch": 0.554141656662665, "percentage": 55.41, "elapsed_time": "16:30:19", "remaining_time": "13:16:48", "throughput": 1591.0, "total_tokens": 94535680} -{"current_steps": 11550, "total_steps": 20825, "loss": 0.7929, "learning_rate": 2.2478738307745938e-05, "epoch": 0.5546218487394958, "percentage": 55.46, "elapsed_time": "16:31:12", "remaining_time": "13:15:58", "throughput": 1590.94, "total_tokens": 94617600} -{"current_steps": 11560, "total_steps": 20825, "loss": 0.9169, "learning_rate": 2.243932691811405e-05, "epoch": 0.5551020408163265, "percentage": 55.51, "elapsed_time": "16:32:06", "remaining_time": "13:15:08", "throughput": 1590.88, "total_tokens": 94699520} -{"current_steps": 11570, "total_steps": 20825, "loss": 0.9749, "learning_rate": 2.2399921958725364e-05, "epoch": 0.5555822328931572, "percentage": 55.56, "elapsed_time": "16:33:00", "remaining_time": "13:14:19", "throughput": 1590.82, "total_tokens": 94781440} -{"current_steps": 11580, "total_steps": 20825, "loss": 1.0515, "learning_rate": 2.236052352853177e-05, "epoch": 0.556062424969988, "percentage": 55.61, "elapsed_time": "16:33:54", "remaining_time": "13:13:29", "throughput": 1590.76, "total_tokens": 94863360} -{"current_steps": 11590, "total_steps": 20825, "loss": 0.9887, "learning_rate": 2.232113172646878e-05, "epoch": 0.5565426170468187, "percentage": 55.65, "elapsed_time": "16:34:47", "remaining_time": "13:12:39", "throughput": 1590.71, "total_tokens": 94945280} -{"current_steps": 11600, "total_steps": 20825, "loss": 0.8613, "learning_rate": 2.2281746651455272e-05, "epoch": 0.5570228091236494, "percentage": 55.7, "elapsed_time": "16:35:40", "remaining_time": "13:11:49", "throughput": 1590.66, "total_tokens": 95027200} -{"current_steps": 11610, "total_steps": 20825, "loss": 1.061, "learning_rate": 2.2242368402393198e-05, "epoch": 0.5575030012004802, "percentage": 55.75, "elapsed_time": "16:36:34", "remaining_time": "13:10:59", "throughput": 1590.61, "total_tokens": 95109120} -{"current_steps": 11620, "total_steps": 20825, "loss": 0.8245, "learning_rate": 2.220299707816738e-05, "epoch": 0.5579831932773109, "percentage": 55.8, "elapsed_time": "16:37:27", "remaining_time": "13:10:09", "throughput": 1590.56, "total_tokens": 95191040} -{"current_steps": 11630, "total_steps": 20825, "loss": 0.8227, "learning_rate": 2.2163632777645282e-05, "epoch": 0.5584633853541416, "percentage": 55.85, "elapsed_time": "16:38:20", "remaining_time": "13:09:19", "throughput": 1590.51, "total_tokens": 95272960} -{"current_steps": 11640, "total_steps": 20825, "loss": 0.9013, "learning_rate": 2.2124275599676676e-05, "epoch": 0.5589435774309723, "percentage": 55.89, "elapsed_time": "16:39:14", "remaining_time": "13:08:29", "throughput": 1590.46, "total_tokens": 95354880} -{"current_steps": 11650, "total_steps": 20825, "loss": 0.9034, "learning_rate": 2.20849256430935e-05, "epoch": 0.5594237695078031, "percentage": 55.94, "elapsed_time": "16:40:07", "remaining_time": "13:07:38", "throughput": 1590.42, "total_tokens": 95436800} -{"current_steps": 11660, "total_steps": 20825, "loss": 0.919, "learning_rate": 2.2045583006709536e-05, "epoch": 0.5599039615846338, "percentage": 55.99, "elapsed_time": "16:41:00", "remaining_time": "13:06:48", "throughput": 1590.37, "total_tokens": 95518720} -{"current_steps": 11670, "total_steps": 20825, "loss": 0.868, "learning_rate": 2.2006247789320162e-05, "epoch": 0.5603841536614645, "percentage": 56.04, "elapsed_time": "16:41:54", "remaining_time": "13:05:58", "throughput": 1590.32, "total_tokens": 95600640} -{"current_steps": 11680, "total_steps": 20825, "loss": 0.9287, "learning_rate": 2.1966920089702157e-05, "epoch": 0.5608643457382954, "percentage": 56.09, "elapsed_time": "16:42:47", "remaining_time": "13:05:08", "throughput": 1590.27, "total_tokens": 95682560} -{"current_steps": 11690, "total_steps": 20825, "loss": 0.8022, "learning_rate": 2.192760000661343e-05, "epoch": 0.561344537815126, "percentage": 56.13, "elapsed_time": "16:43:42", "remaining_time": "13:04:20", "throughput": 1590.17, "total_tokens": 95764480} -{"current_steps": 11700, "total_steps": 20825, "loss": 0.8273, "learning_rate": 2.1888287638792722e-05, "epoch": 0.5618247298919568, "percentage": 56.18, "elapsed_time": "16:44:38", "remaining_time": "13:03:32", "throughput": 1590.05, "total_tokens": 95846400} -{"current_steps": 11710, "total_steps": 20825, "loss": 0.8902, "learning_rate": 2.184898308495943e-05, "epoch": 0.5623049219687876, "percentage": 56.23, "elapsed_time": "16:45:34", "remaining_time": "13:02:43", "throughput": 1589.94, "total_tokens": 95928320} -{"current_steps": 11720, "total_steps": 20825, "loss": 0.9926, "learning_rate": 2.180968644381334e-05, "epoch": 0.5627851140456183, "percentage": 56.28, "elapsed_time": "16:46:30", "remaining_time": "13:01:55", "throughput": 1589.82, "total_tokens": 96010240} -{"current_steps": 11730, "total_steps": 20825, "loss": 0.8164, "learning_rate": 2.1770397814034315e-05, "epoch": 0.563265306122449, "percentage": 56.33, "elapsed_time": "16:47:26", "remaining_time": "13:01:07", "throughput": 1589.72, "total_tokens": 96092160} -{"current_steps": 11740, "total_steps": 20825, "loss": 0.9192, "learning_rate": 2.1731117294282166e-05, "epoch": 0.5637454981992797, "percentage": 56.37, "elapsed_time": "16:48:21", "remaining_time": "13:00:19", "throughput": 1589.61, "total_tokens": 96174080} -{"current_steps": 11750, "total_steps": 20825, "loss": 0.841, "learning_rate": 2.16918449831963e-05, "epoch": 0.5642256902761105, "percentage": 56.42, "elapsed_time": "16:49:17", "remaining_time": "12:59:30", "throughput": 1589.5, "total_tokens": 96256000} -{"current_steps": 11760, "total_steps": 20825, "loss": 0.8303, "learning_rate": 2.165258097939551e-05, "epoch": 0.5647058823529412, "percentage": 56.47, "elapsed_time": "16:50:12", "remaining_time": "12:58:42", "throughput": 1589.4, "total_tokens": 96337920} -{"current_steps": 11770, "total_steps": 20825, "loss": 0.6811, "learning_rate": 2.1613325381477744e-05, "epoch": 0.5651860744297719, "percentage": 56.52, "elapsed_time": "16:51:08", "remaining_time": "12:57:54", "throughput": 1589.28, "total_tokens": 96419840} -{"current_steps": 11780, "total_steps": 20825, "loss": 0.9841, "learning_rate": 2.1574078288019846e-05, "epoch": 0.5656662665066027, "percentage": 56.57, "elapsed_time": "16:52:04", "remaining_time": "12:57:06", "throughput": 1589.17, "total_tokens": 96501760} -{"current_steps": 11790, "total_steps": 20825, "loss": 1.0156, "learning_rate": 2.1534839797577268e-05, "epoch": 0.5661464585834334, "percentage": 56.61, "elapsed_time": "16:53:00", "remaining_time": "12:56:17", "throughput": 1589.06, "total_tokens": 96583680} -{"current_steps": 11800, "total_steps": 20825, "loss": 0.813, "learning_rate": 2.14956100086839e-05, "epoch": 0.5666266506602641, "percentage": 56.66, "elapsed_time": "16:53:55", "remaining_time": "12:55:28", "throughput": 1588.97, "total_tokens": 96665600} -{"current_steps": 11810, "total_steps": 20825, "loss": 0.8036, "learning_rate": 2.1456389019851762e-05, "epoch": 0.5671068427370949, "percentage": 56.71, "elapsed_time": "16:54:51", "remaining_time": "12:54:40", "throughput": 1588.85, "total_tokens": 96747520} -{"current_steps": 11820, "total_steps": 20825, "loss": 0.8429, "learning_rate": 2.1417176929570768e-05, "epoch": 0.5675870348139256, "percentage": 56.76, "elapsed_time": "16:55:47", "remaining_time": "12:53:52", "throughput": 1588.74, "total_tokens": 96829440} -{"current_steps": 11830, "total_steps": 20825, "loss": 0.8213, "learning_rate": 2.137797383630851e-05, "epoch": 0.5680672268907563, "percentage": 56.81, "elapsed_time": "16:56:42", "remaining_time": "12:53:03", "throughput": 1588.63, "total_tokens": 96911360} -{"current_steps": 11840, "total_steps": 20825, "loss": 0.8338, "learning_rate": 2.1338779838509965e-05, "epoch": 0.568547418967587, "percentage": 56.85, "elapsed_time": "16:57:38", "remaining_time": "12:52:15", "throughput": 1588.52, "total_tokens": 96993280} -{"current_steps": 11850, "total_steps": 20825, "loss": 1.0187, "learning_rate": 2.129959503459728e-05, "epoch": 0.5690276110444178, "percentage": 56.9, "elapsed_time": "16:58:34", "remaining_time": "12:51:27", "throughput": 1588.42, "total_tokens": 97075200} -{"current_steps": 11860, "total_steps": 20825, "loss": 0.8479, "learning_rate": 2.126041952296951e-05, "epoch": 0.5695078031212485, "percentage": 56.95, "elapsed_time": "16:59:30", "remaining_time": "12:50:39", "throughput": 1588.29, "total_tokens": 97157120} -{"current_steps": 11870, "total_steps": 20825, "loss": 1.0873, "learning_rate": 2.122125340200239e-05, "epoch": 0.5699879951980792, "percentage": 57.0, "elapsed_time": "17:00:26", "remaining_time": "12:49:50", "throughput": 1588.18, "total_tokens": 97239040} -{"current_steps": 11880, "total_steps": 20825, "loss": 1.1087, "learning_rate": 2.1182096770048045e-05, "epoch": 0.57046818727491, "percentage": 57.05, "elapsed_time": "17:01:22", "remaining_time": "12:49:02", "throughput": 1588.06, "total_tokens": 97320960} -{"current_steps": 11890, "total_steps": 20825, "loss": 0.872, "learning_rate": 2.11429497254348e-05, "epoch": 0.5709483793517407, "percentage": 57.09, "elapsed_time": "17:02:18", "remaining_time": "12:48:14", "throughput": 1587.96, "total_tokens": 97402880} -{"current_steps": 11900, "total_steps": 20825, "loss": 0.9375, "learning_rate": 2.1103812366466896e-05, "epoch": 0.5714285714285714, "percentage": 57.14, "elapsed_time": "17:03:14", "remaining_time": "12:47:25", "throughput": 1587.85, "total_tokens": 97484800} -{"current_steps": 11910, "total_steps": 20825, "loss": 0.9402, "learning_rate": 2.1064684791424236e-05, "epoch": 0.5719087635054022, "percentage": 57.19, "elapsed_time": "17:04:10", "remaining_time": "12:46:37", "throughput": 1587.74, "total_tokens": 97566720} -{"current_steps": 11920, "total_steps": 20825, "loss": 0.83, "learning_rate": 2.1025567098562177e-05, "epoch": 0.5723889555822329, "percentage": 57.24, "elapsed_time": "17:05:06", "remaining_time": "12:45:48", "throughput": 1587.62, "total_tokens": 97648640} -{"current_steps": 11930, "total_steps": 20825, "loss": 0.8851, "learning_rate": 2.0986459386111256e-05, "epoch": 0.5728691476590636, "percentage": 57.29, "elapsed_time": "17:06:01", "remaining_time": "12:45:00", "throughput": 1587.52, "total_tokens": 97730560} -{"current_steps": 11940, "total_steps": 20825, "loss": 0.8404, "learning_rate": 2.0947361752276935e-05, "epoch": 0.5733493397358943, "percentage": 57.33, "elapsed_time": "17:06:57", "remaining_time": "12:44:11", "throughput": 1587.41, "total_tokens": 97812480} -{"current_steps": 11950, "total_steps": 20825, "loss": 1.0064, "learning_rate": 2.0908274295239365e-05, "epoch": 0.5738295318127251, "percentage": 57.38, "elapsed_time": "17:07:53", "remaining_time": "12:43:23", "throughput": 1587.3, "total_tokens": 97894400} -{"current_steps": 11960, "total_steps": 20825, "loss": 0.882, "learning_rate": 2.0869197113153175e-05, "epoch": 0.5743097238895558, "percentage": 57.43, "elapsed_time": "17:08:48", "remaining_time": "12:42:34", "throughput": 1587.21, "total_tokens": 97976320} -{"current_steps": 11970, "total_steps": 20825, "loss": 0.7295, "learning_rate": 2.083013030414714e-05, "epoch": 0.5747899159663865, "percentage": 57.48, "elapsed_time": "17:09:45", "remaining_time": "12:41:46", "throughput": 1587.08, "total_tokens": 98058240} -{"current_steps": 11980, "total_steps": 20825, "loss": 0.808, "learning_rate": 2.0791073966324037e-05, "epoch": 0.5752701080432173, "percentage": 57.53, "elapsed_time": "17:10:41", "remaining_time": "12:40:58", "throughput": 1586.97, "total_tokens": 98140160} -{"current_steps": 11990, "total_steps": 20825, "loss": 0.7292, "learning_rate": 2.0752028197760323e-05, "epoch": 0.575750300120048, "percentage": 57.58, "elapsed_time": "17:11:37", "remaining_time": "12:40:09", "throughput": 1586.86, "total_tokens": 98222080} -{"current_steps": 12000, "total_steps": 20825, "loss": 0.9465, "learning_rate": 2.07129930965059e-05, "epoch": 0.5762304921968787, "percentage": 57.62, "elapsed_time": "17:12:32", "remaining_time": "12:39:20", "throughput": 1586.77, "total_tokens": 98304000} -{"current_steps": 12010, "total_steps": 20825, "loss": 0.8273, "learning_rate": 2.0673968760583912e-05, "epoch": 0.5767106842737095, "percentage": 57.67, "elapsed_time": "17:13:31", "remaining_time": "12:38:34", "throughput": 1586.57, "total_tokens": 98385920} -{"current_steps": 12020, "total_steps": 20825, "loss": 1.0037, "learning_rate": 2.0634955287990465e-05, "epoch": 0.5771908763505402, "percentage": 57.72, "elapsed_time": "17:14:27", "remaining_time": "12:37:46", "throughput": 1586.47, "total_tokens": 98467840} -{"current_steps": 12030, "total_steps": 20825, "loss": 0.7684, "learning_rate": 2.059595277669436e-05, "epoch": 0.5776710684273709, "percentage": 57.77, "elapsed_time": "17:15:22", "remaining_time": "12:36:57", "throughput": 1586.37, "total_tokens": 98549760} -{"current_steps": 12040, "total_steps": 20825, "loss": 0.9755, "learning_rate": 2.0556961324636903e-05, "epoch": 0.5781512605042017, "percentage": 57.82, "elapsed_time": "17:16:18", "remaining_time": "12:36:08", "throughput": 1586.26, "total_tokens": 98631680} -{"current_steps": 12050, "total_steps": 20825, "loss": 0.9699, "learning_rate": 2.0517981029731616e-05, "epoch": 0.5786314525810324, "percentage": 57.86, "elapsed_time": "17:17:14", "remaining_time": "12:35:20", "throughput": 1586.16, "total_tokens": 98713600} -{"current_steps": 12060, "total_steps": 20825, "loss": 1.0823, "learning_rate": 2.0479011989863988e-05, "epoch": 0.5791116446578631, "percentage": 57.91, "elapsed_time": "17:18:10", "remaining_time": "12:34:31", "throughput": 1586.05, "total_tokens": 98795520} -{"current_steps": 12070, "total_steps": 20825, "loss": 0.8871, "learning_rate": 2.0440054302891276e-05, "epoch": 0.5795918367346938, "percentage": 57.96, "elapsed_time": "17:19:05", "remaining_time": "12:33:42", "throughput": 1585.95, "total_tokens": 98877440} -{"current_steps": 12080, "total_steps": 20825, "loss": 0.7901, "learning_rate": 2.0401108066642217e-05, "epoch": 0.5800720288115246, "percentage": 58.01, "elapsed_time": "17:20:01", "remaining_time": "12:32:54", "throughput": 1585.84, "total_tokens": 98959360} -{"current_steps": 12090, "total_steps": 20825, "loss": 0.844, "learning_rate": 2.0362173378916763e-05, "epoch": 0.5805522208883553, "percentage": 58.06, "elapsed_time": "17:20:57", "remaining_time": "12:32:05", "throughput": 1585.73, "total_tokens": 99041280} -{"current_steps": 12100, "total_steps": 20825, "loss": 0.8851, "learning_rate": 2.032325033748591e-05, "epoch": 0.581032412965186, "percentage": 58.1, "elapsed_time": "17:21:53", "remaining_time": "12:31:17", "throughput": 1585.62, "total_tokens": 99123200} -{"current_steps": 12110, "total_steps": 20825, "loss": 0.9621, "learning_rate": 2.0284339040091403e-05, "epoch": 0.5815126050420169, "percentage": 58.15, "elapsed_time": "17:22:49", "remaining_time": "12:30:28", "throughput": 1585.51, "total_tokens": 99205120} -{"current_steps": 12120, "total_steps": 20825, "loss": 0.7169, "learning_rate": 2.0245439584445457e-05, "epoch": 0.5819927971188475, "percentage": 58.2, "elapsed_time": "17:23:45", "remaining_time": "12:29:39", "throughput": 1585.4, "total_tokens": 99287040} -{"current_steps": 12130, "total_steps": 20825, "loss": 0.9376, "learning_rate": 2.0206552068230587e-05, "epoch": 0.5824729891956782, "percentage": 58.25, "elapsed_time": "17:24:41", "remaining_time": "12:28:51", "throughput": 1585.3, "total_tokens": 99368960} -{"current_steps": 12140, "total_steps": 20825, "loss": 0.9773, "learning_rate": 2.0167676589099324e-05, "epoch": 0.5829531812725091, "percentage": 58.3, "elapsed_time": "17:25:37", "remaining_time": "12:28:02", "throughput": 1585.2, "total_tokens": 99450880} -{"current_steps": 12150, "total_steps": 20825, "loss": 0.8787, "learning_rate": 2.0128813244673946e-05, "epoch": 0.5834333733493398, "percentage": 58.34, "elapsed_time": "17:26:33", "remaining_time": "12:27:13", "throughput": 1585.09, "total_tokens": 99532800} -{"current_steps": 12160, "total_steps": 20825, "loss": 0.9362, "learning_rate": 2.0089962132546296e-05, "epoch": 0.5839135654261705, "percentage": 58.39, "elapsed_time": "17:27:29", "remaining_time": "12:26:25", "throughput": 1584.97, "total_tokens": 99614720} -{"current_steps": 12170, "total_steps": 20825, "loss": 0.8472, "learning_rate": 2.0051123350277477e-05, "epoch": 0.5843937575030012, "percentage": 58.44, "elapsed_time": "17:28:25", "remaining_time": "12:25:36", "throughput": 1584.88, "total_tokens": 99696640} -{"current_steps": 12180, "total_steps": 20825, "loss": 0.6606, "learning_rate": 2.0012296995397613e-05, "epoch": 0.584873949579832, "percentage": 58.49, "elapsed_time": "17:29:20", "remaining_time": "12:24:47", "throughput": 1584.77, "total_tokens": 99778560} -{"current_steps": 12190, "total_steps": 20825, "loss": 0.7587, "learning_rate": 1.997348316540566e-05, "epoch": 0.5853541416566627, "percentage": 58.54, "elapsed_time": "17:30:16", "remaining_time": "12:23:58", "throughput": 1584.67, "total_tokens": 99860480} -{"current_steps": 12200, "total_steps": 20825, "loss": 0.7988, "learning_rate": 1.9934681957769107e-05, "epoch": 0.5858343337334934, "percentage": 58.58, "elapsed_time": "17:31:12", "remaining_time": "12:23:10", "throughput": 1584.56, "total_tokens": 99942400} -{"current_steps": 12210, "total_steps": 20825, "loss": 0.9584, "learning_rate": 1.9895893469923736e-05, "epoch": 0.5863145258103242, "percentage": 58.63, "elapsed_time": "17:32:08", "remaining_time": "12:22:21", "throughput": 1584.46, "total_tokens": 100024320} -{"current_steps": 12220, "total_steps": 20825, "loss": 1.1023, "learning_rate": 1.985711779927339e-05, "epoch": 0.5867947178871549, "percentage": 58.68, "elapsed_time": "17:33:04", "remaining_time": "12:21:32", "throughput": 1584.35, "total_tokens": 100106240} -{"current_steps": 12230, "total_steps": 20825, "loss": 0.8485, "learning_rate": 1.9818355043189732e-05, "epoch": 0.5872749099639856, "percentage": 58.73, "elapsed_time": "17:34:00", "remaining_time": "12:20:44", "throughput": 1584.23, "total_tokens": 100188160} -{"current_steps": 12240, "total_steps": 20825, "loss": 0.9277, "learning_rate": 1.9779605299012005e-05, "epoch": 0.5877551020408164, "percentage": 58.78, "elapsed_time": "17:34:56", "remaining_time": "12:19:55", "throughput": 1584.12, "total_tokens": 100270080} -{"current_steps": 12250, "total_steps": 20825, "loss": 0.9011, "learning_rate": 1.974086866404675e-05, "epoch": 0.5882352941176471, "percentage": 58.82, "elapsed_time": "17:35:52", "remaining_time": "12:19:07", "throughput": 1584.01, "total_tokens": 100352000} -{"current_steps": 12260, "total_steps": 20825, "loss": 1.0077, "learning_rate": 1.970214523556761e-05, "epoch": 0.5887154861944778, "percentage": 58.87, "elapsed_time": "17:36:48", "remaining_time": "12:18:18", "throughput": 1583.91, "total_tokens": 100433920} -{"current_steps": 12270, "total_steps": 20825, "loss": 0.9088, "learning_rate": 1.9663435110815065e-05, "epoch": 0.5891956782713085, "percentage": 58.92, "elapsed_time": "17:37:44", "remaining_time": "12:17:29", "throughput": 1583.82, "total_tokens": 100515840} -{"current_steps": 12280, "total_steps": 20825, "loss": 0.8294, "learning_rate": 1.9624738386996163e-05, "epoch": 0.5896758703481393, "percentage": 58.97, "elapsed_time": "17:38:39", "remaining_time": "12:16:40", "throughput": 1583.72, "total_tokens": 100597760} -{"current_steps": 12290, "total_steps": 20825, "loss": 0.914, "learning_rate": 1.9586055161284332e-05, "epoch": 0.59015606242497, "percentage": 59.02, "elapsed_time": "17:39:35", "remaining_time": "12:15:51", "throughput": 1583.62, "total_tokens": 100679680} -{"current_steps": 12300, "total_steps": 20825, "loss": 1.1152, "learning_rate": 1.954738553081909e-05, "epoch": 0.5906362545018007, "percentage": 59.06, "elapsed_time": "17:40:31", "remaining_time": "12:15:02", "throughput": 1583.51, "total_tokens": 100761600} -{"current_steps": 12310, "total_steps": 20825, "loss": 0.8391, "learning_rate": 1.950872959270581e-05, "epoch": 0.5911164465786315, "percentage": 59.11, "elapsed_time": "17:41:27", "remaining_time": "12:14:13", "throughput": 1583.42, "total_tokens": 100843520} -{"current_steps": 12320, "total_steps": 20825, "loss": 0.8974, "learning_rate": 1.9470087444015484e-05, "epoch": 0.5915966386554622, "percentage": 59.16, "elapsed_time": "17:42:23", "remaining_time": "12:13:24", "throughput": 1583.31, "total_tokens": 100925440} -{"current_steps": 12330, "total_steps": 20825, "loss": 1.1511, "learning_rate": 1.9431459181784495e-05, "epoch": 0.5920768307322929, "percentage": 59.21, "elapsed_time": "17:43:19", "remaining_time": "12:12:35", "throughput": 1583.21, "total_tokens": 101007360} -{"current_steps": 12340, "total_steps": 20825, "loss": 0.8286, "learning_rate": 1.939284490301432e-05, "epoch": 0.5925570228091237, "percentage": 59.26, "elapsed_time": "17:44:15", "remaining_time": "12:11:46", "throughput": 1583.1, "total_tokens": 101089280} -{"current_steps": 12350, "total_steps": 20825, "loss": 0.7323, "learning_rate": 1.935424470467135e-05, "epoch": 0.5930372148859544, "percentage": 59.3, "elapsed_time": "17:45:11", "remaining_time": "12:10:58", "throughput": 1582.99, "total_tokens": 101171200} -{"current_steps": 12360, "total_steps": 20825, "loss": 0.9878, "learning_rate": 1.9315658683686615e-05, "epoch": 0.5935174069627851, "percentage": 59.35, "elapsed_time": "17:46:07", "remaining_time": "12:10:09", "throughput": 1582.88, "total_tokens": 101253120} -{"current_steps": 12370, "total_steps": 20825, "loss": 0.8682, "learning_rate": 1.9277086936955517e-05, "epoch": 0.5939975990396158, "percentage": 59.4, "elapsed_time": "17:47:03", "remaining_time": "12:09:20", "throughput": 1582.79, "total_tokens": 101335040} -{"current_steps": 12380, "total_steps": 20825, "loss": 0.8724, "learning_rate": 1.9238529561337646e-05, "epoch": 0.5944777911164466, "percentage": 59.45, "elapsed_time": "17:47:59", "remaining_time": "12:08:31", "throughput": 1582.68, "total_tokens": 101416960} -{"current_steps": 12390, "total_steps": 20825, "loss": 0.9832, "learning_rate": 1.9199986653656502e-05, "epoch": 0.5949579831932773, "percentage": 59.5, "elapsed_time": "17:48:55", "remaining_time": "12:07:42", "throughput": 1582.58, "total_tokens": 101498880} -{"current_steps": 12400, "total_steps": 20825, "loss": 0.8047, "learning_rate": 1.9161458310699225e-05, "epoch": 0.595438175270108, "percentage": 59.54, "elapsed_time": "17:49:51", "remaining_time": "12:06:53", "throughput": 1582.47, "total_tokens": 101580800} -{"current_steps": 12410, "total_steps": 20825, "loss": 0.9766, "learning_rate": 1.9122944629216402e-05, "epoch": 0.5959183673469388, "percentage": 59.59, "elapsed_time": "17:50:47", "remaining_time": "12:06:04", "throughput": 1582.36, "total_tokens": 101662720} -{"current_steps": 12420, "total_steps": 20825, "loss": 0.8339, "learning_rate": 1.9084445705921815e-05, "epoch": 0.5963985594237695, "percentage": 59.64, "elapsed_time": "17:51:43", "remaining_time": "12:05:15", "throughput": 1582.27, "total_tokens": 101744640} -{"current_steps": 12430, "total_steps": 20825, "loss": 1.0445, "learning_rate": 1.9045961637492145e-05, "epoch": 0.5968787515006002, "percentage": 59.69, "elapsed_time": "17:52:38", "remaining_time": "12:04:26", "throughput": 1582.17, "total_tokens": 101826560} -{"current_steps": 12440, "total_steps": 20825, "loss": 0.9611, "learning_rate": 1.9007492520566814e-05, "epoch": 0.597358943577431, "percentage": 59.74, "elapsed_time": "17:53:34", "remaining_time": "12:03:37", "throughput": 1582.08, "total_tokens": 101908480} -{"current_steps": 12450, "total_steps": 20825, "loss": 0.9063, "learning_rate": 1.896903845174768e-05, "epoch": 0.5978391356542617, "percentage": 59.78, "elapsed_time": "17:54:30", "remaining_time": "12:02:48", "throughput": 1581.98, "total_tokens": 101990400} -{"current_steps": 12460, "total_steps": 20825, "loss": 0.8149, "learning_rate": 1.8930599527598797e-05, "epoch": 0.5983193277310924, "percentage": 59.83, "elapsed_time": "17:55:26", "remaining_time": "12:01:59", "throughput": 1581.88, "total_tokens": 102072320} -{"current_steps": 12470, "total_steps": 20825, "loss": 1.05, "learning_rate": 1.8892175844646215e-05, "epoch": 0.5987995198079231, "percentage": 59.88, "elapsed_time": "17:56:22", "remaining_time": "12:01:10", "throughput": 1581.77, "total_tokens": 102154240} -{"current_steps": 12480, "total_steps": 20825, "loss": 0.7995, "learning_rate": 1.8853767499377712e-05, "epoch": 0.5992797118847539, "percentage": 59.93, "elapsed_time": "17:57:19", "remaining_time": "12:00:22", "throughput": 1581.65, "total_tokens": 102236160} -{"current_steps": 12490, "total_steps": 20825, "loss": 0.7582, "learning_rate": 1.8815374588242523e-05, "epoch": 0.5997599039615846, "percentage": 59.98, "elapsed_time": "17:58:15", "remaining_time": "11:59:33", "throughput": 1581.54, "total_tokens": 102318080} -{"current_steps": 12500, "total_steps": 20825, "loss": 0.8494, "learning_rate": 1.877699720765114e-05, "epoch": 0.6002400960384153, "percentage": 60.02, "elapsed_time": "17:59:10", "remaining_time": "11:58:44", "throughput": 1581.45, "total_tokens": 102400000} -{"current_steps": 12510, "total_steps": 20825, "loss": 0.7685, "learning_rate": 1.873863545397507e-05, "epoch": 0.6007202881152461, "percentage": 60.07, "elapsed_time": "18:00:07", "remaining_time": "11:57:55", "throughput": 1581.33, "total_tokens": 102481920} -{"current_steps": 12520, "total_steps": 20825, "loss": 0.9137, "learning_rate": 1.870028942354655e-05, "epoch": 0.6012004801920768, "percentage": 60.12, "elapsed_time": "18:01:03", "remaining_time": "11:57:06", "throughput": 1581.22, "total_tokens": 102563840} -{"current_steps": 12530, "total_steps": 20825, "loss": 0.8186, "learning_rate": 1.8661959212658365e-05, "epoch": 0.6016806722689075, "percentage": 60.17, "elapsed_time": "18:01:59", "remaining_time": "11:56:17", "throughput": 1581.12, "total_tokens": 102645760} -{"current_steps": 12540, "total_steps": 20825, "loss": 0.8923, "learning_rate": 1.862364491756355e-05, "epoch": 0.6021608643457383, "percentage": 60.22, "elapsed_time": "18:02:55", "remaining_time": "11:55:28", "throughput": 1581.02, "total_tokens": 102727680} -{"current_steps": 12550, "total_steps": 20825, "loss": 0.9799, "learning_rate": 1.8585346634475175e-05, "epoch": 0.602641056422569, "percentage": 60.26, "elapsed_time": "18:03:51", "remaining_time": "11:54:39", "throughput": 1580.92, "total_tokens": 102809600} -{"current_steps": 12560, "total_steps": 20825, "loss": 0.9472, "learning_rate": 1.8547064459566117e-05, "epoch": 0.6031212484993997, "percentage": 60.31, "elapsed_time": "18:04:47", "remaining_time": "11:53:50", "throughput": 1580.83, "total_tokens": 102891520} -{"current_steps": 12570, "total_steps": 20825, "loss": 0.7548, "learning_rate": 1.8508798488968803e-05, "epoch": 0.6036014405762304, "percentage": 60.36, "elapsed_time": "18:05:42", "remaining_time": "11:53:00", "throughput": 1580.73, "total_tokens": 102973440} -{"current_steps": 12580, "total_steps": 20825, "loss": 0.9321, "learning_rate": 1.8470548818774942e-05, "epoch": 0.6040816326530613, "percentage": 60.41, "elapsed_time": "18:06:38", "remaining_time": "11:52:11", "throughput": 1580.64, "total_tokens": 103055360} -{"current_steps": 12590, "total_steps": 20825, "loss": 0.8554, "learning_rate": 1.8432315545035328e-05, "epoch": 0.604561824729892, "percentage": 60.46, "elapsed_time": "18:07:34", "remaining_time": "11:51:22", "throughput": 1580.54, "total_tokens": 103137280} -{"current_steps": 12600, "total_steps": 20825, "loss": 0.9034, "learning_rate": 1.83940987637596e-05, "epoch": 0.6050420168067226, "percentage": 60.5, "elapsed_time": "18:08:29", "remaining_time": "11:50:32", "throughput": 1580.45, "total_tokens": 103219200} -{"current_steps": 12610, "total_steps": 20825, "loss": 1.0032, "learning_rate": 1.8355898570915937e-05, "epoch": 0.6055222088835535, "percentage": 60.55, "elapsed_time": "18:09:25", "remaining_time": "11:49:43", "throughput": 1580.36, "total_tokens": 103301120} -{"current_steps": 12620, "total_steps": 20825, "loss": 0.9037, "learning_rate": 1.8317715062430902e-05, "epoch": 0.6060024009603842, "percentage": 60.6, "elapsed_time": "18:10:21", "remaining_time": "11:48:54", "throughput": 1580.26, "total_tokens": 103383040} -{"current_steps": 12630, "total_steps": 20825, "loss": 0.9669, "learning_rate": 1.8279548334189146e-05, "epoch": 0.6064825930372149, "percentage": 60.65, "elapsed_time": "18:11:17", "remaining_time": "11:48:05", "throughput": 1580.16, "total_tokens": 103464960} -{"current_steps": 12640, "total_steps": 20825, "loss": 0.9426, "learning_rate": 1.8241398482033185e-05, "epoch": 0.6069627851140457, "percentage": 60.7, "elapsed_time": "18:12:13", "remaining_time": "11:47:15", "throughput": 1580.07, "total_tokens": 103546880} -{"current_steps": 12650, "total_steps": 20825, "loss": 0.9299, "learning_rate": 1.8203265601763136e-05, "epoch": 0.6074429771908764, "percentage": 60.74, "elapsed_time": "18:13:09", "remaining_time": "11:46:26", "throughput": 1579.97, "total_tokens": 103628800} -{"current_steps": 12660, "total_steps": 20825, "loss": 0.8059, "learning_rate": 1.816514978913655e-05, "epoch": 0.6079231692677071, "percentage": 60.79, "elapsed_time": "18:14:04", "remaining_time": "11:45:37", "throughput": 1579.87, "total_tokens": 103710720} -{"current_steps": 12670, "total_steps": 20825, "loss": 0.963, "learning_rate": 1.8127051139868044e-05, "epoch": 0.6084033613445378, "percentage": 60.84, "elapsed_time": "18:15:01", "remaining_time": "11:44:48", "throughput": 1579.77, "total_tokens": 103792640} -{"current_steps": 12680, "total_steps": 20825, "loss": 0.9894, "learning_rate": 1.8088969749629197e-05, "epoch": 0.6088835534213686, "percentage": 60.89, "elapsed_time": "18:15:57", "remaining_time": "11:43:59", "throughput": 1579.67, "total_tokens": 103874560} -{"current_steps": 12690, "total_steps": 20825, "loss": 1.0683, "learning_rate": 1.8050905714048233e-05, "epoch": 0.6093637454981993, "percentage": 60.94, "elapsed_time": "18:16:52", "remaining_time": "11:43:09", "throughput": 1579.58, "total_tokens": 103956480} -{"current_steps": 12700, "total_steps": 20825, "loss": 0.7611, "learning_rate": 1.8012859128709766e-05, "epoch": 0.60984393757503, "percentage": 60.98, "elapsed_time": "18:17:48", "remaining_time": "11:42:20", "throughput": 1579.48, "total_tokens": 104038400} -{"current_steps": 12710, "total_steps": 20825, "loss": 0.9293, "learning_rate": 1.7974830089154624e-05, "epoch": 0.6103241296518608, "percentage": 61.03, "elapsed_time": "18:18:44", "remaining_time": "11:41:30", "throughput": 1579.39, "total_tokens": 104120320} -{"current_steps": 12720, "total_steps": 20825, "loss": 0.9849, "learning_rate": 1.7936818690879574e-05, "epoch": 0.6108043217286915, "percentage": 61.08, "elapsed_time": "18:19:40", "remaining_time": "11:40:41", "throughput": 1579.3, "total_tokens": 104202240} -{"current_steps": 12730, "total_steps": 20825, "loss": 0.9917, "learning_rate": 1.7898825029337054e-05, "epoch": 0.6112845138055222, "percentage": 61.13, "elapsed_time": "18:20:36", "remaining_time": "11:39:52", "throughput": 1579.19, "total_tokens": 104284160} -{"current_steps": 12740, "total_steps": 20825, "loss": 0.8664, "learning_rate": 1.7860849199934983e-05, "epoch": 0.611764705882353, "percentage": 61.18, "elapsed_time": "18:21:32", "remaining_time": "11:39:03", "throughput": 1579.1, "total_tokens": 104366080} -{"current_steps": 12750, "total_steps": 20825, "loss": 0.9739, "learning_rate": 1.7822891298036515e-05, "epoch": 0.6122448979591837, "percentage": 61.22, "elapsed_time": "18:22:27", "remaining_time": "11:38:13", "throughput": 1579.02, "total_tokens": 104448000} -{"current_steps": 12760, "total_steps": 20825, "loss": 0.9441, "learning_rate": 1.7784951418959747e-05, "epoch": 0.6127250900360144, "percentage": 61.27, "elapsed_time": "18:23:23", "remaining_time": "11:37:24", "throughput": 1578.92, "total_tokens": 104529920} -{"current_steps": 12770, "total_steps": 20825, "loss": 0.9443, "learning_rate": 1.7747029657977556e-05, "epoch": 0.6132052821128451, "percentage": 61.32, "elapsed_time": "18:24:19", "remaining_time": "11:36:34", "throughput": 1578.83, "total_tokens": 104611840} -{"current_steps": 12780, "total_steps": 20825, "loss": 1.0327, "learning_rate": 1.7709126110317297e-05, "epoch": 0.6136854741896759, "percentage": 61.37, "elapsed_time": "18:25:14", "remaining_time": "11:35:45", "throughput": 1578.74, "total_tokens": 104693760} -{"current_steps": 12790, "total_steps": 20825, "loss": 0.9103, "learning_rate": 1.7671240871160593e-05, "epoch": 0.6141656662665066, "percentage": 61.42, "elapsed_time": "18:26:10", "remaining_time": "11:34:55", "throughput": 1578.64, "total_tokens": 104775680} -{"current_steps": 12800, "total_steps": 20825, "loss": 0.8165, "learning_rate": 1.76333740356431e-05, "epoch": 0.6146458583433373, "percentage": 61.46, "elapsed_time": "18:27:06", "remaining_time": "11:34:06", "throughput": 1578.54, "total_tokens": 104857600} -{"current_steps": 12810, "total_steps": 20825, "loss": 0.8398, "learning_rate": 1.7595525698854263e-05, "epoch": 0.6151260504201681, "percentage": 61.51, "elapsed_time": "18:28:02", "remaining_time": "11:33:17", "throughput": 1578.45, "total_tokens": 104939520} -{"current_steps": 12820, "total_steps": 20825, "loss": 0.8922, "learning_rate": 1.7557695955837063e-05, "epoch": 0.6156062424969988, "percentage": 61.56, "elapsed_time": "18:28:58", "remaining_time": "11:32:27", "throughput": 1578.35, "total_tokens": 105021440} -{"current_steps": 12830, "total_steps": 20825, "loss": 0.8345, "learning_rate": 1.7519884901587772e-05, "epoch": 0.6160864345738295, "percentage": 61.61, "elapsed_time": "18:29:59", "remaining_time": "11:31:41", "throughput": 1578.14, "total_tokens": 105103360} -{"current_steps": 12840, "total_steps": 20825, "loss": 1.0156, "learning_rate": 1.748209263105577e-05, "epoch": 0.6165666266506603, "percentage": 61.66, "elapsed_time": "18:31:00", "remaining_time": "11:30:55", "throughput": 1577.92, "total_tokens": 105185280} -{"current_steps": 12850, "total_steps": 20825, "loss": 0.9688, "learning_rate": 1.744431923914326e-05, "epoch": 0.617046818727491, "percentage": 61.7, "elapsed_time": "18:32:03", "remaining_time": "11:30:09", "throughput": 1577.67, "total_tokens": 105267200} -{"current_steps": 12860, "total_steps": 20825, "loss": 0.9532, "learning_rate": 1.7406564820705e-05, "epoch": 0.6175270108043217, "percentage": 61.75, "elapsed_time": "18:32:58", "remaining_time": "11:29:19", "throughput": 1577.6, "total_tokens": 105349120} -{"current_steps": 12870, "total_steps": 20825, "loss": 0.818, "learning_rate": 1.736882947054815e-05, "epoch": 0.6180072028811524, "percentage": 61.8, "elapsed_time": "18:33:44", "remaining_time": "11:28:24", "throughput": 1577.74, "total_tokens": 105431040} -{"current_steps": 12880, "total_steps": 20825, "loss": 0.994, "learning_rate": 1.7331113283431966e-05, "epoch": 0.6184873949579832, "percentage": 61.85, "elapsed_time": "18:34:30", "remaining_time": "11:27:28", "throughput": 1577.88, "total_tokens": 105512960} -{"current_steps": 12890, "total_steps": 20825, "loss": 0.7879, "learning_rate": 1.729341635406757e-05, "epoch": 0.6189675870348139, "percentage": 61.9, "elapsed_time": "18:35:15", "remaining_time": "11:26:32", "throughput": 1578.03, "total_tokens": 105594880} -{"current_steps": 12900, "total_steps": 20825, "loss": 0.9374, "learning_rate": 1.725573877711776e-05, "epoch": 0.6194477791116446, "percentage": 61.94, "elapsed_time": "18:36:01", "remaining_time": "11:25:36", "throughput": 1578.18, "total_tokens": 105676800} -{"current_steps": 12910, "total_steps": 20825, "loss": 0.9342, "learning_rate": 1.7218080647196698e-05, "epoch": 0.6199279711884754, "percentage": 61.99, "elapsed_time": "18:36:46", "remaining_time": "11:24:41", "throughput": 1578.33, "total_tokens": 105758720} -{"current_steps": 12920, "total_steps": 20825, "loss": 0.8143, "learning_rate": 1.7180442058869732e-05, "epoch": 0.6204081632653061, "percentage": 62.04, "elapsed_time": "18:37:32", "remaining_time": "11:23:45", "throughput": 1578.47, "total_tokens": 105840640} -{"current_steps": 12930, "total_steps": 20825, "loss": 0.8115, "learning_rate": 1.7142823106653135e-05, "epoch": 0.6208883553421368, "percentage": 62.09, "elapsed_time": "18:38:18", "remaining_time": "11:22:49", "throughput": 1578.62, "total_tokens": 105922560} -{"current_steps": 12940, "total_steps": 20825, "loss": 0.8874, "learning_rate": 1.7105223885013884e-05, "epoch": 0.6213685474189676, "percentage": 62.14, "elapsed_time": "18:39:03", "remaining_time": "11:21:54", "throughput": 1578.77, "total_tokens": 106004480} -{"current_steps": 12950, "total_steps": 20825, "loss": 0.9164, "learning_rate": 1.706764448836938e-05, "epoch": 0.6218487394957983, "percentage": 62.18, "elapsed_time": "18:39:49", "remaining_time": "11:20:58", "throughput": 1578.92, "total_tokens": 106086400} -{"current_steps": 12960, "total_steps": 20825, "loss": 0.9694, "learning_rate": 1.703008501108726e-05, "epoch": 0.622328931572629, "percentage": 62.23, "elapsed_time": "18:40:35", "remaining_time": "11:20:02", "throughput": 1579.06, "total_tokens": 106168320} -{"current_steps": 12970, "total_steps": 20825, "loss": 0.9424, "learning_rate": 1.699254554748515e-05, "epoch": 0.6228091236494598, "percentage": 62.28, "elapsed_time": "18:41:20", "remaining_time": "11:19:07", "throughput": 1579.21, "total_tokens": 106250240} -{"current_steps": 12980, "total_steps": 20825, "loss": 0.8038, "learning_rate": 1.6955026191830385e-05, "epoch": 0.6232893157262905, "percentage": 62.33, "elapsed_time": "18:42:06", "remaining_time": "11:18:11", "throughput": 1579.36, "total_tokens": 106332160} -{"current_steps": 12990, "total_steps": 20825, "loss": 0.9074, "learning_rate": 1.691752703833984e-05, "epoch": 0.6237695078031212, "percentage": 62.38, "elapsed_time": "18:42:51", "remaining_time": "11:17:15", "throughput": 1579.51, "total_tokens": 106414080} -{"current_steps": 13000, "total_steps": 20825, "loss": 0.8315, "learning_rate": 1.6880048181179652e-05, "epoch": 0.6242496998799519, "percentage": 62.42, "elapsed_time": "18:43:37", "remaining_time": "11:16:20", "throughput": 1579.65, "total_tokens": 106496000} -{"current_steps": 13010, "total_steps": 20825, "loss": 0.9378, "learning_rate": 1.684258971446497e-05, "epoch": 0.6247298919567827, "percentage": 62.47, "elapsed_time": "18:44:27", "remaining_time": "11:15:27", "throughput": 1579.7, "total_tokens": 106577920} -{"current_steps": 13020, "total_steps": 20825, "loss": 0.8081, "learning_rate": 1.6805151732259755e-05, "epoch": 0.6252100840336134, "percentage": 62.52, "elapsed_time": "18:45:12", "remaining_time": "11:14:31", "throughput": 1579.85, "total_tokens": 106659840} -{"current_steps": 13030, "total_steps": 20825, "loss": 0.8395, "learning_rate": 1.6767734328576544e-05, "epoch": 0.6256902761104441, "percentage": 62.57, "elapsed_time": "18:45:58", "remaining_time": "11:13:35", "throughput": 1579.99, "total_tokens": 106741760} -{"current_steps": 13040, "total_steps": 20825, "loss": 0.8904, "learning_rate": 1.6730337597376165e-05, "epoch": 0.626170468187275, "percentage": 62.62, "elapsed_time": "18:46:44", "remaining_time": "11:12:40", "throughput": 1580.13, "total_tokens": 106823680} -{"current_steps": 13050, "total_steps": 20825, "loss": 0.7173, "learning_rate": 1.669296163256755e-05, "epoch": 0.6266506602641057, "percentage": 62.67, "elapsed_time": "18:47:30", "remaining_time": "11:11:45", "throughput": 1580.27, "total_tokens": 106905600} -{"current_steps": 13060, "total_steps": 20825, "loss": 1.0009, "learning_rate": 1.6655606528007505e-05, "epoch": 0.6271308523409364, "percentage": 62.71, "elapsed_time": "18:48:16", "remaining_time": "11:10:49", "throughput": 1580.41, "total_tokens": 106987520} -{"current_steps": 13070, "total_steps": 20825, "loss": 0.9796, "learning_rate": 1.6618272377500406e-05, "epoch": 0.6276110444177672, "percentage": 62.76, "elapsed_time": "18:49:01", "remaining_time": "11:09:54", "throughput": 1580.55, "total_tokens": 107069440} -{"current_steps": 13080, "total_steps": 20825, "loss": 0.7448, "learning_rate": 1.658095927479805e-05, "epoch": 0.6280912364945979, "percentage": 62.81, "elapsed_time": "18:49:47", "remaining_time": "11:08:58", "throughput": 1580.7, "total_tokens": 107151360} -{"current_steps": 13090, "total_steps": 20825, "loss": 1.1406, "learning_rate": 1.6543667313599365e-05, "epoch": 0.6285714285714286, "percentage": 62.86, "elapsed_time": "18:50:33", "remaining_time": "11:08:03", "throughput": 1580.83, "total_tokens": 107233280} -{"current_steps": 13100, "total_steps": 20825, "loss": 0.8865, "learning_rate": 1.6506396587550188e-05, "epoch": 0.6290516206482593, "percentage": 62.91, "elapsed_time": "18:51:18", "remaining_time": "11:07:07", "throughput": 1580.98, "total_tokens": 107315200} -{"current_steps": 13110, "total_steps": 20825, "loss": 0.8561, "learning_rate": 1.6469147190243027e-05, "epoch": 0.6295318127250901, "percentage": 62.95, "elapsed_time": "18:52:04", "remaining_time": "11:06:12", "throughput": 1581.11, "total_tokens": 107397120} -{"current_steps": 13120, "total_steps": 20825, "loss": 0.8364, "learning_rate": 1.6431919215216862e-05, "epoch": 0.6300120048019208, "percentage": 63.0, "elapsed_time": "18:52:50", "remaining_time": "11:05:17", "throughput": 1581.26, "total_tokens": 107479040} -{"current_steps": 13130, "total_steps": 20825, "loss": 0.996, "learning_rate": 1.6394712755956817e-05, "epoch": 0.6304921968787515, "percentage": 63.05, "elapsed_time": "18:53:36", "remaining_time": "11:04:21", "throughput": 1581.4, "total_tokens": 107560960} -{"current_steps": 13140, "total_steps": 20825, "loss": 0.8958, "learning_rate": 1.635752790589405e-05, "epoch": 0.6309723889555823, "percentage": 63.1, "elapsed_time": "18:54:22", "remaining_time": "11:03:26", "throughput": 1581.54, "total_tokens": 107642880} -{"current_steps": 13150, "total_steps": 20825, "loss": 0.9864, "learning_rate": 1.6320364758405422e-05, "epoch": 0.631452581032413, "percentage": 63.15, "elapsed_time": "18:55:07", "remaining_time": "11:02:31", "throughput": 1581.68, "total_tokens": 107724800} -{"current_steps": 13160, "total_steps": 20825, "loss": 0.9916, "learning_rate": 1.628322340681329e-05, "epoch": 0.6319327731092437, "percentage": 63.19, "elapsed_time": "18:55:53", "remaining_time": "11:01:35", "throughput": 1581.82, "total_tokens": 107806720} -{"current_steps": 13170, "total_steps": 20825, "loss": 1.0281, "learning_rate": 1.6246103944385295e-05, "epoch": 0.6324129651860745, "percentage": 63.24, "elapsed_time": "18:56:39", "remaining_time": "11:00:40", "throughput": 1581.95, "total_tokens": 107888640} -{"current_steps": 13180, "total_steps": 20825, "loss": 0.8902, "learning_rate": 1.620900646433412e-05, "epoch": 0.6328931572629052, "percentage": 63.29, "elapsed_time": "18:57:25", "remaining_time": "10:59:45", "throughput": 1582.09, "total_tokens": 107970560} -{"current_steps": 13190, "total_steps": 20825, "loss": 0.9968, "learning_rate": 1.6171931059817214e-05, "epoch": 0.6333733493397359, "percentage": 63.34, "elapsed_time": "18:58:11", "remaining_time": "10:58:50", "throughput": 1582.22, "total_tokens": 108052480} -{"current_steps": 13200, "total_steps": 20825, "loss": 0.6298, "learning_rate": 1.613487782393661e-05, "epoch": 0.6338535414165666, "percentage": 63.39, "elapsed_time": "18:58:57", "remaining_time": "10:57:55", "throughput": 1582.35, "total_tokens": 108134400} -{"current_steps": 13210, "total_steps": 20825, "loss": 0.7394, "learning_rate": 1.6097846849738685e-05, "epoch": 0.6343337334933974, "percentage": 63.43, "elapsed_time": "18:59:43", "remaining_time": "10:57:00", "throughput": 1582.49, "total_tokens": 108216320} -{"current_steps": 13220, "total_steps": 20825, "loss": 0.9741, "learning_rate": 1.6060838230213883e-05, "epoch": 0.6348139255702281, "percentage": 63.48, "elapsed_time": "19:00:29", "remaining_time": "10:56:04", "throughput": 1582.63, "total_tokens": 108298240} -{"current_steps": 13230, "total_steps": 20825, "loss": 1.0429, "learning_rate": 1.6023852058296544e-05, "epoch": 0.6352941176470588, "percentage": 63.53, "elapsed_time": "19:01:15", "remaining_time": "10:55:09", "throughput": 1582.77, "total_tokens": 108380160} -{"current_steps": 13240, "total_steps": 20825, "loss": 0.8975, "learning_rate": 1.5986888426864617e-05, "epoch": 0.6357743097238896, "percentage": 63.58, "elapsed_time": "19:02:00", "remaining_time": "10:54:14", "throughput": 1582.91, "total_tokens": 108462080} -{"current_steps": 13250, "total_steps": 20825, "loss": 0.8076, "learning_rate": 1.5949947428739448e-05, "epoch": 0.6362545018007203, "percentage": 63.63, "elapsed_time": "19:02:46", "remaining_time": "10:53:19", "throughput": 1583.05, "total_tokens": 108544000} -{"current_steps": 13260, "total_steps": 20825, "loss": 0.747, "learning_rate": 1.591302915668556e-05, "epoch": 0.636734693877551, "percentage": 63.67, "elapsed_time": "19:03:33", "remaining_time": "10:52:24", "throughput": 1583.17, "total_tokens": 108625920} -{"current_steps": 13270, "total_steps": 20825, "loss": 0.9432, "learning_rate": 1.5876133703410412e-05, "epoch": 0.6372148859543818, "percentage": 63.72, "elapsed_time": "19:04:18", "remaining_time": "10:51:29", "throughput": 1583.3, "total_tokens": 108707840} -{"current_steps": 13280, "total_steps": 20825, "loss": 1.0365, "learning_rate": 1.5839261161564138e-05, "epoch": 0.6376950780312125, "percentage": 63.77, "elapsed_time": "19:05:04", "remaining_time": "10:50:34", "throughput": 1583.44, "total_tokens": 108789760} -{"current_steps": 13290, "total_steps": 20825, "loss": 0.9743, "learning_rate": 1.5802411623739345e-05, "epoch": 0.6381752701080432, "percentage": 63.82, "elapsed_time": "19:05:50", "remaining_time": "10:49:39", "throughput": 1583.57, "total_tokens": 108871680} -{"current_steps": 13300, "total_steps": 20825, "loss": 0.8376, "learning_rate": 1.57655851824709e-05, "epoch": 0.6386554621848739, "percentage": 63.87, "elapsed_time": "19:06:36", "remaining_time": "10:48:44", "throughput": 1583.71, "total_tokens": 108953600} -{"current_steps": 13310, "total_steps": 20825, "loss": 0.9858, "learning_rate": 1.5728781930235627e-05, "epoch": 0.6391356542617047, "percentage": 63.91, "elapsed_time": "19:07:22", "remaining_time": "10:47:49", "throughput": 1583.84, "total_tokens": 109035520} -{"current_steps": 13320, "total_steps": 20825, "loss": 1.0486, "learning_rate": 1.5692001959452164e-05, "epoch": 0.6396158463385354, "percentage": 63.96, "elapsed_time": "19:08:08", "remaining_time": "10:46:54", "throughput": 1583.98, "total_tokens": 109117440} -{"current_steps": 13330, "total_steps": 20825, "loss": 0.8965, "learning_rate": 1.5655245362480654e-05, "epoch": 0.6400960384153661, "percentage": 64.01, "elapsed_time": "19:08:54", "remaining_time": "10:45:59", "throughput": 1584.11, "total_tokens": 109199360} -{"current_steps": 13340, "total_steps": 20825, "loss": 0.8839, "learning_rate": 1.561851223162254e-05, "epoch": 0.6405762304921969, "percentage": 64.06, "elapsed_time": "19:09:39", "remaining_time": "10:45:04", "throughput": 1584.25, "total_tokens": 109281280} -{"current_steps": 13350, "total_steps": 20825, "loss": 0.9363, "learning_rate": 1.558180265912037e-05, "epoch": 0.6410564225690276, "percentage": 64.11, "elapsed_time": "19:10:25", "remaining_time": "10:44:09", "throughput": 1584.39, "total_tokens": 109363200} -{"current_steps": 13360, "total_steps": 20825, "loss": 0.9724, "learning_rate": 1.5545116737157522e-05, "epoch": 0.6415366146458583, "percentage": 64.15, "elapsed_time": "19:11:11", "remaining_time": "10:43:14", "throughput": 1584.53, "total_tokens": 109445120} -{"current_steps": 13370, "total_steps": 20825, "loss": 0.7562, "learning_rate": 1.5508454557857966e-05, "epoch": 0.6420168067226891, "percentage": 64.2, "elapsed_time": "19:11:57", "remaining_time": "10:42:19", "throughput": 1584.66, "total_tokens": 109527040} -{"current_steps": 13380, "total_steps": 20825, "loss": 0.8147, "learning_rate": 1.5471816213286054e-05, "epoch": 0.6424969987995198, "percentage": 64.25, "elapsed_time": "19:12:43", "remaining_time": "10:41:24", "throughput": 1584.79, "total_tokens": 109608960} -{"current_steps": 13390, "total_steps": 20825, "loss": 0.9489, "learning_rate": 1.5435201795446317e-05, "epoch": 0.6429771908763505, "percentage": 64.3, "elapsed_time": "19:13:29", "remaining_time": "10:40:29", "throughput": 1584.92, "total_tokens": 109690880} -{"current_steps": 13400, "total_steps": 20825, "loss": 0.8655, "learning_rate": 1.5398611396283153e-05, "epoch": 0.6434573829531812, "percentage": 64.35, "elapsed_time": "19:14:15", "remaining_time": "10:39:34", "throughput": 1585.05, "total_tokens": 109772800} -{"current_steps": 13410, "total_steps": 20825, "loss": 0.8621, "learning_rate": 1.536204510768069e-05, "epoch": 0.643937575030012, "percentage": 64.39, "elapsed_time": "19:15:01", "remaining_time": "10:38:39", "throughput": 1585.18, "total_tokens": 109854720} -{"current_steps": 13420, "total_steps": 20825, "loss": 0.8371, "learning_rate": 1.532550302146249e-05, "epoch": 0.6444177671068427, "percentage": 64.44, "elapsed_time": "19:15:46", "remaining_time": "10:37:44", "throughput": 1585.32, "total_tokens": 109936640} -{"current_steps": 13430, "total_steps": 20825, "loss": 0.7762, "learning_rate": 1.528898522939133e-05, "epoch": 0.6448979591836734, "percentage": 64.49, "elapsed_time": "19:16:33", "remaining_time": "10:36:50", "throughput": 1585.44, "total_tokens": 110018560} -{"current_steps": 13440, "total_steps": 20825, "loss": 0.9059, "learning_rate": 1.5252491823168994e-05, "epoch": 0.6453781512605042, "percentage": 64.54, "elapsed_time": "19:17:18", "remaining_time": "10:35:55", "throughput": 1585.57, "total_tokens": 110100480} -{"current_steps": 13450, "total_steps": 20825, "loss": 0.9104, "learning_rate": 1.5216022894436043e-05, "epoch": 0.6458583433373349, "percentage": 64.59, "elapsed_time": "19:18:05", "remaining_time": "10:35:00", "throughput": 1585.7, "total_tokens": 110182400} -{"current_steps": 13460, "total_steps": 20825, "loss": 0.9764, "learning_rate": 1.517957853477154e-05, "epoch": 0.6463385354141656, "percentage": 64.63, "elapsed_time": "19:18:50", "remaining_time": "10:34:05", "throughput": 1585.84, "total_tokens": 110264320} -{"current_steps": 13470, "total_steps": 20825, "loss": 0.8985, "learning_rate": 1.5143158835692866e-05, "epoch": 0.6468187274909964, "percentage": 64.68, "elapsed_time": "19:19:36", "remaining_time": "10:33:10", "throughput": 1585.97, "total_tokens": 110346240} -{"current_steps": 13480, "total_steps": 20825, "loss": 1.1936, "learning_rate": 1.5106763888655478e-05, "epoch": 0.6472989195678271, "percentage": 64.73, "elapsed_time": "19:20:22", "remaining_time": "10:32:15", "throughput": 1586.11, "total_tokens": 110428160} -{"current_steps": 13490, "total_steps": 20825, "loss": 0.9241, "learning_rate": 1.5070393785052695e-05, "epoch": 0.6477791116446578, "percentage": 64.78, "elapsed_time": "19:21:07", "remaining_time": "10:31:20", "throughput": 1586.24, "total_tokens": 110510080} -{"current_steps": 13500, "total_steps": 20825, "loss": 0.7714, "learning_rate": 1.5034048616215402e-05, "epoch": 0.6482593037214885, "percentage": 64.83, "elapsed_time": "19:21:53", "remaining_time": "10:30:26", "throughput": 1586.37, "total_tokens": 110592000} -{"current_steps": 13510, "total_steps": 20825, "loss": 1.0863, "learning_rate": 1.4997728473411903e-05, "epoch": 0.6487394957983194, "percentage": 64.87, "elapsed_time": "19:22:39", "remaining_time": "10:29:31", "throughput": 1586.5, "total_tokens": 110673920} -{"current_steps": 13520, "total_steps": 20825, "loss": 0.8677, "learning_rate": 1.4961433447847672e-05, "epoch": 0.64921968787515, "percentage": 64.92, "elapsed_time": "19:23:25", "remaining_time": "10:28:36", "throughput": 1586.64, "total_tokens": 110755840} -{"current_steps": 13530, "total_steps": 20825, "loss": 0.8387, "learning_rate": 1.4925163630665065e-05, "epoch": 0.6496998799519808, "percentage": 64.97, "elapsed_time": "19:24:10", "remaining_time": "10:27:41", "throughput": 1586.78, "total_tokens": 110837760} -{"current_steps": 13540, "total_steps": 20825, "loss": 0.9952, "learning_rate": 1.4888919112943173e-05, "epoch": 0.6501800720288116, "percentage": 65.02, "elapsed_time": "19:24:56", "remaining_time": "10:26:46", "throughput": 1586.91, "total_tokens": 110919680} -{"current_steps": 13550, "total_steps": 20825, "loss": 0.8378, "learning_rate": 1.4852699985697546e-05, "epoch": 0.6506602641056423, "percentage": 65.07, "elapsed_time": "19:25:42", "remaining_time": "10:25:52", "throughput": 1587.03, "total_tokens": 111001600} -{"current_steps": 13560, "total_steps": 20825, "loss": 0.8531, "learning_rate": 1.4816506339879965e-05, "epoch": 0.651140456182473, "percentage": 65.11, "elapsed_time": "19:26:28", "remaining_time": "10:24:57", "throughput": 1587.16, "total_tokens": 111083520} -{"current_steps": 13570, "total_steps": 20825, "loss": 0.8573, "learning_rate": 1.4780338266378232e-05, "epoch": 0.6516206482593038, "percentage": 65.16, "elapsed_time": "19:27:14", "remaining_time": "10:24:02", "throughput": 1587.3, "total_tokens": 111165440} -{"current_steps": 13580, "total_steps": 20825, "loss": 0.6841, "learning_rate": 1.4744195856015947e-05, "epoch": 0.6521008403361345, "percentage": 65.21, "elapsed_time": "19:28:00", "remaining_time": "10:23:08", "throughput": 1587.42, "total_tokens": 111247360} -{"current_steps": 13590, "total_steps": 20825, "loss": 0.8537, "learning_rate": 1.4708079199552221e-05, "epoch": 0.6525810324129652, "percentage": 65.26, "elapsed_time": "19:28:46", "remaining_time": "10:22:13", "throughput": 1587.55, "total_tokens": 111329280} -{"current_steps": 13600, "total_steps": 20825, "loss": 1.038, "learning_rate": 1.4671988387681549e-05, "epoch": 0.6530612244897959, "percentage": 65.31, "elapsed_time": "19:29:32", "remaining_time": "10:21:19", "throughput": 1587.68, "total_tokens": 111411200} -{"current_steps": 13610, "total_steps": 20825, "loss": 0.9946, "learning_rate": 1.4635923511033494e-05, "epoch": 0.6535414165666267, "percentage": 65.35, "elapsed_time": "19:30:18", "remaining_time": "10:20:24", "throughput": 1587.8, "total_tokens": 111493120} -{"current_steps": 13620, "total_steps": 20825, "loss": 1.8003, "learning_rate": 1.4599884660172485e-05, "epoch": 0.6540216086434574, "percentage": 65.4, "elapsed_time": "19:31:04", "remaining_time": "10:19:30", "throughput": 1587.92, "total_tokens": 111575040} -{"current_steps": 13630, "total_steps": 20825, "loss": 0.8789, "learning_rate": 1.4563871925597622e-05, "epoch": 0.6545018007202881, "percentage": 65.45, "elapsed_time": "19:31:50", "remaining_time": "10:18:35", "throughput": 1588.06, "total_tokens": 111656960} -{"current_steps": 13640, "total_steps": 20825, "loss": 0.6229, "learning_rate": 1.452788539774241e-05, "epoch": 0.6549819927971189, "percentage": 65.5, "elapsed_time": "19:32:37", "remaining_time": "10:17:41", "throughput": 1588.17, "total_tokens": 111738880} -{"current_steps": 13650, "total_steps": 20825, "loss": 0.8647, "learning_rate": 1.4491925166974532e-05, "epoch": 0.6554621848739496, "percentage": 65.55, "elapsed_time": "19:33:23", "remaining_time": "10:16:46", "throughput": 1588.29, "total_tokens": 111820800} -{"current_steps": 13660, "total_steps": 20825, "loss": 0.8938, "learning_rate": 1.4455991323595655e-05, "epoch": 0.6559423769507803, "percentage": 65.59, "elapsed_time": "19:34:09", "remaining_time": "10:15:52", "throughput": 1588.41, "total_tokens": 111902720} -{"current_steps": 13670, "total_steps": 20825, "loss": 0.8419, "learning_rate": 1.4420083957841185e-05, "epoch": 0.6564225690276111, "percentage": 65.64, "elapsed_time": "19:34:55", "remaining_time": "10:14:57", "throughput": 1588.54, "total_tokens": 111984640} -{"current_steps": 13680, "total_steps": 20825, "loss": 0.8683, "learning_rate": 1.4384203159880017e-05, "epoch": 0.6569027611044418, "percentage": 65.69, "elapsed_time": "19:35:41", "remaining_time": "10:14:03", "throughput": 1588.67, "total_tokens": 112066560} -{"current_steps": 13690, "total_steps": 20825, "loss": 1.1068, "learning_rate": 1.4348349019814344e-05, "epoch": 0.6573829531812725, "percentage": 65.74, "elapsed_time": "19:36:27", "remaining_time": "10:13:09", "throughput": 1588.79, "total_tokens": 112148480} -{"current_steps": 13700, "total_steps": 20825, "loss": 0.9632, "learning_rate": 1.4312521627679428e-05, "epoch": 0.6578631452581032, "percentage": 65.79, "elapsed_time": "19:37:13", "remaining_time": "10:12:14", "throughput": 1588.92, "total_tokens": 112230400} -{"current_steps": 13710, "total_steps": 20825, "loss": 0.8043, "learning_rate": 1.4276721073443344e-05, "epoch": 0.658343337334934, "percentage": 65.83, "elapsed_time": "19:37:59", "remaining_time": "10:11:19", "throughput": 1589.04, "total_tokens": 112312320} -{"current_steps": 13720, "total_steps": 20825, "loss": 1.025, "learning_rate": 1.4240947447006764e-05, "epoch": 0.6588235294117647, "percentage": 65.88, "elapsed_time": "19:38:45", "remaining_time": "10:10:25", "throughput": 1589.16, "total_tokens": 112394240} -{"current_steps": 13730, "total_steps": 20825, "loss": 1.0484, "learning_rate": 1.4205200838202782e-05, "epoch": 0.6593037214885954, "percentage": 65.93, "elapsed_time": "19:39:31", "remaining_time": "10:09:31", "throughput": 1589.29, "total_tokens": 112476160} -{"current_steps": 13740, "total_steps": 20825, "loss": 1.0862, "learning_rate": 1.4169481336796597e-05, "epoch": 0.6597839135654262, "percentage": 65.98, "elapsed_time": "19:40:17", "remaining_time": "10:08:36", "throughput": 1589.42, "total_tokens": 112558080} -{"current_steps": 13750, "total_steps": 20825, "loss": 0.9006, "learning_rate": 1.4133789032485367e-05, "epoch": 0.6602641056422569, "percentage": 66.03, "elapsed_time": "19:41:02", "remaining_time": "10:07:42", "throughput": 1589.55, "total_tokens": 112640000} -{"current_steps": 13760, "total_steps": 20825, "loss": 0.8773, "learning_rate": 1.4098124014897961e-05, "epoch": 0.6607442977190876, "percentage": 66.07, "elapsed_time": "19:41:48", "remaining_time": "10:06:47", "throughput": 1589.68, "total_tokens": 112721920} -{"current_steps": 13770, "total_steps": 20825, "loss": 0.802, "learning_rate": 1.4062486373594694e-05, "epoch": 0.6612244897959184, "percentage": 66.12, "elapsed_time": "19:42:34", "remaining_time": "10:05:53", "throughput": 1589.81, "total_tokens": 112803840} -{"current_steps": 13780, "total_steps": 20825, "loss": 1.0097, "learning_rate": 1.4026876198067163e-05, "epoch": 0.6617046818727491, "percentage": 66.17, "elapsed_time": "19:43:20", "remaining_time": "10:04:58", "throughput": 1589.93, "total_tokens": 112885760} -{"current_steps": 13790, "total_steps": 20825, "loss": 0.9333, "learning_rate": 1.399129357773799e-05, "epoch": 0.6621848739495798, "percentage": 66.22, "elapsed_time": "19:44:06", "remaining_time": "10:04:04", "throughput": 1590.06, "total_tokens": 112967680} -{"current_steps": 13800, "total_steps": 20825, "loss": 0.8832, "learning_rate": 1.3955738601960588e-05, "epoch": 0.6626650660264105, "percentage": 66.27, "elapsed_time": "19:44:52", "remaining_time": "10:03:09", "throughput": 1590.19, "total_tokens": 113049600} -{"current_steps": 13810, "total_steps": 20825, "loss": 0.7867, "learning_rate": 1.392021136001897e-05, "epoch": 0.6631452581032413, "percentage": 66.31, "elapsed_time": "19:45:38", "remaining_time": "10:02:15", "throughput": 1590.31, "total_tokens": 113131520} -{"current_steps": 13820, "total_steps": 20825, "loss": 0.9924, "learning_rate": 1.3884711941127487e-05, "epoch": 0.663625450180072, "percentage": 66.36, "elapsed_time": "19:46:23", "remaining_time": "10:01:21", "throughput": 1590.44, "total_tokens": 113213440} -{"current_steps": 13830, "total_steps": 20825, "loss": 0.7811, "learning_rate": 1.384924043443062e-05, "epoch": 0.6641056422569027, "percentage": 66.41, "elapsed_time": "19:47:10", "remaining_time": "10:00:27", "throughput": 1590.56, "total_tokens": 113295360} -{"current_steps": 13840, "total_steps": 20825, "loss": 0.7269, "learning_rate": 1.3813796929002779e-05, "epoch": 0.6645858343337335, "percentage": 66.46, "elapsed_time": "19:47:55", "remaining_time": "9:59:32", "throughput": 1590.69, "total_tokens": 113377280} -{"current_steps": 13850, "total_steps": 20825, "loss": 0.7797, "learning_rate": 1.3778381513848055e-05, "epoch": 0.6650660264105642, "percentage": 66.51, "elapsed_time": "19:48:41", "remaining_time": "9:58:38", "throughput": 1590.8, "total_tokens": 113459200} -{"current_steps": 13860, "total_steps": 20825, "loss": 0.7852, "learning_rate": 1.3742994277899967e-05, "epoch": 0.6655462184873949, "percentage": 66.55, "elapsed_time": "19:49:27", "remaining_time": "9:57:44", "throughput": 1590.93, "total_tokens": 113541120} -{"current_steps": 13870, "total_steps": 20825, "loss": 1.2018, "learning_rate": 1.370763531002132e-05, "epoch": 0.6660264105642257, "percentage": 66.6, "elapsed_time": "19:50:13", "remaining_time": "9:56:49", "throughput": 1591.05, "total_tokens": 113623040} -{"current_steps": 13880, "total_steps": 20825, "loss": 0.7667, "learning_rate": 1.3672304699003908e-05, "epoch": 0.6665066026410564, "percentage": 66.65, "elapsed_time": "19:51:00", "remaining_time": "9:55:55", "throughput": 1591.16, "total_tokens": 113704960} -{"current_steps": 13890, "total_steps": 20825, "loss": 0.8471, "learning_rate": 1.3637002533568302e-05, "epoch": 0.6669867947178871, "percentage": 66.7, "elapsed_time": "19:51:47", "remaining_time": "9:55:02", "throughput": 1591.26, "total_tokens": 113786880} -{"current_steps": 13900, "total_steps": 20825, "loss": 1.1894, "learning_rate": 1.3601728902363681e-05, "epoch": 0.6674669867947179, "percentage": 66.75, "elapsed_time": "19:52:38", "remaining_time": "9:54:10", "throughput": 1591.27, "total_tokens": 113868800} -{"current_steps": 13910, "total_steps": 20825, "loss": 0.9134, "learning_rate": 1.356648389396754e-05, "epoch": 0.6679471788715486, "percentage": 66.79, "elapsed_time": "19:53:31", "remaining_time": "9:53:19", "throughput": 1591.24, "total_tokens": 113950720} -{"current_steps": 13920, "total_steps": 20825, "loss": 1.1423, "learning_rate": 1.3531267596885488e-05, "epoch": 0.6684273709483793, "percentage": 66.84, "elapsed_time": "19:54:18", "remaining_time": "9:52:26", "throughput": 1591.34, "total_tokens": 114032640} -{"current_steps": 13930, "total_steps": 20825, "loss": 0.7921, "learning_rate": 1.349608009955107e-05, "epoch": 0.66890756302521, "percentage": 66.89, "elapsed_time": "19:55:04", "remaining_time": "9:51:31", "throughput": 1591.46, "total_tokens": 114114560} -{"current_steps": 13940, "total_steps": 20825, "loss": 0.8029, "learning_rate": 1.34609214903255e-05, "epoch": 0.6693877551020408, "percentage": 66.94, "elapsed_time": "19:55:52", "remaining_time": "9:50:38", "throughput": 1591.54, "total_tokens": 114196480} -{"current_steps": 13950, "total_steps": 20825, "loss": 0.9638, "learning_rate": 1.3425791857497422e-05, "epoch": 0.6698679471788715, "percentage": 66.99, "elapsed_time": "19:56:43", "remaining_time": "9:49:47", "throughput": 1591.54, "total_tokens": 114278400} -{"current_steps": 13960, "total_steps": 20825, "loss": 0.8415, "learning_rate": 1.3390691289282754e-05, "epoch": 0.6703481392557022, "percentage": 67.03, "elapsed_time": "19:57:38", "remaining_time": "9:48:57", "throughput": 1591.46, "total_tokens": 114360320} -{"current_steps": 13970, "total_steps": 20825, "loss": 0.9274, "learning_rate": 1.335561987382441e-05, "epoch": 0.6708283313325331, "percentage": 67.08, "elapsed_time": "19:58:29", "remaining_time": "9:48:05", "throughput": 1591.49, "total_tokens": 114442240} -{"current_steps": 13980, "total_steps": 20825, "loss": 0.7943, "learning_rate": 1.3320577699192086e-05, "epoch": 0.6713085234093638, "percentage": 67.13, "elapsed_time": "19:59:18", "remaining_time": "9:47:12", "throughput": 1591.53, "total_tokens": 114524160} -{"current_steps": 13990, "total_steps": 20825, "loss": 0.9644, "learning_rate": 1.3285564853382076e-05, "epoch": 0.6717887154861945, "percentage": 67.18, "elapsed_time": "20:00:08", "remaining_time": "9:46:20", "throughput": 1591.56, "total_tokens": 114606080} -{"current_steps": 14000, "total_steps": 20825, "loss": 0.8024, "learning_rate": 1.325058142431701e-05, "epoch": 0.6722689075630253, "percentage": 67.23, "elapsed_time": "20:01:00", "remaining_time": "9:45:29", "throughput": 1591.56, "total_tokens": 114688000} -{"current_steps": 14010, "total_steps": 20825, "loss": 0.7327, "learning_rate": 1.321562749984563e-05, "epoch": 0.672749099639856, "percentage": 67.27, "elapsed_time": "20:02:01", "remaining_time": "9:44:42", "throughput": 1591.34, "total_tokens": 114769920} -{"current_steps": 14020, "total_steps": 20825, "loss": 0.9788, "learning_rate": 1.318070316774262e-05, "epoch": 0.6732292917166867, "percentage": 67.32, "elapsed_time": "20:02:53", "remaining_time": "9:43:51", "throughput": 1591.34, "total_tokens": 114851840} -{"current_steps": 14030, "total_steps": 20825, "loss": 0.7022, "learning_rate": 1.3145808515708347e-05, "epoch": 0.6737094837935174, "percentage": 67.37, "elapsed_time": "20:03:42", "remaining_time": "9:42:58", "throughput": 1591.38, "total_tokens": 114933760} -{"current_steps": 14040, "total_steps": 20825, "loss": 0.9829, "learning_rate": 1.3110943631368616e-05, "epoch": 0.6741896758703482, "percentage": 67.42, "elapsed_time": "20:04:32", "remaining_time": "9:42:06", "throughput": 1591.42, "total_tokens": 115015680} -{"current_steps": 14050, "total_steps": 20825, "loss": 0.7022, "learning_rate": 1.3076108602274522e-05, "epoch": 0.6746698679471789, "percentage": 67.47, "elapsed_time": "20:05:21", "remaining_time": "9:41:14", "throughput": 1591.46, "total_tokens": 115097600} -{"current_steps": 14060, "total_steps": 20825, "loss": 0.8251, "learning_rate": 1.3041303515902179e-05, "epoch": 0.6751500600240096, "percentage": 67.52, "elapsed_time": "20:06:11", "remaining_time": "9:40:21", "throughput": 1591.49, "total_tokens": 115179520} -{"current_steps": 14070, "total_steps": 20825, "loss": 1.0901, "learning_rate": 1.3006528459652476e-05, "epoch": 0.6756302521008404, "percentage": 67.56, "elapsed_time": "20:07:02", "remaining_time": "9:39:29", "throughput": 1591.52, "total_tokens": 115261440} -{"current_steps": 14080, "total_steps": 20825, "loss": 0.9864, "learning_rate": 1.2971783520850939e-05, "epoch": 0.6761104441776711, "percentage": 67.61, "elapsed_time": "20:07:51", "remaining_time": "9:38:37", "throughput": 1591.56, "total_tokens": 115343360} -{"current_steps": 14090, "total_steps": 20825, "loss": 0.9465, "learning_rate": 1.2937068786747438e-05, "epoch": 0.6765906362545018, "percentage": 67.66, "elapsed_time": "20:08:40", "remaining_time": "9:37:44", "throughput": 1591.62, "total_tokens": 115425280} -{"current_steps": 14100, "total_steps": 20825, "loss": 0.9708, "learning_rate": 1.2902384344515986e-05, "epoch": 0.6770708283313326, "percentage": 67.71, "elapsed_time": "20:09:29", "remaining_time": "9:36:51", "throughput": 1591.69, "total_tokens": 115507200} -{"current_steps": 14110, "total_steps": 20825, "loss": 0.7833, "learning_rate": 1.286773028125455e-05, "epoch": 0.6775510204081633, "percentage": 67.76, "elapsed_time": "20:10:25", "remaining_time": "9:36:02", "throughput": 1591.57, "total_tokens": 115589120} -{"current_steps": 14120, "total_steps": 20825, "loss": 0.9278, "learning_rate": 1.2833106683984808e-05, "epoch": 0.678031212484994, "percentage": 67.8, "elapsed_time": "20:11:12", "remaining_time": "9:35:09", "throughput": 1591.68, "total_tokens": 115671040} -{"current_steps": 14130, "total_steps": 20825, "loss": 0.8275, "learning_rate": 1.279851363965193e-05, "epoch": 0.6785114045618247, "percentage": 67.85, "elapsed_time": "20:11:59", "remaining_time": "9:34:15", "throughput": 1591.77, "total_tokens": 115752960} -{"current_steps": 14140, "total_steps": 20825, "loss": 0.8764, "learning_rate": 1.2763951235124346e-05, "epoch": 0.6789915966386555, "percentage": 67.9, "elapsed_time": "20:12:47", "remaining_time": "9:33:22", "throughput": 1591.86, "total_tokens": 115834880} -{"current_steps": 14150, "total_steps": 20825, "loss": 0.9236, "learning_rate": 1.2729419557193573e-05, "epoch": 0.6794717887154862, "percentage": 67.95, "elapsed_time": "20:13:34", "remaining_time": "9:32:28", "throughput": 1591.94, "total_tokens": 115916800} -{"current_steps": 14160, "total_steps": 20825, "loss": 0.7963, "learning_rate": 1.2694918692573954e-05, "epoch": 0.6799519807923169, "percentage": 68.0, "elapsed_time": "20:14:28", "remaining_time": "9:31:38", "throughput": 1591.9, "total_tokens": 115998720} -{"current_steps": 14170, "total_steps": 20825, "loss": 0.7971, "learning_rate": 1.2660448727902457e-05, "epoch": 0.6804321728691477, "percentage": 68.04, "elapsed_time": "20:15:15", "remaining_time": "9:30:45", "throughput": 1591.99, "total_tokens": 116080640} -{"current_steps": 14180, "total_steps": 20825, "loss": 0.7678, "learning_rate": 1.2626009749738444e-05, "epoch": 0.6809123649459784, "percentage": 68.09, "elapsed_time": "20:16:02", "remaining_time": "9:29:51", "throughput": 1592.09, "total_tokens": 116162560} -{"current_steps": 14190, "total_steps": 20825, "loss": 0.8935, "learning_rate": 1.2591601844563488e-05, "epoch": 0.6813925570228091, "percentage": 68.14, "elapsed_time": "20:16:50", "remaining_time": "9:28:58", "throughput": 1592.17, "total_tokens": 116244480} -{"current_steps": 14200, "total_steps": 20825, "loss": 0.9236, "learning_rate": 1.2557225098781105e-05, "epoch": 0.6818727490996399, "percentage": 68.19, "elapsed_time": "20:17:37", "remaining_time": "9:28:05", "throughput": 1592.25, "total_tokens": 116326400} -{"current_steps": 14210, "total_steps": 20825, "loss": 0.8667, "learning_rate": 1.2522879598716595e-05, "epoch": 0.6823529411764706, "percentage": 68.24, "elapsed_time": "20:18:24", "remaining_time": "9:27:11", "throughput": 1592.35, "total_tokens": 116408320} -{"current_steps": 14220, "total_steps": 20825, "loss": 0.8728, "learning_rate": 1.2488565430616785e-05, "epoch": 0.6828331332533013, "percentage": 68.28, "elapsed_time": "20:19:10", "remaining_time": "9:26:17", "throughput": 1592.47, "total_tokens": 116490240} -{"current_steps": 14230, "total_steps": 20825, "loss": 0.6747, "learning_rate": 1.2454282680649804e-05, "epoch": 0.683313325330132, "percentage": 68.33, "elapsed_time": "20:19:57", "remaining_time": "9:25:24", "throughput": 1592.56, "total_tokens": 116572160} -{"current_steps": 14240, "total_steps": 20825, "loss": 0.864, "learning_rate": 1.2420031434904906e-05, "epoch": 0.6837935174069628, "percentage": 68.38, "elapsed_time": "20:20:43", "remaining_time": "9:24:30", "throughput": 1592.68, "total_tokens": 116654080} -{"current_steps": 14250, "total_steps": 20825, "loss": 0.8979, "learning_rate": 1.2385811779392236e-05, "epoch": 0.6842737094837935, "percentage": 68.43, "elapsed_time": "20:21:30", "remaining_time": "9:23:36", "throughput": 1592.79, "total_tokens": 116736000} -{"current_steps": 14260, "total_steps": 20825, "loss": 0.9371, "learning_rate": 1.2351623800042587e-05, "epoch": 0.6847539015606242, "percentage": 68.48, "elapsed_time": "20:22:15", "remaining_time": "9:22:42", "throughput": 1592.92, "total_tokens": 116817920} -{"current_steps": 14270, "total_steps": 20825, "loss": 0.9432, "learning_rate": 1.2317467582707238e-05, "epoch": 0.685234093637455, "percentage": 68.52, "elapsed_time": "20:23:02", "remaining_time": "9:21:48", "throughput": 1593.02, "total_tokens": 116899840} -{"current_steps": 14280, "total_steps": 20825, "loss": 0.8542, "learning_rate": 1.2283343213157688e-05, "epoch": 0.6857142857142857, "percentage": 68.57, "elapsed_time": "20:23:49", "remaining_time": "9:20:55", "throughput": 1593.12, "total_tokens": 116981760} -{"current_steps": 14290, "total_steps": 20825, "loss": 0.897, "learning_rate": 1.2249250777085456e-05, "epoch": 0.6861944777911164, "percentage": 68.62, "elapsed_time": "20:24:37", "remaining_time": "9:20:02", "throughput": 1593.18, "total_tokens": 117063680} -{"current_steps": 14300, "total_steps": 20825, "loss": 0.9898, "learning_rate": 1.221519036010189e-05, "epoch": 0.6866746698679472, "percentage": 68.67, "elapsed_time": "20:25:25", "remaining_time": "9:19:09", "throughput": 1593.26, "total_tokens": 117145600} -{"current_steps": 14310, "total_steps": 20825, "loss": 0.7581, "learning_rate": 1.2181162047737942e-05, "epoch": 0.6871548619447779, "percentage": 68.72, "elapsed_time": "20:26:12", "remaining_time": "9:18:15", "throughput": 1593.35, "total_tokens": 117227520} -{"current_steps": 14320, "total_steps": 20825, "loss": 1.0274, "learning_rate": 1.2147165925443904e-05, "epoch": 0.6876350540216086, "percentage": 68.76, "elapsed_time": "20:27:00", "remaining_time": "9:17:22", "throughput": 1593.44, "total_tokens": 117309440} -{"current_steps": 14330, "total_steps": 20825, "loss": 0.8403, "learning_rate": 1.2113202078589267e-05, "epoch": 0.6881152460984393, "percentage": 68.81, "elapsed_time": "20:27:48", "remaining_time": "9:16:29", "throughput": 1593.51, "total_tokens": 117391360} -{"current_steps": 14340, "total_steps": 20825, "loss": 0.8582, "learning_rate": 1.2079270592462475e-05, "epoch": 0.6885954381752701, "percentage": 68.86, "elapsed_time": "20:28:35", "remaining_time": "9:15:36", "throughput": 1593.61, "total_tokens": 117473280} -{"current_steps": 14350, "total_steps": 20825, "loss": 0.876, "learning_rate": 1.204537155227068e-05, "epoch": 0.6890756302521008, "percentage": 68.91, "elapsed_time": "20:29:22", "remaining_time": "9:14:43", "throughput": 1593.7, "total_tokens": 117555200} -{"current_steps": 14360, "total_steps": 20825, "loss": 0.9847, "learning_rate": 1.201150504313959e-05, "epoch": 0.6895558223289315, "percentage": 68.96, "elapsed_time": "20:30:08", "remaining_time": "9:13:49", "throughput": 1593.82, "total_tokens": 117637120} -{"current_steps": 14370, "total_steps": 20825, "loss": 0.8981, "learning_rate": 1.1977671150113206e-05, "epoch": 0.6900360144057623, "percentage": 69.0, "elapsed_time": "20:30:53", "remaining_time": "9:12:55", "throughput": 1593.94, "total_tokens": 117719040} -{"current_steps": 14380, "total_steps": 20825, "loss": 0.929, "learning_rate": 1.1943869958153613e-05, "epoch": 0.690516206482593, "percentage": 69.05, "elapsed_time": "20:31:39", "remaining_time": "9:12:01", "throughput": 1594.06, "total_tokens": 117800960} -{"current_steps": 14390, "total_steps": 20825, "loss": 0.9613, "learning_rate": 1.1910101552140806e-05, "epoch": 0.6909963985594237, "percentage": 69.1, "elapsed_time": "20:32:25", "remaining_time": "9:11:07", "throughput": 1594.18, "total_tokens": 117882880} -{"current_steps": 14400, "total_steps": 20825, "loss": 0.9258, "learning_rate": 1.1876366016872445e-05, "epoch": 0.6914765906362546, "percentage": 69.15, "elapsed_time": "20:33:11", "remaining_time": "9:10:13", "throughput": 1594.31, "total_tokens": 117964800} -{"current_steps": 14410, "total_steps": 20825, "loss": 0.7828, "learning_rate": 1.1842663437063613e-05, "epoch": 0.6919567827130852, "percentage": 69.2, "elapsed_time": "20:33:56", "remaining_time": "9:09:19", "throughput": 1594.43, "total_tokens": 118046720} -{"current_steps": 14420, "total_steps": 20825, "loss": 0.9457, "learning_rate": 1.180899389734668e-05, "epoch": 0.692436974789916, "percentage": 69.24, "elapsed_time": "20:34:42", "remaining_time": "9:08:25", "throughput": 1594.55, "total_tokens": 118128640} -{"current_steps": 14430, "total_steps": 20825, "loss": 0.872, "learning_rate": 1.1775357482271032e-05, "epoch": 0.6929171668667466, "percentage": 69.29, "elapsed_time": "20:35:28", "remaining_time": "9:07:31", "throughput": 1594.67, "total_tokens": 118210560} -{"current_steps": 14440, "total_steps": 20825, "loss": 0.8554, "learning_rate": 1.1741754276302851e-05, "epoch": 0.6933973589435775, "percentage": 69.34, "elapsed_time": "20:36:14", "remaining_time": "9:06:37", "throughput": 1594.8, "total_tokens": 118292480} -{"current_steps": 14450, "total_steps": 20825, "loss": 0.9142, "learning_rate": 1.170818436382497e-05, "epoch": 0.6938775510204082, "percentage": 69.39, "elapsed_time": "20:36:59", "remaining_time": "9:05:43", "throughput": 1594.93, "total_tokens": 118374400} -{"current_steps": 14460, "total_steps": 20825, "loss": 0.9356, "learning_rate": 1.1674647829136581e-05, "epoch": 0.6943577430972389, "percentage": 69.44, "elapsed_time": "20:37:44", "remaining_time": "9:04:49", "throughput": 1595.06, "total_tokens": 118456320} -{"current_steps": 14470, "total_steps": 20825, "loss": 0.9423, "learning_rate": 1.164114475645306e-05, "epoch": 0.6948379351740697, "percentage": 69.48, "elapsed_time": "20:38:29", "remaining_time": "9:03:55", "throughput": 1595.19, "total_tokens": 118538240} -{"current_steps": 14480, "total_steps": 20825, "loss": 0.8267, "learning_rate": 1.1607675229905776e-05, "epoch": 0.6953181272509004, "percentage": 69.53, "elapsed_time": "20:39:15", "remaining_time": "9:03:01", "throughput": 1595.32, "total_tokens": 118620160} -{"current_steps": 14490, "total_steps": 20825, "loss": 0.8272, "learning_rate": 1.1574239333541856e-05, "epoch": 0.6957983193277311, "percentage": 69.58, "elapsed_time": "20:40:01", "remaining_time": "9:02:08", "throughput": 1595.43, "total_tokens": 118702080} -{"current_steps": 14500, "total_steps": 20825, "loss": 1.0219, "learning_rate": 1.1540837151323951e-05, "epoch": 0.6962785114045619, "percentage": 69.63, "elapsed_time": "20:40:46", "remaining_time": "9:01:14", "throughput": 1595.56, "total_tokens": 118784000} -{"current_steps": 14510, "total_steps": 20825, "loss": 1.0269, "learning_rate": 1.150746876713008e-05, "epoch": 0.6967587034813926, "percentage": 69.68, "elapsed_time": "20:41:31", "remaining_time": "9:00:20", "throughput": 1595.69, "total_tokens": 118865920} -{"current_steps": 14520, "total_steps": 20825, "loss": 0.9424, "learning_rate": 1.1474134264753384e-05, "epoch": 0.6972388955582233, "percentage": 69.72, "elapsed_time": "20:42:17", "remaining_time": "8:59:26", "throughput": 1595.81, "total_tokens": 118947840} -{"current_steps": 14530, "total_steps": 20825, "loss": 0.8436, "learning_rate": 1.1440833727901894e-05, "epoch": 0.697719087635054, "percentage": 69.77, "elapsed_time": "20:43:02", "remaining_time": "8:58:32", "throughput": 1595.94, "total_tokens": 119029760} -{"current_steps": 14540, "total_steps": 20825, "loss": 0.7876, "learning_rate": 1.1407567240198397e-05, "epoch": 0.6981992797118848, "percentage": 69.82, "elapsed_time": "20:43:48", "remaining_time": "8:57:38", "throughput": 1596.06, "total_tokens": 119111680} -{"current_steps": 14550, "total_steps": 20825, "loss": 0.8579, "learning_rate": 1.1374334885180135e-05, "epoch": 0.6986794717887155, "percentage": 69.87, "elapsed_time": "20:44:33", "remaining_time": "8:56:44", "throughput": 1596.19, "total_tokens": 119193600} -{"current_steps": 14560, "total_steps": 20825, "loss": 0.9189, "learning_rate": 1.1341136746298647e-05, "epoch": 0.6991596638655462, "percentage": 69.92, "elapsed_time": "20:45:19", "remaining_time": "8:55:50", "throughput": 1596.32, "total_tokens": 119275520} -{"current_steps": 14570, "total_steps": 20825, "loss": 0.834, "learning_rate": 1.1307972906919562e-05, "epoch": 0.699639855942377, "percentage": 69.96, "elapsed_time": "20:46:04", "remaining_time": "8:54:56", "throughput": 1596.45, "total_tokens": 119357440} -{"current_steps": 14580, "total_steps": 20825, "loss": 0.8542, "learning_rate": 1.1274843450322381e-05, "epoch": 0.7001200480192077, "percentage": 70.01, "elapsed_time": "20:46:50", "remaining_time": "8:54:03", "throughput": 1596.57, "total_tokens": 119439360} -{"current_steps": 14590, "total_steps": 20825, "loss": 0.8792, "learning_rate": 1.1241748459700241e-05, "epoch": 0.7006002400960384, "percentage": 70.06, "elapsed_time": "20:47:42", "remaining_time": "8:53:12", "throughput": 1596.54, "total_tokens": 119521280} -{"current_steps": 14600, "total_steps": 20825, "loss": 0.9641, "learning_rate": 1.1208688018159746e-05, "epoch": 0.7010804321728692, "percentage": 70.11, "elapsed_time": "20:48:27", "remaining_time": "8:52:18", "throughput": 1596.67, "total_tokens": 119603200} -{"current_steps": 14610, "total_steps": 20825, "loss": 1.0869, "learning_rate": 1.1175662208720758e-05, "epoch": 0.7015606242496999, "percentage": 70.16, "elapsed_time": "20:49:13", "remaining_time": "8:51:24", "throughput": 1596.8, "total_tokens": 119685120} -{"current_steps": 14620, "total_steps": 20825, "loss": 0.9409, "learning_rate": 1.1142671114316127e-05, "epoch": 0.7020408163265306, "percentage": 70.2, "elapsed_time": "20:49:58", "remaining_time": "8:50:30", "throughput": 1596.92, "total_tokens": 119767040} -{"current_steps": 14630, "total_steps": 20825, "loss": 0.9631, "learning_rate": 1.1109714817791584e-05, "epoch": 0.7025210084033613, "percentage": 70.25, "elapsed_time": "20:50:43", "remaining_time": "8:49:36", "throughput": 1597.06, "total_tokens": 119848960} -{"current_steps": 14640, "total_steps": 20825, "loss": 0.8025, "learning_rate": 1.1076793401905419e-05, "epoch": 0.7030012004801921, "percentage": 70.3, "elapsed_time": "20:51:28", "remaining_time": "8:48:42", "throughput": 1597.19, "total_tokens": 119930880} -{"current_steps": 14650, "total_steps": 20825, "loss": 0.8847, "learning_rate": 1.1043906949328387e-05, "epoch": 0.7034813925570228, "percentage": 70.35, "elapsed_time": "20:52:13", "remaining_time": "8:47:49", "throughput": 1597.32, "total_tokens": 120012800} -{"current_steps": 14660, "total_steps": 20825, "loss": 0.8116, "learning_rate": 1.1011055542643398e-05, "epoch": 0.7039615846338535, "percentage": 70.4, "elapsed_time": "20:52:59", "remaining_time": "8:46:55", "throughput": 1597.45, "total_tokens": 120094720} -{"current_steps": 14670, "total_steps": 20825, "loss": 0.9473, "learning_rate": 1.0978239264345397e-05, "epoch": 0.7044417767106843, "percentage": 70.44, "elapsed_time": "20:53:44", "remaining_time": "8:46:01", "throughput": 1597.58, "total_tokens": 120176640} -{"current_steps": 14680, "total_steps": 20825, "loss": 0.9452, "learning_rate": 1.0945458196841078e-05, "epoch": 0.704921968787515, "percentage": 70.49, "elapsed_time": "20:54:29", "remaining_time": "8:45:07", "throughput": 1597.7, "total_tokens": 120258560} -{"current_steps": 14690, "total_steps": 20825, "loss": 1.089, "learning_rate": 1.0912712422448737e-05, "epoch": 0.7054021608643457, "percentage": 70.54, "elapsed_time": "20:55:14", "remaining_time": "8:44:13", "throughput": 1597.84, "total_tokens": 120340480} -{"current_steps": 14700, "total_steps": 20825, "loss": 0.8222, "learning_rate": 1.0880002023398058e-05, "epoch": 0.7058823529411765, "percentage": 70.59, "elapsed_time": "20:55:59", "remaining_time": "8:43:19", "throughput": 1597.97, "total_tokens": 120422400} -{"current_steps": 14710, "total_steps": 20825, "loss": 0.8349, "learning_rate": 1.0847327081829853e-05, "epoch": 0.7063625450180072, "percentage": 70.64, "elapsed_time": "20:56:44", "remaining_time": "8:42:26", "throughput": 1598.09, "total_tokens": 120504320} -{"current_steps": 14720, "total_steps": 20825, "loss": 1.4205, "learning_rate": 1.0814687679795924e-05, "epoch": 0.7068427370948379, "percentage": 70.68, "elapsed_time": "20:57:30", "remaining_time": "8:41:32", "throughput": 1598.21, "total_tokens": 120586240} -{"current_steps": 14730, "total_steps": 20825, "loss": 0.9358, "learning_rate": 1.0782083899258827e-05, "epoch": 0.7073229291716686, "percentage": 70.73, "elapsed_time": "20:58:16", "remaining_time": "8:40:38", "throughput": 1598.34, "total_tokens": 120668160} -{"current_steps": 14740, "total_steps": 20825, "loss": 0.8712, "learning_rate": 1.0749515822091658e-05, "epoch": 0.7078031212484994, "percentage": 70.78, "elapsed_time": "20:59:01", "remaining_time": "8:39:45", "throughput": 1598.46, "total_tokens": 120750080} -{"current_steps": 14750, "total_steps": 20825, "loss": 1.2485, "learning_rate": 1.0716983530077843e-05, "epoch": 0.7082833133253301, "percentage": 70.83, "elapsed_time": "20:59:46", "remaining_time": "8:38:51", "throughput": 1598.59, "total_tokens": 120832000} -{"current_steps": 14760, "total_steps": 20825, "loss": 0.7965, "learning_rate": 1.0684487104910974e-05, "epoch": 0.7087635054021608, "percentage": 70.88, "elapsed_time": "21:00:31", "remaining_time": "8:37:57", "throughput": 1598.72, "total_tokens": 120913920} -{"current_steps": 14770, "total_steps": 20825, "loss": 0.8365, "learning_rate": 1.0652026628194567e-05, "epoch": 0.7092436974789916, "percentage": 70.92, "elapsed_time": "21:01:17", "remaining_time": "8:37:04", "throughput": 1598.84, "total_tokens": 120995840} -{"current_steps": 14780, "total_steps": 20825, "loss": 0.8742, "learning_rate": 1.0619602181441848e-05, "epoch": 0.7097238895558223, "percentage": 70.97, "elapsed_time": "21:02:02", "remaining_time": "8:36:10", "throughput": 1598.96, "total_tokens": 121077760} -{"current_steps": 14790, "total_steps": 20825, "loss": 0.7952, "learning_rate": 1.0587213846075591e-05, "epoch": 0.710204081632653, "percentage": 71.02, "elapsed_time": "21:02:48", "remaining_time": "8:35:16", "throughput": 1599.09, "total_tokens": 121159680} -{"current_steps": 14800, "total_steps": 20825, "loss": 0.9441, "learning_rate": 1.0554861703427884e-05, "epoch": 0.7106842737094838, "percentage": 71.07, "elapsed_time": "21:03:33", "remaining_time": "8:34:23", "throughput": 1599.21, "total_tokens": 121241600} -{"current_steps": 14810, "total_steps": 20825, "loss": 1.0587, "learning_rate": 1.0522545834739908e-05, "epoch": 0.7111644657863145, "percentage": 71.12, "elapsed_time": "21:04:19", "remaining_time": "8:33:29", "throughput": 1599.32, "total_tokens": 121323520} -{"current_steps": 14820, "total_steps": 20825, "loss": 0.9414, "learning_rate": 1.0490266321161785e-05, "epoch": 0.7116446578631452, "percentage": 71.16, "elapsed_time": "21:05:04", "remaining_time": "8:32:36", "throughput": 1599.45, "total_tokens": 121405440} -{"current_steps": 14830, "total_steps": 20825, "loss": 0.9523, "learning_rate": 1.0458023243752321e-05, "epoch": 0.712124849939976, "percentage": 71.21, "elapsed_time": "21:05:49", "remaining_time": "8:31:42", "throughput": 1599.58, "total_tokens": 121487360} -{"current_steps": 14840, "total_steps": 20825, "loss": 1.145, "learning_rate": 1.0425816683478823e-05, "epoch": 0.7126050420168067, "percentage": 71.26, "elapsed_time": "21:06:35", "remaining_time": "8:30:49", "throughput": 1599.68, "total_tokens": 121569280} -{"current_steps": 14850, "total_steps": 20825, "loss": 0.9529, "learning_rate": 1.039364672121692e-05, "epoch": 0.7130852340936374, "percentage": 71.31, "elapsed_time": "21:07:30", "remaining_time": "8:29:59", "throughput": 1599.61, "total_tokens": 121651200} -{"current_steps": 14860, "total_steps": 20825, "loss": 1.0087, "learning_rate": 1.0361513437750333e-05, "epoch": 0.7135654261704681, "percentage": 71.36, "elapsed_time": "21:08:24", "remaining_time": "8:29:09", "throughput": 1599.56, "total_tokens": 121733120} -{"current_steps": 14870, "total_steps": 20825, "loss": 0.8125, "learning_rate": 1.0329416913770651e-05, "epoch": 0.714045618247299, "percentage": 71.4, "elapsed_time": "21:09:18", "remaining_time": "8:28:19", "throughput": 1599.49, "total_tokens": 121815040} -{"current_steps": 14880, "total_steps": 20825, "loss": 0.8591, "learning_rate": 1.0297357229877183e-05, "epoch": 0.7145258103241297, "percentage": 71.45, "elapsed_time": "21:10:12", "remaining_time": "8:27:29", "throughput": 1599.44, "total_tokens": 121896960} -{"current_steps": 14890, "total_steps": 20825, "loss": 0.9232, "learning_rate": 1.0265334466576723e-05, "epoch": 0.7150060024009603, "percentage": 71.5, "elapsed_time": "21:10:58", "remaining_time": "8:26:35", "throughput": 1599.54, "total_tokens": 121978880} -{"current_steps": 14900, "total_steps": 20825, "loss": 0.7655, "learning_rate": 1.0233348704283332e-05, "epoch": 0.7154861944777912, "percentage": 71.55, "elapsed_time": "21:11:44", "remaining_time": "8:25:42", "throughput": 1599.65, "total_tokens": 122060800} -{"current_steps": 14910, "total_steps": 20825, "loss": 0.8836, "learning_rate": 1.0201400023318184e-05, "epoch": 0.7159663865546219, "percentage": 71.6, "elapsed_time": "21:12:30", "remaining_time": "8:24:49", "throughput": 1599.76, "total_tokens": 122142720} -{"current_steps": 14920, "total_steps": 20825, "loss": 0.9663, "learning_rate": 1.0169488503909313e-05, "epoch": 0.7164465786314526, "percentage": 71.64, "elapsed_time": "21:13:16", "remaining_time": "8:23:55", "throughput": 1599.88, "total_tokens": 122224640} -{"current_steps": 14930, "total_steps": 20825, "loss": 1.1426, "learning_rate": 1.0137614226191434e-05, "epoch": 0.7169267707082834, "percentage": 71.69, "elapsed_time": "21:14:01", "remaining_time": "8:23:02", "throughput": 1599.99, "total_tokens": 122306560} -{"current_steps": 14940, "total_steps": 20825, "loss": 1.0298, "learning_rate": 1.010577727020576e-05, "epoch": 0.7174069627851141, "percentage": 71.74, "elapsed_time": "21:14:47", "remaining_time": "8:22:09", "throughput": 1600.1, "total_tokens": 122388480} -{"current_steps": 14950, "total_steps": 20825, "loss": 1.0564, "learning_rate": 1.0073977715899785e-05, "epoch": 0.7178871548619448, "percentage": 71.79, "elapsed_time": "21:15:33", "remaining_time": "8:21:15", "throughput": 1600.22, "total_tokens": 122470400} -{"current_steps": 14960, "total_steps": 20825, "loss": 0.8569, "learning_rate": 1.0042215643127051e-05, "epoch": 0.7183673469387755, "percentage": 71.84, "elapsed_time": "21:16:18", "remaining_time": "8:20:22", "throughput": 1600.34, "total_tokens": 122552320} -{"current_steps": 14970, "total_steps": 20825, "loss": 0.9653, "learning_rate": 1.0010491131647013e-05, "epoch": 0.7188475390156063, "percentage": 71.88, "elapsed_time": "21:17:04", "remaining_time": "8:19:29", "throughput": 1600.46, "total_tokens": 122634240} -{"current_steps": 14980, "total_steps": 20825, "loss": 1.0368, "learning_rate": 9.978804261124792e-06, "epoch": 0.719327731092437, "percentage": 71.93, "elapsed_time": "21:17:50", "remaining_time": "8:18:35", "throughput": 1600.56, "total_tokens": 122716160} -{"current_steps": 14990, "total_steps": 20825, "loss": 0.8155, "learning_rate": 9.947155111130969e-06, "epoch": 0.7198079231692677, "percentage": 71.98, "elapsed_time": "21:18:36", "remaining_time": "8:17:42", "throughput": 1600.67, "total_tokens": 122798080} -{"current_steps": 15000, "total_steps": 20825, "loss": 0.9462, "learning_rate": 9.915543761141432e-06, "epoch": 0.7202881152460985, "percentage": 72.03, "elapsed_time": "21:19:22", "remaining_time": "8:16:49", "throughput": 1600.79, "total_tokens": 122880000} -{"current_steps": 15010, "total_steps": 20825, "loss": 0.7584, "learning_rate": 9.883970290537134e-06, "epoch": 0.7207683073229292, "percentage": 72.08, "elapsed_time": "21:20:11", "remaining_time": "8:15:57", "throughput": 1600.83, "total_tokens": 122961920} -{"current_steps": 15020, "total_steps": 20825, "loss": 0.9354, "learning_rate": 9.852434778603888e-06, "epoch": 0.7212484993997599, "percentage": 72.12, "elapsed_time": "21:20:57", "remaining_time": "8:15:04", "throughput": 1600.94, "total_tokens": 123043840} -{"current_steps": 15030, "total_steps": 20825, "loss": 0.8208, "learning_rate": 9.820937304532221e-06, "epoch": 0.7217286914765907, "percentage": 72.17, "elapsed_time": "21:21:43", "remaining_time": "8:14:10", "throughput": 1601.05, "total_tokens": 123125760} -{"current_steps": 15040, "total_steps": 20825, "loss": 1.0232, "learning_rate": 9.789477947417131e-06, "epoch": 0.7222088835534214, "percentage": 72.22, "elapsed_time": "21:22:29", "remaining_time": "8:13:17", "throughput": 1601.15, "total_tokens": 123207680} -{"current_steps": 15050, "total_steps": 20825, "loss": 0.8119, "learning_rate": 9.758056786257874e-06, "epoch": 0.7226890756302521, "percentage": 72.27, "elapsed_time": "21:23:15", "remaining_time": "8:12:24", "throughput": 1601.26, "total_tokens": 123289600} -{"current_steps": 15060, "total_steps": 20825, "loss": 0.9681, "learning_rate": 9.726673899957823e-06, "epoch": 0.7231692677070828, "percentage": 72.32, "elapsed_time": "21:24:01", "remaining_time": "8:11:31", "throughput": 1601.37, "total_tokens": 123371520} -{"current_steps": 15070, "total_steps": 20825, "loss": 0.831, "learning_rate": 9.695329367324226e-06, "epoch": 0.7236494597839136, "percentage": 72.36, "elapsed_time": "21:24:46", "remaining_time": "8:10:38", "throughput": 1601.49, "total_tokens": 123453440} -{"current_steps": 15080, "total_steps": 20825, "loss": 0.7507, "learning_rate": 9.664023267068007e-06, "epoch": 0.7241296518607443, "percentage": 72.41, "elapsed_time": "21:25:32", "remaining_time": "8:09:45", "throughput": 1601.6, "total_tokens": 123535360} -{"current_steps": 15090, "total_steps": 20825, "loss": 0.9068, "learning_rate": 9.632755677803595e-06, "epoch": 0.724609843937575, "percentage": 72.46, "elapsed_time": "21:26:18", "remaining_time": "8:08:51", "throughput": 1601.72, "total_tokens": 123617280} -{"current_steps": 15100, "total_steps": 20825, "loss": 0.9601, "learning_rate": 9.601526678048701e-06, "epoch": 0.7250900360144058, "percentage": 72.51, "elapsed_time": "21:27:03", "remaining_time": "8:07:58", "throughput": 1601.83, "total_tokens": 123699200} -{"current_steps": 15110, "total_steps": 20825, "loss": 0.8658, "learning_rate": 9.570336346224145e-06, "epoch": 0.7255702280912365, "percentage": 72.56, "elapsed_time": "21:27:49", "remaining_time": "8:07:05", "throughput": 1601.95, "total_tokens": 123781120} -{"current_steps": 15120, "total_steps": 20825, "loss": 0.9606, "learning_rate": 9.53918476065363e-06, "epoch": 0.7260504201680672, "percentage": 72.61, "elapsed_time": "21:28:34", "remaining_time": "8:06:12", "throughput": 1602.06, "total_tokens": 123863040} -{"current_steps": 15130, "total_steps": 20825, "loss": 0.8749, "learning_rate": 9.508071999563578e-06, "epoch": 0.726530612244898, "percentage": 72.65, "elapsed_time": "21:29:20", "remaining_time": "8:05:18", "throughput": 1602.17, "total_tokens": 123944960} -{"current_steps": 15140, "total_steps": 20825, "loss": 0.8534, "learning_rate": 9.476998141082896e-06, "epoch": 0.7270108043217287, "percentage": 72.7, "elapsed_time": "21:30:06", "remaining_time": "8:04:25", "throughput": 1602.27, "total_tokens": 124026880} -{"current_steps": 15150, "total_steps": 20825, "loss": 0.8115, "learning_rate": 9.445963263242822e-06, "epoch": 0.7274909963985594, "percentage": 72.75, "elapsed_time": "21:30:52", "remaining_time": "8:03:32", "throughput": 1602.38, "total_tokens": 124108800} -{"current_steps": 15160, "total_steps": 20825, "loss": 0.8173, "learning_rate": 9.414967443976705e-06, "epoch": 0.7279711884753901, "percentage": 72.8, "elapsed_time": "21:31:45", "remaining_time": "8:02:42", "throughput": 1602.36, "total_tokens": 124190720} -{"current_steps": 15170, "total_steps": 20825, "loss": 0.7552, "learning_rate": 9.384010761119787e-06, "epoch": 0.7284513805522209, "percentage": 72.85, "elapsed_time": "21:32:36", "remaining_time": "8:01:51", "throughput": 1602.34, "total_tokens": 124272640} -{"current_steps": 15180, "total_steps": 20825, "loss": 1.0986, "learning_rate": 9.353093292409063e-06, "epoch": 0.7289315726290516, "percentage": 72.89, "elapsed_time": "21:33:28", "remaining_time": "8:01:00", "throughput": 1602.33, "total_tokens": 124354560} -{"current_steps": 15190, "total_steps": 20825, "loss": 0.9024, "learning_rate": 9.322215115483049e-06, "epoch": 0.7294117647058823, "percentage": 72.94, "elapsed_time": "21:34:20", "remaining_time": "8:00:09", "throughput": 1602.32, "total_tokens": 124436480} -{"current_steps": 15200, "total_steps": 20825, "loss": 0.7029, "learning_rate": 9.291376307881577e-06, "epoch": 0.7298919567827131, "percentage": 72.99, "elapsed_time": "21:35:11", "remaining_time": "7:59:18", "throughput": 1602.31, "total_tokens": 124518400} -{"current_steps": 15210, "total_steps": 20825, "loss": 0.7564, "learning_rate": 9.260576947045624e-06, "epoch": 0.7303721488595438, "percentage": 73.04, "elapsed_time": "21:36:03", "remaining_time": "7:58:27", "throughput": 1602.3, "total_tokens": 124600320} -{"current_steps": 15220, "total_steps": 20825, "loss": 0.8904, "learning_rate": 9.229817110317126e-06, "epoch": 0.7308523409363745, "percentage": 73.09, "elapsed_time": "21:36:55", "remaining_time": "7:57:36", "throughput": 1602.28, "total_tokens": 124682240} -{"current_steps": 15230, "total_steps": 20825, "loss": 0.8753, "learning_rate": 9.19909687493874e-06, "epoch": 0.7313325330132053, "percentage": 73.13, "elapsed_time": "21:37:46", "remaining_time": "7:56:45", "throughput": 1602.28, "total_tokens": 124764160} -{"current_steps": 15240, "total_steps": 20825, "loss": 0.7468, "learning_rate": 9.168416318053701e-06, "epoch": 0.731812725090036, "percentage": 73.18, "elapsed_time": "21:38:38", "remaining_time": "7:55:54", "throughput": 1602.26, "total_tokens": 124846080} -{"current_steps": 15250, "total_steps": 20825, "loss": 0.7828, "learning_rate": 9.137775516705604e-06, "epoch": 0.7322929171668667, "percentage": 73.23, "elapsed_time": "21:39:29", "remaining_time": "7:55:03", "throughput": 1602.26, "total_tokens": 124928000} -{"current_steps": 15260, "total_steps": 20825, "loss": 0.978, "learning_rate": 9.107174547838188e-06, "epoch": 0.7327731092436974, "percentage": 73.28, "elapsed_time": "21:40:21", "remaining_time": "7:54:12", "throughput": 1602.25, "total_tokens": 125009920} -{"current_steps": 15270, "total_steps": 20825, "loss": 0.9886, "learning_rate": 9.076613488295193e-06, "epoch": 0.7332533013205282, "percentage": 73.33, "elapsed_time": "21:41:13", "remaining_time": "7:53:21", "throughput": 1602.24, "total_tokens": 125091840} -{"current_steps": 15280, "total_steps": 20825, "loss": 0.9165, "learning_rate": 9.04609241482014e-06, "epoch": 0.7337334933973589, "percentage": 73.37, "elapsed_time": "21:42:04", "remaining_time": "7:52:30", "throughput": 1602.23, "total_tokens": 125173760} -{"current_steps": 15290, "total_steps": 20825, "loss": 0.9454, "learning_rate": 9.015611404056121e-06, "epoch": 0.7342136854741896, "percentage": 73.42, "elapsed_time": "21:42:56", "remaining_time": "7:51:39", "throughput": 1602.22, "total_tokens": 125255680} -{"current_steps": 15300, "total_steps": 20825, "loss": 0.9743, "learning_rate": 8.985170532545622e-06, "epoch": 0.7346938775510204, "percentage": 73.47, "elapsed_time": "21:43:47", "remaining_time": "7:50:48", "throughput": 1602.22, "total_tokens": 125337600} -{"current_steps": 15310, "total_steps": 20825, "loss": 1.0288, "learning_rate": 8.954769876730368e-06, "epoch": 0.7351740696278511, "percentage": 73.52, "elapsed_time": "21:44:39", "remaining_time": "7:49:57", "throughput": 1602.21, "total_tokens": 125419520} -{"current_steps": 15320, "total_steps": 20825, "loss": 0.8448, "learning_rate": 8.924409512951045e-06, "epoch": 0.7356542617046818, "percentage": 73.57, "elapsed_time": "21:45:30", "remaining_time": "7:49:06", "throughput": 1602.2, "total_tokens": 125501440} -{"current_steps": 15330, "total_steps": 20825, "loss": 1.0112, "learning_rate": 8.894089517447206e-06, "epoch": 0.7361344537815127, "percentage": 73.61, "elapsed_time": "21:46:22", "remaining_time": "7:48:16", "throughput": 1602.19, "total_tokens": 125583360} -{"current_steps": 15340, "total_steps": 20825, "loss": 0.9288, "learning_rate": 8.863809966357017e-06, "epoch": 0.7366146458583434, "percentage": 73.66, "elapsed_time": "21:47:14", "remaining_time": "7:47:25", "throughput": 1602.17, "total_tokens": 125665280} -{"current_steps": 15350, "total_steps": 20825, "loss": 0.8124, "learning_rate": 8.833570935717064e-06, "epoch": 0.737094837935174, "percentage": 73.71, "elapsed_time": "21:48:06", "remaining_time": "7:46:34", "throughput": 1602.15, "total_tokens": 125747200} -{"current_steps": 15360, "total_steps": 20825, "loss": 0.8461, "learning_rate": 8.803372501462203e-06, "epoch": 0.7375750300120048, "percentage": 73.76, "elapsed_time": "21:48:58", "remaining_time": "7:45:43", "throughput": 1602.13, "total_tokens": 125829120} -{"current_steps": 15370, "total_steps": 20825, "loss": 0.7163, "learning_rate": 8.773214739425346e-06, "epoch": 0.7380552220888356, "percentage": 73.81, "elapsed_time": "21:49:49", "remaining_time": "7:44:52", "throughput": 1602.13, "total_tokens": 125911040} -{"current_steps": 15380, "total_steps": 20825, "loss": 0.5987, "learning_rate": 8.743097725337255e-06, "epoch": 0.7385354141656663, "percentage": 73.85, "elapsed_time": "21:50:44", "remaining_time": "7:44:02", "throughput": 1602.07, "total_tokens": 125992960} -{"current_steps": 15390, "total_steps": 20825, "loss": 0.8509, "learning_rate": 8.713021534826366e-06, "epoch": 0.739015606242497, "percentage": 73.9, "elapsed_time": "21:51:36", "remaining_time": "7:43:11", "throughput": 1602.04, "total_tokens": 126074880} -{"current_steps": 15400, "total_steps": 20825, "loss": 1.0267, "learning_rate": 8.68298624341862e-06, "epoch": 0.7394957983193278, "percentage": 73.95, "elapsed_time": "21:52:29", "remaining_time": "7:42:21", "throughput": 1602.01, "total_tokens": 126156800} -{"current_steps": 15410, "total_steps": 20825, "loss": 0.913, "learning_rate": 8.652991926537254e-06, "epoch": 0.7399759903961585, "percentage": 74.0, "elapsed_time": "21:53:23", "remaining_time": "7:41:31", "throughput": 1601.95, "total_tokens": 126238720} -{"current_steps": 15420, "total_steps": 20825, "loss": 0.9146, "learning_rate": 8.623038659502583e-06, "epoch": 0.7404561824729892, "percentage": 74.05, "elapsed_time": "21:54:16", "remaining_time": "7:40:40", "throughput": 1601.91, "total_tokens": 126320640} -{"current_steps": 15430, "total_steps": 20825, "loss": 0.7079, "learning_rate": 8.59312651753187e-06, "epoch": 0.74093637454982, "percentage": 74.09, "elapsed_time": "21:55:11", "remaining_time": "7:39:51", "throughput": 1601.82, "total_tokens": 126402560} -{"current_steps": 15440, "total_steps": 20825, "loss": 0.9282, "learning_rate": 8.5632555757391e-06, "epoch": 0.7414165666266507, "percentage": 74.14, "elapsed_time": "21:56:05", "remaining_time": "7:39:00", "throughput": 1601.76, "total_tokens": 126484480} -{"current_steps": 15450, "total_steps": 20825, "loss": 0.8451, "learning_rate": 8.53342590913478e-06, "epoch": 0.7418967587034814, "percentage": 74.19, "elapsed_time": "21:56:56", "remaining_time": "7:38:09", "throughput": 1601.77, "total_tokens": 126566400} -{"current_steps": 15460, "total_steps": 20825, "loss": 0.8644, "learning_rate": 8.503637592625796e-06, "epoch": 0.7423769507803121, "percentage": 74.24, "elapsed_time": "21:57:52", "remaining_time": "7:37:20", "throughput": 1601.67, "total_tokens": 126648320} -{"current_steps": 15470, "total_steps": 20825, "loss": 0.9529, "learning_rate": 8.473890701015177e-06, "epoch": 0.7428571428571429, "percentage": 74.29, "elapsed_time": "21:58:43", "remaining_time": "7:36:28", "throughput": 1601.69, "total_tokens": 126730240} -{"current_steps": 15480, "total_steps": 20825, "loss": 1.0753, "learning_rate": 8.444185309001926e-06, "epoch": 0.7433373349339736, "percentage": 74.33, "elapsed_time": "21:59:34", "remaining_time": "7:35:37", "throughput": 1601.68, "total_tokens": 126812160} -{"current_steps": 15490, "total_steps": 20825, "loss": 0.8009, "learning_rate": 8.41452149118085e-06, "epoch": 0.7438175270108043, "percentage": 74.38, "elapsed_time": "22:00:26", "remaining_time": "7:34:46", "throughput": 1601.66, "total_tokens": 126894080} -{"current_steps": 15500, "total_steps": 20825, "loss": 0.8622, "learning_rate": 8.384899322042356e-06, "epoch": 0.7442977190876351, "percentage": 74.43, "elapsed_time": "22:01:18", "remaining_time": "7:33:55", "throughput": 1601.65, "total_tokens": 126976000} -{"current_steps": 15510, "total_steps": 20825, "loss": 0.8215, "learning_rate": 8.355318875972243e-06, "epoch": 0.7447779111644658, "percentage": 74.48, "elapsed_time": "22:02:12", "remaining_time": "7:33:05", "throughput": 1601.59, "total_tokens": 127057920} -{"current_steps": 15520, "total_steps": 20825, "loss": 0.7382, "learning_rate": 8.325780227251562e-06, "epoch": 0.7452581032412965, "percentage": 74.53, "elapsed_time": "22:03:03", "remaining_time": "7:32:14", "throughput": 1601.58, "total_tokens": 127139840} -{"current_steps": 15530, "total_steps": 20825, "loss": 0.9809, "learning_rate": 8.2962834500564e-06, "epoch": 0.7457382953181273, "percentage": 74.57, "elapsed_time": "22:03:56", "remaining_time": "7:31:24", "throughput": 1601.56, "total_tokens": 127221760} -{"current_steps": 15540, "total_steps": 20825, "loss": 0.9193, "learning_rate": 8.266828618457678e-06, "epoch": 0.746218487394958, "percentage": 74.62, "elapsed_time": "22:04:47", "remaining_time": "7:30:32", "throughput": 1601.56, "total_tokens": 127303680} -{"current_steps": 15550, "total_steps": 20825, "loss": 1.1018, "learning_rate": 8.237415806421015e-06, "epoch": 0.7466986794717887, "percentage": 74.67, "elapsed_time": "22:05:37", "remaining_time": "7:29:41", "throughput": 1601.58, "total_tokens": 127385600} -{"current_steps": 15560, "total_steps": 20825, "loss": 0.7888, "learning_rate": 8.20804508780648e-06, "epoch": 0.7471788715486194, "percentage": 74.72, "elapsed_time": "22:06:28", "remaining_time": "7:28:50", "throughput": 1601.58, "total_tokens": 127467520} -{"current_steps": 15570, "total_steps": 20825, "loss": 1.0093, "learning_rate": 8.178716536368475e-06, "epoch": 0.7476590636254502, "percentage": 74.77, "elapsed_time": "22:07:19", "remaining_time": "7:27:59", "throughput": 1601.58, "total_tokens": 127549440} -{"current_steps": 15580, "total_steps": 20825, "loss": 0.9785, "learning_rate": 8.149430225755476e-06, "epoch": 0.7481392557022809, "percentage": 74.81, "elapsed_time": "22:08:10", "remaining_time": "7:27:07", "throughput": 1601.58, "total_tokens": 127631360} -{"current_steps": 15590, "total_steps": 20825, "loss": 0.8937, "learning_rate": 8.120186229509922e-06, "epoch": 0.7486194477791116, "percentage": 74.86, "elapsed_time": "22:09:00", "remaining_time": "7:26:16", "throughput": 1601.61, "total_tokens": 127713280} -{"current_steps": 15600, "total_steps": 20825, "loss": 1.0423, "learning_rate": 8.090984621067963e-06, "epoch": 0.7490996398559424, "percentage": 74.91, "elapsed_time": "22:09:52", "remaining_time": "7:25:25", "throughput": 1601.6, "total_tokens": 127795200} -{"current_steps": 15610, "total_steps": 20825, "loss": 0.8387, "learning_rate": 8.061825473759324e-06, "epoch": 0.7495798319327731, "percentage": 74.96, "elapsed_time": "22:10:44", "remaining_time": "7:24:34", "throughput": 1601.57, "total_tokens": 127877120} -{"current_steps": 15620, "total_steps": 20825, "loss": 0.8558, "learning_rate": 8.032708860807111e-06, "epoch": 0.7500600240096038, "percentage": 75.01, "elapsed_time": "22:11:38", "remaining_time": "7:23:44", "throughput": 1601.53, "total_tokens": 127959040} -{"current_steps": 15630, "total_steps": 20825, "loss": 0.7608, "learning_rate": 8.003634855327594e-06, "epoch": 0.7505402160864346, "percentage": 75.05, "elapsed_time": "22:12:27", "remaining_time": "7:22:52", "throughput": 1601.56, "total_tokens": 128040960} -{"current_steps": 15640, "total_steps": 20825, "loss": 0.7416, "learning_rate": 7.974603530330069e-06, "epoch": 0.7510204081632653, "percentage": 75.1, "elapsed_time": "22:14:00", "remaining_time": "7:22:15", "throughput": 1600.73, "total_tokens": 128122880} -{"current_steps": 15650, "total_steps": 20825, "loss": 0.7773, "learning_rate": 7.945614958716658e-06, "epoch": 0.751500600240096, "percentage": 75.15, "elapsed_time": "22:15:10", "remaining_time": "7:21:30", "throughput": 1600.35, "total_tokens": 128204800} -{"current_steps": 15660, "total_steps": 20825, "loss": 0.8304, "learning_rate": 7.916669213282107e-06, "epoch": 0.7519807923169267, "percentage": 75.2, "elapsed_time": "22:15:59", "remaining_time": "7:20:38", "throughput": 1600.4, "total_tokens": 128286720} -{"current_steps": 15670, "total_steps": 20825, "loss": 1.1004, "learning_rate": 7.88776636671362e-06, "epoch": 0.7524609843937575, "percentage": 75.25, "elapsed_time": "22:16:47", "remaining_time": "7:19:46", "throughput": 1600.45, "total_tokens": 128368640} -{"current_steps": 15680, "total_steps": 20825, "loss": 0.9029, "learning_rate": 7.858906491590697e-06, "epoch": 0.7529411764705882, "percentage": 75.29, "elapsed_time": "22:17:35", "remaining_time": "7:18:53", "throughput": 1600.53, "total_tokens": 128450560} -{"current_steps": 15690, "total_steps": 20825, "loss": 0.8456, "learning_rate": 7.830089660384895e-06, "epoch": 0.7534213685474189, "percentage": 75.34, "elapsed_time": "22:18:23", "remaining_time": "7:18:01", "throughput": 1600.59, "total_tokens": 128532480} -{"current_steps": 15700, "total_steps": 20825, "loss": 1.3139, "learning_rate": 7.801315945459714e-06, "epoch": 0.7539015606242497, "percentage": 75.39, "elapsed_time": "22:19:14", "remaining_time": "7:17:10", "throughput": 1600.58, "total_tokens": 128614400} -{"current_steps": 15710, "total_steps": 20825, "loss": 0.931, "learning_rate": 7.772585419070374e-06, "epoch": 0.7543817527010804, "percentage": 75.44, "elapsed_time": "22:20:04", "remaining_time": "7:16:18", "throughput": 1600.61, "total_tokens": 128696320} -{"current_steps": 15720, "total_steps": 20825, "loss": 0.7754, "learning_rate": 7.743898153363625e-06, "epoch": 0.7548619447779111, "percentage": 75.49, "elapsed_time": "22:20:54", "remaining_time": "7:15:27", "throughput": 1600.63, "total_tokens": 128778240} -{"current_steps": 15730, "total_steps": 20825, "loss": 0.8358, "learning_rate": 7.715254220377596e-06, "epoch": 0.7553421368547419, "percentage": 75.53, "elapsed_time": "22:21:44", "remaining_time": "7:14:35", "throughput": 1600.65, "total_tokens": 128860160} -{"current_steps": 15740, "total_steps": 20825, "loss": 0.7976, "learning_rate": 7.686653692041615e-06, "epoch": 0.7558223289315726, "percentage": 75.58, "elapsed_time": "22:22:34", "remaining_time": "7:13:44", "throughput": 1600.68, "total_tokens": 128942080} -{"current_steps": 15750, "total_steps": 20825, "loss": 0.834, "learning_rate": 7.658096640175988e-06, "epoch": 0.7563025210084033, "percentage": 75.63, "elapsed_time": "22:23:24", "remaining_time": "7:12:52", "throughput": 1600.71, "total_tokens": 129024000} -{"current_steps": 15760, "total_steps": 20825, "loss": 0.78, "learning_rate": 7.629583136491844e-06, "epoch": 0.7567827130852341, "percentage": 75.68, "elapsed_time": "22:24:13", "remaining_time": "7:12:00", "throughput": 1600.74, "total_tokens": 129105920} -{"current_steps": 15770, "total_steps": 20825, "loss": 0.855, "learning_rate": 7.601113252590991e-06, "epoch": 0.7572629051620648, "percentage": 75.73, "elapsed_time": "22:25:05", "remaining_time": "7:11:09", "throughput": 1600.74, "total_tokens": 129187840} -{"current_steps": 15780, "total_steps": 20825, "loss": 1.0542, "learning_rate": 7.572687059965661e-06, "epoch": 0.7577430972388955, "percentage": 75.77, "elapsed_time": "22:25:55", "remaining_time": "7:10:18", "throughput": 1600.76, "total_tokens": 129269760} -{"current_steps": 15790, "total_steps": 20825, "loss": 0.9999, "learning_rate": 7.544304629998389e-06, "epoch": 0.7582232893157262, "percentage": 75.82, "elapsed_time": "22:26:45", "remaining_time": "7:09:26", "throughput": 1600.78, "total_tokens": 129351680} -{"current_steps": 15800, "total_steps": 20825, "loss": 0.8808, "learning_rate": 7.51596603396183e-06, "epoch": 0.758703481392557, "percentage": 75.87, "elapsed_time": "22:27:34", "remaining_time": "7:08:34", "throughput": 1600.81, "total_tokens": 129433600} -{"current_steps": 15810, "total_steps": 20825, "loss": 0.9648, "learning_rate": 7.4876713430185265e-06, "epoch": 0.7591836734693878, "percentage": 75.92, "elapsed_time": "22:28:24", "remaining_time": "7:07:43", "throughput": 1600.85, "total_tokens": 129515520} -{"current_steps": 15820, "total_steps": 20825, "loss": 0.9263, "learning_rate": 7.4594206282208e-06, "epoch": 0.7596638655462185, "percentage": 75.97, "elapsed_time": "22:29:13", "remaining_time": "7:06:51", "throughput": 1600.89, "total_tokens": 129597440} -{"current_steps": 15830, "total_steps": 20825, "loss": 0.8364, "learning_rate": 7.431213960510544e-06, "epoch": 0.7601440576230493, "percentage": 76.01, "elapsed_time": "22:30:02", "remaining_time": "7:05:59", "throughput": 1600.92, "total_tokens": 129679360} -{"current_steps": 15840, "total_steps": 20825, "loss": 1.068, "learning_rate": 7.40305141071902e-06, "epoch": 0.76062424969988, "percentage": 76.06, "elapsed_time": "22:30:52", "remaining_time": "7:05:07", "throughput": 1600.96, "total_tokens": 129761280} -{"current_steps": 15850, "total_steps": 20825, "loss": 0.7245, "learning_rate": 7.374933049566704e-06, "epoch": 0.7611044417767107, "percentage": 76.11, "elapsed_time": "22:31:41", "remaining_time": "7:04:16", "throughput": 1600.99, "total_tokens": 129843200} -{"current_steps": 15860, "total_steps": 20825, "loss": 0.8833, "learning_rate": 7.346858947663138e-06, "epoch": 0.7615846338535415, "percentage": 76.16, "elapsed_time": "22:32:31", "remaining_time": "7:03:24", "throughput": 1601.03, "total_tokens": 129925120} -{"current_steps": 15870, "total_steps": 20825, "loss": 1.0079, "learning_rate": 7.318829175506684e-06, "epoch": 0.7620648259303722, "percentage": 76.21, "elapsed_time": "22:33:20", "remaining_time": "7:02:32", "throughput": 1601.06, "total_tokens": 130007040} -{"current_steps": 15880, "total_steps": 20825, "loss": 0.9743, "learning_rate": 7.290843803484409e-06, "epoch": 0.7625450180072029, "percentage": 76.25, "elapsed_time": "22:34:10", "remaining_time": "7:01:41", "throughput": 1601.09, "total_tokens": 130088960} -{"current_steps": 15890, "total_steps": 20825, "loss": 0.923, "learning_rate": 7.262902901871885e-06, "epoch": 0.7630252100840336, "percentage": 76.3, "elapsed_time": "22:34:59", "remaining_time": "7:00:49", "throughput": 1601.13, "total_tokens": 130170880} -{"current_steps": 15900, "total_steps": 20825, "loss": 0.947, "learning_rate": 7.235006540832995e-06, "epoch": 0.7635054021608644, "percentage": 76.35, "elapsed_time": "22:35:48", "remaining_time": "6:59:57", "throughput": 1601.16, "total_tokens": 130252800} -{"current_steps": 15910, "total_steps": 20825, "loss": 0.8526, "learning_rate": 7.207154790419784e-06, "epoch": 0.7639855942376951, "percentage": 76.4, "elapsed_time": "22:36:38", "remaining_time": "6:59:06", "throughput": 1601.19, "total_tokens": 130334720} -{"current_steps": 15920, "total_steps": 20825, "loss": 1.0454, "learning_rate": 7.179347720572288e-06, "epoch": 0.7644657863145258, "percentage": 76.45, "elapsed_time": "22:37:30", "remaining_time": "6:58:15", "throughput": 1601.18, "total_tokens": 130416640} -{"current_steps": 15930, "total_steps": 20825, "loss": 0.7704, "learning_rate": 7.151585401118316e-06, "epoch": 0.7649459783913566, "percentage": 76.49, "elapsed_time": "22:38:24", "remaining_time": "6:57:24", "throughput": 1601.12, "total_tokens": 130498560} -{"current_steps": 15940, "total_steps": 20825, "loss": 0.8247, "learning_rate": 7.12386790177331e-06, "epoch": 0.7654261704681873, "percentage": 76.54, "elapsed_time": "22:39:22", "remaining_time": "6:56:35", "throughput": 1600.98, "total_tokens": 130580480} -{"current_steps": 15950, "total_steps": 20825, "loss": 0.8725, "learning_rate": 7.096195292140173e-06, "epoch": 0.765906362545018, "percentage": 76.59, "elapsed_time": "22:40:18", "remaining_time": "6:55:46", "throughput": 1600.89, "total_tokens": 130662400} -{"current_steps": 15960, "total_steps": 20825, "loss": 0.7432, "learning_rate": 7.06856764170907e-06, "epoch": 0.7663865546218488, "percentage": 76.64, "elapsed_time": "22:41:12", "remaining_time": "6:54:55", "throughput": 1600.83, "total_tokens": 130744320} -{"current_steps": 15970, "total_steps": 20825, "loss": 0.959, "learning_rate": 7.040985019857274e-06, "epoch": 0.7668667466986795, "percentage": 76.69, "elapsed_time": "22:42:07", "remaining_time": "6:54:05", "throughput": 1600.75, "total_tokens": 130826240} -{"current_steps": 15980, "total_steps": 20825, "loss": 1.1146, "learning_rate": 7.013447495848996e-06, "epoch": 0.7673469387755102, "percentage": 76.73, "elapsed_time": "22:43:02", "remaining_time": "6:53:15", "throughput": 1600.68, "total_tokens": 130908160} -{"current_steps": 15990, "total_steps": 20825, "loss": 0.9096, "learning_rate": 6.985955138835162e-06, "epoch": 0.7678271308523409, "percentage": 76.78, "elapsed_time": "22:43:57", "remaining_time": "6:52:25", "throughput": 1600.61, "total_tokens": 130990080} -{"current_steps": 16000, "total_steps": 20825, "loss": 0.9424, "learning_rate": 6.958508017853319e-06, "epoch": 0.7683073229291717, "percentage": 76.83, "elapsed_time": "22:44:53", "remaining_time": "6:51:36", "throughput": 1600.51, "total_tokens": 131072000} -{"current_steps": 16010, "total_steps": 20825, "loss": 0.905, "learning_rate": 6.931106201827397e-06, "epoch": 0.7687875150060024, "percentage": 76.88, "elapsed_time": "22:45:53", "remaining_time": "6:50:47", "throughput": 1600.34, "total_tokens": 131153920} -{"current_steps": 16020, "total_steps": 20825, "loss": 0.8972, "learning_rate": 6.903749759567557e-06, "epoch": 0.7692677070828331, "percentage": 76.93, "elapsed_time": "22:46:48", "remaining_time": "6:49:57", "throughput": 1600.27, "total_tokens": 131235840} -{"current_steps": 16030, "total_steps": 20825, "loss": 0.8672, "learning_rate": 6.876438759770037e-06, "epoch": 0.7697478991596639, "percentage": 76.97, "elapsed_time": "22:47:43", "remaining_time": "6:49:07", "throughput": 1600.2, "total_tokens": 131317760} -{"current_steps": 16040, "total_steps": 20825, "loss": 1.0239, "learning_rate": 6.8491732710169344e-06, "epoch": 0.7702280912364946, "percentage": 77.02, "elapsed_time": "22:48:38", "remaining_time": "6:48:17", "throughput": 1600.12, "total_tokens": 131399680} -{"current_steps": 16050, "total_steps": 20825, "loss": 0.7971, "learning_rate": 6.821953361776093e-06, "epoch": 0.7707082833133253, "percentage": 77.07, "elapsed_time": "22:49:34", "remaining_time": "6:47:27", "throughput": 1600.04, "total_tokens": 131481600} -{"current_steps": 16060, "total_steps": 20825, "loss": 0.8697, "learning_rate": 6.7947791004008665e-06, "epoch": 0.7711884753901561, "percentage": 77.12, "elapsed_time": "22:50:30", "remaining_time": "6:46:37", "throughput": 1599.93, "total_tokens": 131563520} -{"current_steps": 16070, "total_steps": 20825, "loss": 0.8022, "learning_rate": 6.767650555130009e-06, "epoch": 0.7716686674669868, "percentage": 77.17, "elapsed_time": "22:51:26", "remaining_time": "6:45:48", "throughput": 1599.84, "total_tokens": 131645440} -{"current_steps": 16080, "total_steps": 20825, "loss": 0.9051, "learning_rate": 6.740567794087463e-06, "epoch": 0.7721488595438175, "percentage": 77.21, "elapsed_time": "22:52:21", "remaining_time": "6:44:58", "throughput": 1599.76, "total_tokens": 131727360} -{"current_steps": 16090, "total_steps": 20825, "loss": 1.1109, "learning_rate": 6.713530885282188e-06, "epoch": 0.7726290516206482, "percentage": 77.26, "elapsed_time": "22:53:17", "remaining_time": "6:44:08", "throughput": 1599.68, "total_tokens": 131809280} -{"current_steps": 16100, "total_steps": 20825, "loss": 0.781, "learning_rate": 6.686539896608016e-06, "epoch": 0.773109243697479, "percentage": 77.31, "elapsed_time": "22:54:13", "remaining_time": "6:43:18", "throughput": 1599.59, "total_tokens": 131891200} -{"current_steps": 16110, "total_steps": 20825, "loss": 0.7884, "learning_rate": 6.659594895843477e-06, "epoch": 0.7735894357743097, "percentage": 77.36, "elapsed_time": "22:55:07", "remaining_time": "6:42:27", "throughput": 1599.53, "total_tokens": 131973120} -{"current_steps": 16120, "total_steps": 20825, "loss": 0.8852, "learning_rate": 6.632695950651594e-06, "epoch": 0.7740696278511404, "percentage": 77.41, "elapsed_time": "22:56:01", "remaining_time": "6:41:37", "throughput": 1599.47, "total_tokens": 132055040} -{"current_steps": 16130, "total_steps": 20825, "loss": 0.9598, "learning_rate": 6.605843128579739e-06, "epoch": 0.7745498199279712, "percentage": 77.45, "elapsed_time": "22:56:57", "remaining_time": "6:40:47", "throughput": 1599.39, "total_tokens": 132136960} -{"current_steps": 16140, "total_steps": 20825, "loss": 0.8386, "learning_rate": 6.579036497059482e-06, "epoch": 0.7750300120048019, "percentage": 77.5, "elapsed_time": "22:57:52", "remaining_time": "6:39:57", "throughput": 1599.3, "total_tokens": 132218880} -{"current_steps": 16150, "total_steps": 20825, "loss": 0.8359, "learning_rate": 6.552276123406384e-06, "epoch": 0.7755102040816326, "percentage": 77.55, "elapsed_time": "22:58:47", "remaining_time": "6:39:07", "throughput": 1599.23, "total_tokens": 132300800} -{"current_steps": 16160, "total_steps": 20825, "loss": 1.043, "learning_rate": 6.525562074819852e-06, "epoch": 0.7759903961584634, "percentage": 77.6, "elapsed_time": "22:59:41", "remaining_time": "6:38:17", "throughput": 1599.17, "total_tokens": 132382720} -{"current_steps": 16170, "total_steps": 20825, "loss": 0.9455, "learning_rate": 6.4988944183829695e-06, "epoch": 0.7764705882352941, "percentage": 77.65, "elapsed_time": "23:00:36", "remaining_time": "6:37:26", "throughput": 1599.11, "total_tokens": 132464640} -{"current_steps": 16180, "total_steps": 20825, "loss": 1.1211, "learning_rate": 6.472273221062305e-06, "epoch": 0.7769507803121248, "percentage": 77.7, "elapsed_time": "23:01:34", "remaining_time": "6:36:37", "throughput": 1598.97, "total_tokens": 132546560} -{"current_steps": 16190, "total_steps": 20825, "loss": 1.0617, "learning_rate": 6.445698549707776e-06, "epoch": 0.7774309723889555, "percentage": 77.74, "elapsed_time": "23:02:29", "remaining_time": "6:35:47", "throughput": 1598.9, "total_tokens": 132628480} -{"current_steps": 16200, "total_steps": 20825, "loss": 0.7963, "learning_rate": 6.419170471052472e-06, "epoch": 0.7779111644657863, "percentage": 77.79, "elapsed_time": "23:03:25", "remaining_time": "6:34:57", "throughput": 1598.81, "total_tokens": 132710400} -{"current_steps": 16210, "total_steps": 20825, "loss": 0.9802, "learning_rate": 6.392689051712458e-06, "epoch": 0.778391356542617, "percentage": 77.84, "elapsed_time": "23:04:20", "remaining_time": "6:34:07", "throughput": 1598.75, "total_tokens": 132792320} -{"current_steps": 16220, "total_steps": 20825, "loss": 1.0569, "learning_rate": 6.3662543581866405e-06, "epoch": 0.7788715486194477, "percentage": 77.89, "elapsed_time": "23:05:17", "remaining_time": "6:33:17", "throughput": 1598.64, "total_tokens": 132874240} -{"current_steps": 16230, "total_steps": 20825, "loss": 0.7891, "learning_rate": 6.339866456856608e-06, "epoch": 0.7793517406962785, "percentage": 77.94, "elapsed_time": "23:06:12", "remaining_time": "6:32:27", "throughput": 1598.56, "total_tokens": 132956160} -{"current_steps": 16240, "total_steps": 20825, "loss": 0.9846, "learning_rate": 6.313525413986415e-06, "epoch": 0.7798319327731092, "percentage": 77.98, "elapsed_time": "23:07:19", "remaining_time": "6:31:40", "throughput": 1598.26, "total_tokens": 133038080} -{"current_steps": 16250, "total_steps": 20825, "loss": 0.8808, "learning_rate": 6.28723129572247e-06, "epoch": 0.78031212484994, "percentage": 78.03, "elapsed_time": "23:08:24", "remaining_time": "6:30:53", "throughput": 1597.99, "total_tokens": 133120000} -{"current_steps": 16260, "total_steps": 20825, "loss": 0.8577, "learning_rate": 6.260984168093353e-06, "epoch": 0.7807923169267708, "percentage": 78.08, "elapsed_time": "23:09:34", "remaining_time": "6:30:07", "throughput": 1597.64, "total_tokens": 133201920} -{"current_steps": 16270, "total_steps": 20825, "loss": 0.9177, "learning_rate": 6.234784097009608e-06, "epoch": 0.7812725090036015, "percentage": 78.13, "elapsed_time": "23:10:41", "remaining_time": "6:29:20", "throughput": 1597.34, "total_tokens": 133283840} -{"current_steps": 16280, "total_steps": 20825, "loss": 0.8475, "learning_rate": 6.208631148263649e-06, "epoch": 0.7817527010804322, "percentage": 78.18, "elapsed_time": "23:11:46", "remaining_time": "6:28:33", "throughput": 1597.07, "total_tokens": 133365760} -{"current_steps": 16290, "total_steps": 20825, "loss": 0.6443, "learning_rate": 6.18252538752955e-06, "epoch": 0.7822328931572629, "percentage": 78.22, "elapsed_time": "23:12:47", "remaining_time": "6:27:44", "throughput": 1596.89, "total_tokens": 133447680} -{"current_steps": 16300, "total_steps": 20825, "loss": 0.7558, "learning_rate": 6.156466880362877e-06, "epoch": 0.7827130852340937, "percentage": 78.27, "elapsed_time": "23:13:53", "remaining_time": "6:26:57", "throughput": 1596.6, "total_tokens": 133529600} -{"current_steps": 16310, "total_steps": 20825, "loss": 0.8476, "learning_rate": 6.1304556922005315e-06, "epoch": 0.7831932773109244, "percentage": 78.32, "elapsed_time": "23:14:56", "remaining_time": "6:26:09", "throughput": 1596.39, "total_tokens": 133611520} -{"current_steps": 16320, "total_steps": 20825, "loss": 0.8751, "learning_rate": 6.1044918883606225e-06, "epoch": 0.7836734693877551, "percentage": 78.37, "elapsed_time": "23:15:49", "remaining_time": "6:25:18", "throughput": 1596.35, "total_tokens": 133693440} -{"current_steps": 16330, "total_steps": 20825, "loss": 0.9734, "learning_rate": 6.078575534042222e-06, "epoch": 0.7841536614645859, "percentage": 78.42, "elapsed_time": "23:16:43", "remaining_time": "6:24:27", "throughput": 1596.3, "total_tokens": 133775360} -{"current_steps": 16340, "total_steps": 20825, "loss": 0.9515, "learning_rate": 6.052706694325292e-06, "epoch": 0.7846338535414166, "percentage": 78.46, "elapsed_time": "23:17:36", "remaining_time": "6:23:36", "throughput": 1596.27, "total_tokens": 133857280} -{"current_steps": 16350, "total_steps": 20825, "loss": 0.9599, "learning_rate": 6.026885434170457e-06, "epoch": 0.7851140456182473, "percentage": 78.51, "elapsed_time": "23:18:29", "remaining_time": "6:22:46", "throughput": 1596.23, "total_tokens": 133939200} -{"current_steps": 16360, "total_steps": 20825, "loss": 0.975, "learning_rate": 6.001111818418859e-06, "epoch": 0.7855942376950781, "percentage": 78.56, "elapsed_time": "23:19:23", "remaining_time": "6:21:55", "throughput": 1596.19, "total_tokens": 134021120} -{"current_steps": 16370, "total_steps": 20825, "loss": 0.9928, "learning_rate": 5.975385911792006e-06, "epoch": 0.7860744297719088, "percentage": 78.61, "elapsed_time": "23:20:16", "remaining_time": "6:21:04", "throughput": 1596.15, "total_tokens": 134103040} -{"current_steps": 16380, "total_steps": 20825, "loss": 1.0484, "learning_rate": 5.9497077788916055e-06, "epoch": 0.7865546218487395, "percentage": 78.66, "elapsed_time": "23:21:09", "remaining_time": "6:20:13", "throughput": 1596.12, "total_tokens": 134184960} -{"current_steps": 16390, "total_steps": 20825, "loss": 0.832, "learning_rate": 5.924077484199389e-06, "epoch": 0.7870348139255702, "percentage": 78.7, "elapsed_time": "23:22:04", "remaining_time": "6:19:23", "throughput": 1596.05, "total_tokens": 134266880} -{"current_steps": 16400, "total_steps": 20825, "loss": 0.7669, "learning_rate": 5.89849509207695e-06, "epoch": 0.787515006002401, "percentage": 78.75, "elapsed_time": "23:23:01", "remaining_time": "6:18:33", "throughput": 1595.94, "total_tokens": 134348800} -{"current_steps": 16410, "total_steps": 20825, "loss": 0.9089, "learning_rate": 5.872960666765618e-06, "epoch": 0.7879951980792317, "percentage": 78.8, "elapsed_time": "23:23:56", "remaining_time": "6:17:43", "throughput": 1595.88, "total_tokens": 134430720} -{"current_steps": 16420, "total_steps": 20825, "loss": 1.5337, "learning_rate": 5.847474272386239e-06, "epoch": 0.7884753901560624, "percentage": 78.85, "elapsed_time": "23:24:52", "remaining_time": "6:16:53", "throughput": 1595.79, "total_tokens": 134512640} -{"current_steps": 16430, "total_steps": 20825, "loss": 0.8218, "learning_rate": 5.822035972939069e-06, "epoch": 0.7889555822328932, "percentage": 78.9, "elapsed_time": "23:25:46", "remaining_time": "6:16:02", "throughput": 1595.74, "total_tokens": 134594560} -{"current_steps": 16440, "total_steps": 20825, "loss": 0.8714, "learning_rate": 5.79664583230359e-06, "epoch": 0.7894357743097239, "percentage": 78.94, "elapsed_time": "23:26:40", "remaining_time": "6:15:11", "throughput": 1595.69, "total_tokens": 134676480} -{"current_steps": 16450, "total_steps": 20825, "loss": 0.7859, "learning_rate": 5.771303914238333e-06, "epoch": 0.7899159663865546, "percentage": 78.99, "elapsed_time": "23:27:35", "remaining_time": "6:14:21", "throughput": 1595.61, "total_tokens": 134758400} -{"current_steps": 16460, "total_steps": 20825, "loss": 0.8862, "learning_rate": 5.746010282380745e-06, "epoch": 0.7903961584633854, "percentage": 79.04, "elapsed_time": "23:28:32", "remaining_time": "6:13:31", "throughput": 1595.51, "total_tokens": 134840320} -{"current_steps": 16470, "total_steps": 20825, "loss": 0.7945, "learning_rate": 5.7207650002470274e-06, "epoch": 0.7908763505402161, "percentage": 79.09, "elapsed_time": "23:29:27", "remaining_time": "6:12:41", "throughput": 1595.45, "total_tokens": 134922240} -{"current_steps": 16480, "total_steps": 20825, "loss": 0.8114, "learning_rate": 5.695568131231949e-06, "epoch": 0.7913565426170468, "percentage": 79.14, "elapsed_time": "23:30:22", "remaining_time": "6:11:50", "throughput": 1595.37, "total_tokens": 135004160} -{"current_steps": 16490, "total_steps": 20825, "loss": 0.7961, "learning_rate": 5.670419738608723e-06, "epoch": 0.7918367346938775, "percentage": 79.18, "elapsed_time": "23:31:17", "remaining_time": "6:11:00", "throughput": 1595.3, "total_tokens": 135086080} -{"current_steps": 16500, "total_steps": 20825, "loss": 0.867, "learning_rate": 5.645319885528824e-06, "epoch": 0.7923169267707083, "percentage": 79.23, "elapsed_time": "23:32:11", "remaining_time": "6:10:09", "throughput": 1595.25, "total_tokens": 135168000} -{"current_steps": 16510, "total_steps": 20825, "loss": 0.8139, "learning_rate": 5.620268635021825e-06, "epoch": 0.792797118847539, "percentage": 79.28, "elapsed_time": "23:33:05", "remaining_time": "6:09:19", "throughput": 1595.2, "total_tokens": 135249920} -{"current_steps": 16520, "total_steps": 20825, "loss": 0.9577, "learning_rate": 5.595266049995268e-06, "epoch": 0.7932773109243697, "percentage": 79.33, "elapsed_time": "23:34:00", "remaining_time": "6:08:28", "throughput": 1595.13, "total_tokens": 135331840} -{"current_steps": 16530, "total_steps": 20825, "loss": 0.9578, "learning_rate": 5.5703121932344896e-06, "epoch": 0.7937575030012005, "percentage": 79.38, "elapsed_time": "23:34:56", "remaining_time": "6:07:38", "throughput": 1595.05, "total_tokens": 135413760} -{"current_steps": 16540, "total_steps": 20825, "loss": 0.8885, "learning_rate": 5.5454071274024436e-06, "epoch": 0.7942376950780312, "percentage": 79.42, "elapsed_time": "23:35:51", "remaining_time": "6:06:48", "throughput": 1594.97, "total_tokens": 135495680} -{"current_steps": 16550, "total_steps": 20825, "loss": 0.9609, "learning_rate": 5.520550915039579e-06, "epoch": 0.7947178871548619, "percentage": 79.47, "elapsed_time": "23:36:46", "remaining_time": "6:05:57", "throughput": 1594.92, "total_tokens": 135577600} -{"current_steps": 16560, "total_steps": 20825, "loss": 0.8386, "learning_rate": 5.495743618563668e-06, "epoch": 0.7951980792316927, "percentage": 79.52, "elapsed_time": "23:37:40", "remaining_time": "6:05:07", "throughput": 1594.86, "total_tokens": 135659520} -{"current_steps": 16570, "total_steps": 20825, "loss": 0.8747, "learning_rate": 5.4709853002696236e-06, "epoch": 0.7956782713085234, "percentage": 79.57, "elapsed_time": "23:38:35", "remaining_time": "6:04:16", "throughput": 1594.79, "total_tokens": 135741440} -{"current_steps": 16580, "total_steps": 20825, "loss": 0.8467, "learning_rate": 5.4462760223294e-06, "epoch": 0.7961584633853541, "percentage": 79.62, "elapsed_time": "23:39:29", "remaining_time": "6:03:26", "throughput": 1594.74, "total_tokens": 135823360} -{"current_steps": 16590, "total_steps": 20825, "loss": 0.8295, "learning_rate": 5.42161584679178e-06, "epoch": 0.7966386554621848, "percentage": 79.66, "elapsed_time": "23:40:26", "remaining_time": "6:02:36", "throughput": 1594.64, "total_tokens": 135905280} -{"current_steps": 16600, "total_steps": 20825, "loss": 0.8218, "learning_rate": 5.397004835582242e-06, "epoch": 0.7971188475390156, "percentage": 79.71, "elapsed_time": "23:41:22", "remaining_time": "6:01:45", "throughput": 1594.56, "total_tokens": 135987200} -{"current_steps": 16610, "total_steps": 20825, "loss": 0.8522, "learning_rate": 5.372443050502823e-06, "epoch": 0.7975990396158463, "percentage": 79.76, "elapsed_time": "23:42:17", "remaining_time": "6:00:55", "throughput": 1594.48, "total_tokens": 136069120} -{"current_steps": 16620, "total_steps": 20825, "loss": 0.8879, "learning_rate": 5.347930553231942e-06, "epoch": 0.798079231692677, "percentage": 79.81, "elapsed_time": "23:43:11", "remaining_time": "6:00:04", "throughput": 1594.43, "total_tokens": 136151040} -{"current_steps": 16630, "total_steps": 20825, "loss": 1.0158, "learning_rate": 5.323467405324226e-06, "epoch": 0.7985594237695078, "percentage": 79.86, "elapsed_time": "23:44:06", "remaining_time": "5:59:14", "throughput": 1594.36, "total_tokens": 136232960} -{"current_steps": 16640, "total_steps": 20825, "loss": 1.0689, "learning_rate": 5.299053668210402e-06, "epoch": 0.7990396158463385, "percentage": 79.9, "elapsed_time": "23:45:03", "remaining_time": "5:58:24", "throughput": 1594.26, "total_tokens": 136314880} -{"current_steps": 16650, "total_steps": 20825, "loss": 0.7811, "learning_rate": 5.274689403197119e-06, "epoch": 0.7995198079231692, "percentage": 79.95, "elapsed_time": "23:45:58", "remaining_time": "5:57:33", "throughput": 1594.19, "total_tokens": 136396800} -{"current_steps": 16660, "total_steps": 20825, "loss": 0.8692, "learning_rate": 5.250374671466776e-06, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "23:46:52", "remaining_time": "5:56:43", "throughput": 1594.14, "total_tokens": 136478720} -{"current_steps": 16670, "total_steps": 20825, "loss": 1.1452, "learning_rate": 5.2261095340774085e-06, "epoch": 0.8004801920768307, "percentage": 80.05, "elapsed_time": "23:47:47", "remaining_time": "5:55:52", "throughput": 1594.08, "total_tokens": 136560640} -{"current_steps": 16680, "total_steps": 20825, "loss": 1.0006, "learning_rate": 5.201894051962486e-06, "epoch": 0.8009603841536614, "percentage": 80.1, "elapsed_time": "23:48:41", "remaining_time": "5:55:01", "throughput": 1594.02, "total_tokens": 136642560} -{"current_steps": 16690, "total_steps": 20825, "loss": 0.897, "learning_rate": 5.177728285930816e-06, "epoch": 0.8014405762304923, "percentage": 80.14, "elapsed_time": "23:49:36", "remaining_time": "5:54:11", "throughput": 1593.97, "total_tokens": 136724480} -{"current_steps": 16700, "total_steps": 20825, "loss": 0.7989, "learning_rate": 5.153612296666335e-06, "epoch": 0.801920768307323, "percentage": 80.19, "elapsed_time": "23:50:30", "remaining_time": "5:53:20", "throughput": 1593.91, "total_tokens": 136806400} -{"current_steps": 16710, "total_steps": 20825, "loss": 0.9656, "learning_rate": 5.129546144727998e-06, "epoch": 0.8024009603841536, "percentage": 80.24, "elapsed_time": "23:51:26", "remaining_time": "5:52:30", "throughput": 1593.83, "total_tokens": 136888320} -{"current_steps": 16720, "total_steps": 20825, "loss": 0.8726, "learning_rate": 5.105529890549618e-06, "epoch": 0.8028811524609843, "percentage": 80.29, "elapsed_time": "23:52:21", "remaining_time": "5:51:39", "throughput": 1593.75, "total_tokens": 136970240} -{"current_steps": 16730, "total_steps": 20825, "loss": 0.7868, "learning_rate": 5.081563594439676e-06, "epoch": 0.8033613445378152, "percentage": 80.34, "elapsed_time": "23:53:16", "remaining_time": "5:50:49", "throughput": 1593.69, "total_tokens": 137052160} -{"current_steps": 16740, "total_steps": 20825, "loss": 1.0533, "learning_rate": 5.057647316581232e-06, "epoch": 0.8038415366146459, "percentage": 80.38, "elapsed_time": "23:54:10", "remaining_time": "5:49:58", "throughput": 1593.64, "total_tokens": 137134080} -{"current_steps": 16750, "total_steps": 20825, "loss": 0.9322, "learning_rate": 5.033781117031738e-06, "epoch": 0.8043217286914766, "percentage": 80.43, "elapsed_time": "23:55:05", "remaining_time": "5:49:07", "throughput": 1593.59, "total_tokens": 137216000} -{"current_steps": 16760, "total_steps": 20825, "loss": 1.0616, "learning_rate": 5.0099650557228785e-06, "epoch": 0.8048019207683074, "percentage": 80.48, "elapsed_time": "23:55:55", "remaining_time": "5:48:16", "throughput": 1593.6, "total_tokens": 137297920} -{"current_steps": 16770, "total_steps": 20825, "loss": 0.8815, "learning_rate": 4.986199192460428e-06, "epoch": 0.8052821128451381, "percentage": 80.53, "elapsed_time": "23:56:48", "remaining_time": "5:47:25", "throughput": 1593.58, "total_tokens": 137379840} -{"current_steps": 16780, "total_steps": 20825, "loss": 0.7737, "learning_rate": 4.962483586924136e-06, "epoch": 0.8057623049219688, "percentage": 80.58, "elapsed_time": "23:57:40", "remaining_time": "5:46:33", "throughput": 1593.57, "total_tokens": 137461760} -{"current_steps": 16790, "total_steps": 20825, "loss": 0.8263, "learning_rate": 4.93881829866751e-06, "epoch": 0.8062424969987996, "percentage": 80.62, "elapsed_time": "23:58:32", "remaining_time": "5:45:42", "throughput": 1593.55, "total_tokens": 137543680} -{"current_steps": 16800, "total_steps": 20825, "loss": 0.9976, "learning_rate": 4.915203387117736e-06, "epoch": 0.8067226890756303, "percentage": 80.67, "elapsed_time": "23:59:29", "remaining_time": "5:44:52", "throughput": 1593.44, "total_tokens": 137625600} -{"current_steps": 16810, "total_steps": 20825, "loss": 0.8821, "learning_rate": 4.891638911575483e-06, "epoch": 0.807202881152461, "percentage": 80.72, "elapsed_time": "1 day, 0:00:23", "remaining_time": "5:44:01", "throughput": 1593.4, "total_tokens": 137707520} -{"current_steps": 16820, "total_steps": 20825, "loss": 0.9083, "learning_rate": 4.868124931214752e-06, "epoch": 0.8076830732292917, "percentage": 80.77, "elapsed_time": "1 day, 0:01:17", "remaining_time": "5:43:11", "throughput": 1593.35, "total_tokens": 137789440} -{"current_steps": 16830, "total_steps": 20825, "loss": 0.8356, "learning_rate": 4.844661505082768e-06, "epoch": 0.8081632653061225, "percentage": 80.82, "elapsed_time": "1 day, 0:02:11", "remaining_time": "5:42:20", "throughput": 1593.31, "total_tokens": 137871360} -{"current_steps": 16840, "total_steps": 20825, "loss": 0.7684, "learning_rate": 4.8212486920998005e-06, "epoch": 0.8086434573829532, "percentage": 80.86, "elapsed_time": "1 day, 0:03:05", "remaining_time": "5:41:29", "throughput": 1593.27, "total_tokens": 137953280} -{"current_steps": 16850, "total_steps": 20825, "loss": 0.9145, "learning_rate": 4.797886551059011e-06, "epoch": 0.8091236494597839, "percentage": 80.91, "elapsed_time": "1 day, 0:03:58", "remaining_time": "5:40:38", "throughput": 1593.23, "total_tokens": 138035200} -{"current_steps": 16860, "total_steps": 20825, "loss": 0.9692, "learning_rate": 4.7745751406263165e-06, "epoch": 0.8096038415366147, "percentage": 80.96, "elapsed_time": "1 day, 0:04:52", "remaining_time": "5:39:47", "throughput": 1593.19, "total_tokens": 138117120} -{"current_steps": 16870, "total_steps": 20825, "loss": 0.8577, "learning_rate": 4.751314519340258e-06, "epoch": 0.8100840336134454, "percentage": 81.01, "elapsed_time": "1 day, 0:05:45", "remaining_time": "5:38:56", "throughput": 1593.15, "total_tokens": 138199040} -{"current_steps": 16880, "total_steps": 20825, "loss": 0.8875, "learning_rate": 4.728104745611814e-06, "epoch": 0.8105642256902761, "percentage": 81.06, "elapsed_time": "1 day, 0:06:40", "remaining_time": "5:38:06", "throughput": 1593.09, "total_tokens": 138280960} -{"current_steps": 16890, "total_steps": 20825, "loss": 1.0989, "learning_rate": 4.704945877724295e-06, "epoch": 0.8110444177671069, "percentage": 81.1, "elapsed_time": "1 day, 0:07:31", "remaining_time": "5:37:14", "throughput": 1593.1, "total_tokens": 138362880} -{"current_steps": 16900, "total_steps": 20825, "loss": 0.9019, "learning_rate": 4.681837973833181e-06, "epoch": 0.8115246098439376, "percentage": 81.15, "elapsed_time": "1 day, 0:08:29", "remaining_time": "5:36:24", "throughput": 1592.98, "total_tokens": 138444800} -{"current_steps": 16910, "total_steps": 20825, "loss": 0.8082, "learning_rate": 4.658781091965955e-06, "epoch": 0.8120048019207683, "percentage": 81.2, "elapsed_time": "1 day, 0:09:31", "remaining_time": "5:35:35", "throughput": 1592.79, "total_tokens": 138526720} -{"current_steps": 16920, "total_steps": 20825, "loss": 0.8978, "learning_rate": 4.635775290021988e-06, "epoch": 0.812484993997599, "percentage": 81.25, "elapsed_time": "1 day, 0:10:33", "remaining_time": "5:34:46", "throughput": 1592.59, "total_tokens": 138608640} -{"current_steps": 16930, "total_steps": 20825, "loss": 0.6356, "learning_rate": 4.612820625772391e-06, "epoch": 0.8129651860744298, "percentage": 81.3, "elapsed_time": "1 day, 0:11:35", "remaining_time": "5:33:57", "throughput": 1592.4, "total_tokens": 138690560} -{"current_steps": 16940, "total_steps": 20825, "loss": 0.8645, "learning_rate": 4.589917156859838e-06, "epoch": 0.8134453781512605, "percentage": 81.34, "elapsed_time": "1 day, 0:12:36", "remaining_time": "5:33:08", "throughput": 1592.22, "total_tokens": 138772480} -{"current_steps": 16950, "total_steps": 20825, "loss": 0.8896, "learning_rate": 4.5670649407984625e-06, "epoch": 0.8139255702280912, "percentage": 81.39, "elapsed_time": "1 day, 0:13:37", "remaining_time": "5:32:19", "throughput": 1592.04, "total_tokens": 138854400} -{"current_steps": 16960, "total_steps": 20825, "loss": 0.7794, "learning_rate": 4.544264034973686e-06, "epoch": 0.814405762304922, "percentage": 81.44, "elapsed_time": "1 day, 0:14:40", "remaining_time": "5:31:30", "throughput": 1591.83, "total_tokens": 138936320} -{"current_steps": 16970, "total_steps": 20825, "loss": 0.9631, "learning_rate": 4.521514496642074e-06, "epoch": 0.8148859543817527, "percentage": 81.49, "elapsed_time": "1 day, 0:15:42", "remaining_time": "5:30:41", "throughput": 1591.64, "total_tokens": 139018240} -{"current_steps": 16980, "total_steps": 20825, "loss": 0.9246, "learning_rate": 4.498816382931217e-06, "epoch": 0.8153661464585834, "percentage": 81.54, "elapsed_time": "1 day, 0:16:44", "remaining_time": "5:29:52", "throughput": 1591.44, "total_tokens": 139100160} -{"current_steps": 16990, "total_steps": 20825, "loss": 1.0151, "learning_rate": 4.476169750839571e-06, "epoch": 0.8158463385354142, "percentage": 81.58, "elapsed_time": "1 day, 0:17:44", "remaining_time": "5:29:02", "throughput": 1591.29, "total_tokens": 139182080} -{"current_steps": 17000, "total_steps": 20825, "loss": 0.8939, "learning_rate": 4.45357465723629e-06, "epoch": 0.8163265306122449, "percentage": 81.63, "elapsed_time": "1 day, 0:18:37", "remaining_time": "5:28:11", "throughput": 1591.26, "total_tokens": 139264000} -{"current_steps": 17010, "total_steps": 20825, "loss": 0.8846, "learning_rate": 4.4310311588611294e-06, "epoch": 0.8168067226890756, "percentage": 81.68, "elapsed_time": "1 day, 0:19:33", "remaining_time": "5:27:21", "throughput": 1591.18, "total_tokens": 139345920} -{"current_steps": 17020, "total_steps": 20825, "loss": 0.8446, "learning_rate": 4.408539312324281e-06, "epoch": 0.8172869147659063, "percentage": 81.73, "elapsed_time": "1 day, 0:20:26", "remaining_time": "5:26:29", "throughput": 1591.16, "total_tokens": 139427840} -{"current_steps": 17030, "total_steps": 20825, "loss": 0.8381, "learning_rate": 4.386099174106212e-06, "epoch": 0.8177671068427371, "percentage": 81.78, "elapsed_time": "1 day, 0:21:22", "remaining_time": "5:25:39", "throughput": 1591.09, "total_tokens": 139509760} -{"current_steps": 17040, "total_steps": 20825, "loss": 0.9471, "learning_rate": 4.363710800557566e-06, "epoch": 0.8182472989195678, "percentage": 81.82, "elapsed_time": "1 day, 0:22:15", "remaining_time": "5:24:48", "throughput": 1591.06, "total_tokens": 139591680} -{"current_steps": 17050, "total_steps": 20825, "loss": 0.7787, "learning_rate": 4.341374247898983e-06, "epoch": 0.8187274909963985, "percentage": 81.87, "elapsed_time": "1 day, 0:23:16", "remaining_time": "5:23:58", "throughput": 1590.88, "total_tokens": 139673600} -{"current_steps": 17060, "total_steps": 20825, "loss": 0.9487, "learning_rate": 4.3190895722209635e-06, "epoch": 0.8192076830732293, "percentage": 81.92, "elapsed_time": "1 day, 0:24:11", "remaining_time": "5:23:08", "throughput": 1590.82, "total_tokens": 139755520} -{"current_steps": 17070, "total_steps": 20825, "loss": 0.884, "learning_rate": 4.296856829483759e-06, "epoch": 0.81968787515006, "percentage": 81.97, "elapsed_time": "1 day, 0:25:10", "remaining_time": "5:22:18", "throughput": 1590.68, "total_tokens": 139837440} -{"current_steps": 17080, "total_steps": 20825, "loss": 0.741, "learning_rate": 4.274676075517206e-06, "epoch": 0.8201680672268907, "percentage": 82.02, "elapsed_time": "1 day, 0:26:05", "remaining_time": "5:21:27", "throughput": 1590.62, "total_tokens": 139919360} -{"current_steps": 17090, "total_steps": 20825, "loss": 0.8349, "learning_rate": 4.252547366020568e-06, "epoch": 0.8206482593037215, "percentage": 82.06, "elapsed_time": "1 day, 0:26:57", "remaining_time": "5:20:36", "throughput": 1590.61, "total_tokens": 140001280} -{"current_steps": 17100, "total_steps": 20825, "loss": 0.9832, "learning_rate": 4.230470756562438e-06, "epoch": 0.8211284513805522, "percentage": 82.11, "elapsed_time": "1 day, 0:27:48", "remaining_time": "5:19:44", "throughput": 1590.61, "total_tokens": 140083200} -{"current_steps": 17110, "total_steps": 20825, "loss": 0.7601, "learning_rate": 4.208446302580582e-06, "epoch": 0.8216086434573829, "percentage": 82.16, "elapsed_time": "1 day, 0:28:45", "remaining_time": "5:18:54", "throughput": 1590.52, "total_tokens": 140165120} -{"current_steps": 17120, "total_steps": 20825, "loss": 0.7198, "learning_rate": 4.186474059381768e-06, "epoch": 0.8220888355342136, "percentage": 82.21, "elapsed_time": "1 day, 0:29:39", "remaining_time": "5:18:03", "throughput": 1590.47, "total_tokens": 140247040} -{"current_steps": 17130, "total_steps": 20825, "loss": 0.8547, "learning_rate": 4.164554082141683e-06, "epoch": 0.8225690276110444, "percentage": 82.26, "elapsed_time": "1 day, 0:30:34", "remaining_time": "5:17:12", "throughput": 1590.4, "total_tokens": 140328960} -{"current_steps": 17140, "total_steps": 20825, "loss": 0.8511, "learning_rate": 4.142686425904752e-06, "epoch": 0.8230492196878751, "percentage": 82.3, "elapsed_time": "1 day, 0:31:28", "remaining_time": "5:16:21", "throughput": 1590.36, "total_tokens": 140410880} -{"current_steps": 17150, "total_steps": 20825, "loss": 0.8076, "learning_rate": 4.12087114558401e-06, "epoch": 0.8235294117647058, "percentage": 82.35, "elapsed_time": "1 day, 0:32:22", "remaining_time": "5:15:30", "throughput": 1590.32, "total_tokens": 140492800} -{"current_steps": 17160, "total_steps": 20825, "loss": 0.7348, "learning_rate": 4.099108295960977e-06, "epoch": 0.8240096038415367, "percentage": 82.4, "elapsed_time": "1 day, 0:33:17", "remaining_time": "5:14:39", "throughput": 1590.26, "total_tokens": 140574720} -{"current_steps": 17170, "total_steps": 20825, "loss": 0.8413, "learning_rate": 4.077397931685523e-06, "epoch": 0.8244897959183674, "percentage": 82.45, "elapsed_time": "1 day, 0:34:11", "remaining_time": "5:13:48", "throughput": 1590.2, "total_tokens": 140656640} -{"current_steps": 17180, "total_steps": 20825, "loss": 1.1131, "learning_rate": 4.055740107275685e-06, "epoch": 0.824969987995198, "percentage": 82.5, "elapsed_time": "1 day, 0:35:06", "remaining_time": "5:12:57", "throughput": 1590.16, "total_tokens": 140738560} -{"current_steps": 17190, "total_steps": 20825, "loss": 0.9822, "learning_rate": 4.0341348771175955e-06, "epoch": 0.8254501800720289, "percentage": 82.55, "elapsed_time": "1 day, 0:35:58", "remaining_time": "5:12:06", "throughput": 1590.13, "total_tokens": 140820480} -{"current_steps": 17200, "total_steps": 20825, "loss": 0.834, "learning_rate": 4.012582295465308e-06, "epoch": 0.8259303721488596, "percentage": 82.59, "elapsed_time": "1 day, 0:39:22", "remaining_time": "5:11:47", "throughput": 1587.41, "total_tokens": 140902400} -{"current_steps": 17210, "total_steps": 20825, "loss": 0.8526, "learning_rate": 3.991082416440656e-06, "epoch": 0.8264105642256903, "percentage": 82.64, "elapsed_time": "1 day, 0:43:35", "remaining_time": "5:11:37", "throughput": 1583.82, "total_tokens": 140984320} -{"current_steps": 17220, "total_steps": 20825, "loss": 0.794, "learning_rate": 3.969635294033144e-06, "epoch": 0.826890756302521, "percentage": 82.69, "elapsed_time": "1 day, 0:44:28", "remaining_time": "5:10:46", "throughput": 1583.79, "total_tokens": 141066240} -{"current_steps": 17230, "total_steps": 20825, "loss": 0.8676, "learning_rate": 3.9482409820997826e-06, "epoch": 0.8273709483793518, "percentage": 82.74, "elapsed_time": "1 day, 0:45:23", "remaining_time": "5:09:55", "throughput": 1583.73, "total_tokens": 141148160} -{"current_steps": 17240, "total_steps": 20825, "loss": 0.9085, "learning_rate": 3.926899534364969e-06, "epoch": 0.8278511404561825, "percentage": 82.79, "elapsed_time": "1 day, 0:46:20", "remaining_time": "5:09:04", "throughput": 1583.65, "total_tokens": 141230080} -{"current_steps": 17250, "total_steps": 20825, "loss": 0.8688, "learning_rate": 3.90561100442036e-06, "epoch": 0.8283313325330132, "percentage": 82.83, "elapsed_time": "1 day, 0:47:17", "remaining_time": "5:08:14", "throughput": 1583.54, "total_tokens": 141312000} -{"current_steps": 17260, "total_steps": 20825, "loss": 1.0517, "learning_rate": 3.8843754457247275e-06, "epoch": 0.828811524609844, "percentage": 82.88, "elapsed_time": "1 day, 0:48:14", "remaining_time": "5:07:23", "throughput": 1583.45, "total_tokens": 141393920} -{"current_steps": 17270, "total_steps": 20825, "loss": 0.9196, "learning_rate": 3.863192911603808e-06, "epoch": 0.8292917166866747, "percentage": 82.93, "elapsed_time": "1 day, 0:49:12", "remaining_time": "5:06:33", "throughput": 1583.34, "total_tokens": 141475840} -{"current_steps": 17280, "total_steps": 20825, "loss": 0.9045, "learning_rate": 3.842063455250203e-06, "epoch": 0.8297719087635054, "percentage": 82.98, "elapsed_time": "1 day, 0:50:08", "remaining_time": "5:05:42", "throughput": 1583.28, "total_tokens": 141557760} -{"current_steps": 17290, "total_steps": 20825, "loss": 0.8666, "learning_rate": 3.820987129723228e-06, "epoch": 0.8302521008403362, "percentage": 83.03, "elapsed_time": "1 day, 0:51:02", "remaining_time": "5:04:50", "throughput": 1583.24, "total_tokens": 141639680} -{"current_steps": 17300, "total_steps": 20825, "loss": 0.788, "learning_rate": 3.799963987948757e-06, "epoch": 0.8307322929171669, "percentage": 83.07, "elapsed_time": "1 day, 0:51:56", "remaining_time": "5:03:59", "throughput": 1583.19, "total_tokens": 141721600} -{"current_steps": 17310, "total_steps": 20825, "loss": 0.8889, "learning_rate": 3.7789940827191395e-06, "epoch": 0.8312124849939976, "percentage": 83.12, "elapsed_time": "1 day, 0:52:52", "remaining_time": "5:03:08", "throughput": 1583.11, "total_tokens": 141803520} -{"current_steps": 17320, "total_steps": 20825, "loss": 0.8877, "learning_rate": 3.7580774666930134e-06, "epoch": 0.8316926770708283, "percentage": 83.17, "elapsed_time": "1 day, 0:53:49", "remaining_time": "5:02:18", "throughput": 1583.03, "total_tokens": 141885440} -{"current_steps": 17330, "total_steps": 20825, "loss": 0.8935, "learning_rate": 3.737214192395225e-06, "epoch": 0.8321728691476591, "percentage": 83.22, "elapsed_time": "1 day, 0:54:45", "remaining_time": "5:01:27", "throughput": 1582.95, "total_tokens": 141967360} -{"current_steps": 17340, "total_steps": 20825, "loss": 1.0336, "learning_rate": 3.7164043122166508e-06, "epoch": 0.8326530612244898, "percentage": 83.27, "elapsed_time": "1 day, 0:55:42", "remaining_time": "5:00:36", "throughput": 1582.85, "total_tokens": 142049280} -{"current_steps": 17350, "total_steps": 20825, "loss": 1.0014, "learning_rate": 3.6956478784140937e-06, "epoch": 0.8331332533013205, "percentage": 83.31, "elapsed_time": "1 day, 0:56:39", "remaining_time": "4:59:45", "throughput": 1582.77, "total_tokens": 142131200} -{"current_steps": 17360, "total_steps": 20825, "loss": 0.9075, "learning_rate": 3.674944943110156e-06, "epoch": 0.8336134453781513, "percentage": 83.36, "elapsed_time": "1 day, 0:57:32", "remaining_time": "4:58:54", "throughput": 1582.74, "total_tokens": 142213120} -{"current_steps": 17370, "total_steps": 20825, "loss": 0.7461, "learning_rate": 3.6542955582930748e-06, "epoch": 0.834093637454982, "percentage": 83.41, "elapsed_time": "1 day, 0:58:25", "remaining_time": "4:58:02", "throughput": 1582.72, "total_tokens": 142295040} -{"current_steps": 17380, "total_steps": 20825, "loss": 0.9869, "learning_rate": 3.6336997758166263e-06, "epoch": 0.8345738295318127, "percentage": 83.46, "elapsed_time": "1 day, 0:59:17", "remaining_time": "4:57:10", "throughput": 1582.72, "total_tokens": 142376960} -{"current_steps": 17390, "total_steps": 20825, "loss": 0.775, "learning_rate": 3.6131576473999924e-06, "epoch": 0.8350540216086435, "percentage": 83.51, "elapsed_time": "1 day, 1:00:08", "remaining_time": "4:56:19", "throughput": 1582.73, "total_tokens": 142458880} -{"current_steps": 17400, "total_steps": 20825, "loss": 0.916, "learning_rate": 3.592669224627601e-06, "epoch": 0.8355342136854742, "percentage": 83.55, "elapsed_time": "1 day, 1:00:59", "remaining_time": "4:55:27", "throughput": 1582.73, "total_tokens": 142540800} -{"current_steps": 17410, "total_steps": 20825, "loss": 1.0457, "learning_rate": 3.5722345589490306e-06, "epoch": 0.8360144057623049, "percentage": 83.6, "elapsed_time": "1 day, 1:01:50", "remaining_time": "4:54:35", "throughput": 1582.75, "total_tokens": 142622720} -{"current_steps": 17420, "total_steps": 20825, "loss": 1.0179, "learning_rate": 3.5518537016788646e-06, "epoch": 0.8364945978391356, "percentage": 83.65, "elapsed_time": "1 day, 1:02:39", "remaining_time": "4:53:43", "throughput": 1582.8, "total_tokens": 142704640} -{"current_steps": 17430, "total_steps": 20825, "loss": 0.8232, "learning_rate": 3.531526703996557e-06, "epoch": 0.8369747899159664, "percentage": 83.7, "elapsed_time": "1 day, 1:03:28", "remaining_time": "4:52:50", "throughput": 1582.86, "total_tokens": 142786560} -{"current_steps": 17440, "total_steps": 20825, "loss": 0.9279, "learning_rate": 3.511253616946325e-06, "epoch": 0.8374549819927971, "percentage": 83.75, "elapsed_time": "1 day, 1:04:17", "remaining_time": "4:51:58", "throughput": 1582.9, "total_tokens": 142868480} -{"current_steps": 17450, "total_steps": 20825, "loss": 0.8721, "learning_rate": 3.4910344914370093e-06, "epoch": 0.8379351740696278, "percentage": 83.79, "elapsed_time": "1 day, 1:05:08", "remaining_time": "4:51:06", "throughput": 1582.91, "total_tokens": 142950400} -{"current_steps": 17460, "total_steps": 20825, "loss": 0.8941, "learning_rate": 3.4708693782419225e-06, "epoch": 0.8384153661464586, "percentage": 83.84, "elapsed_time": "1 day, 1:05:58", "remaining_time": "4:50:14", "throughput": 1582.95, "total_tokens": 143032320} -{"current_steps": 17470, "total_steps": 20825, "loss": 0.8403, "learning_rate": 3.450758327998768e-06, "epoch": 0.8388955582232893, "percentage": 83.89, "elapsed_time": "1 day, 1:06:48", "remaining_time": "4:49:22", "throughput": 1582.98, "total_tokens": 143114240} -{"current_steps": 17480, "total_steps": 20825, "loss": 0.9405, "learning_rate": 3.4307013912094845e-06, "epoch": 0.83937575030012, "percentage": 83.94, "elapsed_time": "1 day, 1:07:39", "remaining_time": "4:48:30", "throughput": 1582.99, "total_tokens": 143196160} -{"current_steps": 17490, "total_steps": 20825, "loss": 0.6972, "learning_rate": 3.41069861824011e-06, "epoch": 0.8398559423769508, "percentage": 83.99, "elapsed_time": "1 day, 1:08:32", "remaining_time": "4:47:38", "throughput": 1582.97, "total_tokens": 143278080} -{"current_steps": 17500, "total_steps": 20825, "loss": 0.9488, "learning_rate": 3.390750059320688e-06, "epoch": 0.8403361344537815, "percentage": 84.03, "elapsed_time": "1 day, 1:09:24", "remaining_time": "4:46:47", "throughput": 1582.96, "total_tokens": 143360000} -{"current_steps": 17510, "total_steps": 20825, "loss": 0.7979, "learning_rate": 3.3708557645451053e-06, "epoch": 0.8408163265306122, "percentage": 84.08, "elapsed_time": "1 day, 1:10:18", "remaining_time": "4:45:55", "throughput": 1582.92, "total_tokens": 143441920} -{"current_steps": 17520, "total_steps": 20825, "loss": 0.9223, "learning_rate": 3.3510157838709895e-06, "epoch": 0.8412965186074429, "percentage": 84.13, "elapsed_time": "1 day, 1:11:15", "remaining_time": "4:45:05", "throughput": 1582.83, "total_tokens": 143523840} -{"current_steps": 17530, "total_steps": 20825, "loss": 1.0832, "learning_rate": 3.3312301671195784e-06, "epoch": 0.8417767106842737, "percentage": 84.18, "elapsed_time": "1 day, 1:12:08", "remaining_time": "4:44:13", "throughput": 1582.81, "total_tokens": 143605760} -{"current_steps": 17540, "total_steps": 20825, "loss": 0.8365, "learning_rate": 3.3114989639755983e-06, "epoch": 0.8422569027611044, "percentage": 84.23, "elapsed_time": "1 day, 1:13:02", "remaining_time": "4:43:22", "throughput": 1582.78, "total_tokens": 143687680} -{"current_steps": 17550, "total_steps": 20825, "loss": 0.8637, "learning_rate": 3.2918222239871206e-06, "epoch": 0.8427370948379351, "percentage": 84.27, "elapsed_time": "1 day, 1:13:52", "remaining_time": "4:42:30", "throughput": 1582.8, "total_tokens": 143769600} -{"current_steps": 17560, "total_steps": 20825, "loss": 0.8599, "learning_rate": 3.272199996565464e-06, "epoch": 0.8432172869147659, "percentage": 84.32, "elapsed_time": "1 day, 1:14:41", "remaining_time": "4:41:37", "throughput": 1582.85, "total_tokens": 143851520} -{"current_steps": 17570, "total_steps": 20825, "loss": 0.8833, "learning_rate": 3.252632330985059e-06, "epoch": 0.8436974789915966, "percentage": 84.37, "elapsed_time": "1 day, 1:15:29", "remaining_time": "4:40:45", "throughput": 1582.91, "total_tokens": 143933440} -{"current_steps": 17580, "total_steps": 20825, "loss": 0.8098, "learning_rate": 3.233119276383309e-06, "epoch": 0.8441776710684273, "percentage": 84.42, "elapsed_time": "1 day, 1:16:17", "remaining_time": "4:39:53", "throughput": 1582.98, "total_tokens": 144015360} -{"current_steps": 17590, "total_steps": 20825, "loss": 0.8137, "learning_rate": 3.2136608817604998e-06, "epoch": 0.8446578631452581, "percentage": 84.47, "elapsed_time": "1 day, 1:17:06", "remaining_time": "4:39:00", "throughput": 1583.03, "total_tokens": 144097280} -{"current_steps": 17600, "total_steps": 20825, "loss": 0.9244, "learning_rate": 3.1942571959796414e-06, "epoch": 0.8451380552220888, "percentage": 84.51, "elapsed_time": "1 day, 1:17:55", "remaining_time": "4:38:08", "throughput": 1583.07, "total_tokens": 144179200} -{"current_steps": 17610, "total_steps": 20825, "loss": 0.9445, "learning_rate": 3.1749082677663606e-06, "epoch": 0.8456182472989195, "percentage": 84.56, "elapsed_time": "1 day, 1:18:45", "remaining_time": "4:37:16", "throughput": 1583.11, "total_tokens": 144261120} -{"current_steps": 17620, "total_steps": 20825, "loss": 1.0138, "learning_rate": 3.1556141457087932e-06, "epoch": 0.8460984393757504, "percentage": 84.61, "elapsed_time": "1 day, 1:19:35", "remaining_time": "4:36:24", "throughput": 1583.14, "total_tokens": 144343040} -{"current_steps": 17630, "total_steps": 20825, "loss": 0.8728, "learning_rate": 3.1363748782574475e-06, "epoch": 0.846578631452581, "percentage": 84.66, "elapsed_time": "1 day, 1:20:58", "remaining_time": "4:35:38", "throughput": 1582.6, "total_tokens": 144424960} -{"current_steps": 17640, "total_steps": 20825, "loss": 0.8881, "learning_rate": 3.1171905137250655e-06, "epoch": 0.8470588235294118, "percentage": 84.71, "elapsed_time": "1 day, 1:22:11", "remaining_time": "4:34:50", "throughput": 1582.23, "total_tokens": 144506880} -{"current_steps": 17650, "total_steps": 20825, "loss": 0.8107, "learning_rate": 3.098061100286537e-06, "epoch": 0.8475390156062425, "percentage": 84.75, "elapsed_time": "1 day, 1:23:06", "remaining_time": "4:33:59", "throughput": 1582.17, "total_tokens": 144588800} -{"current_steps": 17660, "total_steps": 20825, "loss": 1.0014, "learning_rate": 3.078986685978763e-06, "epoch": 0.8480192076830733, "percentage": 84.8, "elapsed_time": "1 day, 1:23:57", "remaining_time": "4:33:07", "throughput": 1582.17, "total_tokens": 144670720} -{"current_steps": 17670, "total_steps": 20825, "loss": 0.7933, "learning_rate": 3.059967318700513e-06, "epoch": 0.848499399759904, "percentage": 84.85, "elapsed_time": "1 day, 1:24:56", "remaining_time": "4:32:16", "throughput": 1582.06, "total_tokens": 144752640} -{"current_steps": 17680, "total_steps": 20825, "loss": 0.8734, "learning_rate": 3.0410030462123486e-06, "epoch": 0.8489795918367347, "percentage": 84.9, "elapsed_time": "1 day, 1:25:57", "remaining_time": "4:31:26", "throughput": 1581.9, "total_tokens": 144834560} -{"current_steps": 17690, "total_steps": 20825, "loss": 1.1692, "learning_rate": 3.022093916136465e-06, "epoch": 0.8494597839135655, "percentage": 84.95, "elapsed_time": "1 day, 1:26:52", "remaining_time": "4:30:35", "throughput": 1581.85, "total_tokens": 144916480} -{"current_steps": 17700, "total_steps": 20825, "loss": 0.8841, "learning_rate": 3.0032399759565845e-06, "epoch": 0.8499399759903962, "percentage": 84.99, "elapsed_time": "1 day, 1:27:46", "remaining_time": "4:29:43", "throughput": 1581.81, "total_tokens": 144998400} -{"current_steps": 17710, "total_steps": 20825, "loss": 0.9305, "learning_rate": 2.9844412730178515e-06, "epoch": 0.8504201680672269, "percentage": 85.04, "elapsed_time": "1 day, 1:28:38", "remaining_time": "4:28:52", "throughput": 1581.8, "total_tokens": 145080320} -{"current_steps": 17720, "total_steps": 20825, "loss": 0.9277, "learning_rate": 2.9656978545267002e-06, "epoch": 0.8509003601440577, "percentage": 85.09, "elapsed_time": "1 day, 1:29:32", "remaining_time": "4:28:00", "throughput": 1581.77, "total_tokens": 145162240} -{"current_steps": 17730, "total_steps": 20825, "loss": 0.9099, "learning_rate": 2.947009767550718e-06, "epoch": 0.8513805522208884, "percentage": 85.14, "elapsed_time": "1 day, 1:30:25", "remaining_time": "4:27:09", "throughput": 1581.75, "total_tokens": 145244160} -{"current_steps": 17740, "total_steps": 20825, "loss": 1.0301, "learning_rate": 2.9283770590185696e-06, "epoch": 0.8518607442977191, "percentage": 85.19, "elapsed_time": "1 day, 1:31:18", "remaining_time": "4:26:17", "throughput": 1581.72, "total_tokens": 145326080} -{"current_steps": 17750, "total_steps": 20825, "loss": 1.1378, "learning_rate": 2.9097997757198516e-06, "epoch": 0.8523409363745498, "percentage": 85.23, "elapsed_time": "1 day, 1:32:10", "remaining_time": "4:25:25", "throughput": 1581.72, "total_tokens": 145408000} -{"current_steps": 17760, "total_steps": 20825, "loss": 0.8219, "learning_rate": 2.891277964304959e-06, "epoch": 0.8528211284513806, "percentage": 85.28, "elapsed_time": "1 day, 1:33:04", "remaining_time": "4:24:34", "throughput": 1581.68, "total_tokens": 145489920} -{"current_steps": 17770, "total_steps": 20825, "loss": 0.8583, "learning_rate": 2.8728116712850193e-06, "epoch": 0.8533013205282113, "percentage": 85.33, "elapsed_time": "1 day, 1:33:55", "remaining_time": "4:23:42", "throughput": 1581.69, "total_tokens": 145571840} -{"current_steps": 17780, "total_steps": 20825, "loss": 0.9945, "learning_rate": 2.8544009430317153e-06, "epoch": 0.853781512605042, "percentage": 85.38, "elapsed_time": "1 day, 1:34:40", "remaining_time": "4:22:49", "throughput": 1581.81, "total_tokens": 145653760} -{"current_steps": 17790, "total_steps": 20825, "loss": 0.9056, "learning_rate": 2.8360458257772228e-06, "epoch": 0.8542617046818728, "percentage": 85.43, "elapsed_time": "1 day, 1:35:26", "remaining_time": "4:21:56", "throughput": 1581.91, "total_tokens": 145735680} -{"current_steps": 17800, "total_steps": 20825, "loss": 0.8998, "learning_rate": 2.817746365614049e-06, "epoch": 0.8547418967587035, "percentage": 85.47, "elapsed_time": "1 day, 1:36:11", "remaining_time": "4:21:03", "throughput": 1582.03, "total_tokens": 145817600} -{"current_steps": 17810, "total_steps": 20825, "loss": 0.931, "learning_rate": 2.7995026084949584e-06, "epoch": 0.8552220888355342, "percentage": 85.52, "elapsed_time": "1 day, 1:37:04", "remaining_time": "4:20:12", "throughput": 1582.0, "total_tokens": 145899520} -{"current_steps": 17820, "total_steps": 20825, "loss": 1.0527, "learning_rate": 2.781314600232815e-06, "epoch": 0.855702280912365, "percentage": 85.57, "elapsed_time": "1 day, 1:37:59", "remaining_time": "4:19:21", "throughput": 1581.94, "total_tokens": 145981440} -{"current_steps": 17830, "total_steps": 20825, "loss": 0.8695, "learning_rate": 2.763182386500504e-06, "epoch": 0.8561824729891957, "percentage": 85.62, "elapsed_time": "1 day, 1:38:55", "remaining_time": "4:18:30", "throughput": 1581.87, "total_tokens": 146063360} -{"current_steps": 17840, "total_steps": 20825, "loss": 0.9396, "learning_rate": 2.745106012830806e-06, "epoch": 0.8566626650660264, "percentage": 85.67, "elapsed_time": "1 day, 1:39:50", "remaining_time": "4:17:38", "throughput": 1581.82, "total_tokens": 146145280} -{"current_steps": 17850, "total_steps": 20825, "loss": 1.0026, "learning_rate": 2.7270855246162547e-06, "epoch": 0.8571428571428571, "percentage": 85.71, "elapsed_time": "1 day, 1:40:45", "remaining_time": "4:16:47", "throughput": 1581.76, "total_tokens": 146227200} -{"current_steps": 17860, "total_steps": 20825, "loss": 0.9145, "learning_rate": 2.7091209671090715e-06, "epoch": 0.8576230492196879, "percentage": 85.76, "elapsed_time": "1 day, 1:41:40", "remaining_time": "4:15:56", "throughput": 1581.71, "total_tokens": 146309120} -{"current_steps": 17870, "total_steps": 20825, "loss": 0.8782, "learning_rate": 2.6912123854210212e-06, "epoch": 0.8581032412965186, "percentage": 85.81, "elapsed_time": "1 day, 1:42:35", "remaining_time": "4:15:05", "throughput": 1581.66, "total_tokens": 146391040} -{"current_steps": 17880, "total_steps": 20825, "loss": 0.9368, "learning_rate": 2.673359824523297e-06, "epoch": 0.8585834333733493, "percentage": 85.86, "elapsed_time": "1 day, 1:43:30", "remaining_time": "4:14:13", "throughput": 1581.61, "total_tokens": 146472960} -{"current_steps": 17890, "total_steps": 20825, "loss": 0.946, "learning_rate": 2.655563329246413e-06, "epoch": 0.8590636254501801, "percentage": 85.91, "elapsed_time": "1 day, 1:44:25", "remaining_time": "4:13:22", "throughput": 1581.55, "total_tokens": 146554880} -{"current_steps": 17900, "total_steps": 20825, "loss": 0.8075, "learning_rate": 2.637822944280116e-06, "epoch": 0.8595438175270108, "percentage": 85.95, "elapsed_time": "1 day, 1:45:20", "remaining_time": "4:12:31", "throughput": 1581.5, "total_tokens": 146636800} -{"current_steps": 17910, "total_steps": 20825, "loss": 0.9612, "learning_rate": 2.6201387141732205e-06, "epoch": 0.8600240096038415, "percentage": 86.0, "elapsed_time": "1 day, 1:46:07", "remaining_time": "4:11:38", "throughput": 1581.58, "total_tokens": 146718720} -{"current_steps": 17920, "total_steps": 20825, "loss": 1.0511, "learning_rate": 2.6025106833335505e-06, "epoch": 0.8605042016806723, "percentage": 86.05, "elapsed_time": "1 day, 1:46:52", "remaining_time": "4:10:45", "throughput": 1581.69, "total_tokens": 146800640} -{"current_steps": 17930, "total_steps": 20825, "loss": 0.7721, "learning_rate": 2.5849388960277997e-06, "epoch": 0.860984393757503, "percentage": 86.1, "elapsed_time": "1 day, 1:47:38", "remaining_time": "4:09:53", "throughput": 1581.79, "total_tokens": 146882560} -{"current_steps": 17940, "total_steps": 20825, "loss": 0.7826, "learning_rate": 2.567423396381419e-06, "epoch": 0.8614645858343337, "percentage": 86.15, "elapsed_time": "1 day, 1:48:23", "remaining_time": "4:09:00", "throughput": 1581.9, "total_tokens": 146964480} -{"current_steps": 17950, "total_steps": 20825, "loss": 0.7408, "learning_rate": 2.549964228378518e-06, "epoch": 0.8619447779111644, "percentage": 86.19, "elapsed_time": "1 day, 1:49:09", "remaining_time": "4:08:07", "throughput": 1582.01, "total_tokens": 147046400} -{"current_steps": 17960, "total_steps": 20825, "loss": 0.906, "learning_rate": 2.532561435861755e-06, "epoch": 0.8624249699879952, "percentage": 86.24, "elapsed_time": "1 day, 1:49:54", "remaining_time": "4:07:14", "throughput": 1582.12, "total_tokens": 147128320} -{"current_steps": 17970, "total_steps": 20825, "loss": 0.8907, "learning_rate": 2.515215062532206e-06, "epoch": 0.8629051620648259, "percentage": 86.29, "elapsed_time": "1 day, 1:50:40", "remaining_time": "4:06:21", "throughput": 1582.22, "total_tokens": 147210240} -{"current_steps": 17980, "total_steps": 20825, "loss": 0.9341, "learning_rate": 2.497925151949271e-06, "epoch": 0.8633853541416566, "percentage": 86.34, "elapsed_time": "1 day, 1:51:25", "remaining_time": "4:05:29", "throughput": 1582.33, "total_tokens": 147292160} -{"current_steps": 17990, "total_steps": 20825, "loss": 0.9855, "learning_rate": 2.4806917475305806e-06, "epoch": 0.8638655462184874, "percentage": 86.39, "elapsed_time": "1 day, 1:52:10", "remaining_time": "4:04:36", "throughput": 1582.44, "total_tokens": 147374080} -{"current_steps": 18000, "total_steps": 20825, "loss": 0.8596, "learning_rate": 2.4635148925518577e-06, "epoch": 0.8643457382953181, "percentage": 86.43, "elapsed_time": "1 day, 1:52:56", "remaining_time": "4:03:43", "throughput": 1582.55, "total_tokens": 147456000} -{"current_steps": 18010, "total_steps": 20825, "loss": 0.8384, "learning_rate": 2.4463946301468143e-06, "epoch": 0.8648259303721488, "percentage": 86.48, "elapsed_time": "1 day, 1:53:45", "remaining_time": "4:02:51", "throughput": 1582.6, "total_tokens": 147537920} -{"current_steps": 18020, "total_steps": 20825, "loss": 0.9121, "learning_rate": 2.4293310033070614e-06, "epoch": 0.8653061224489796, "percentage": 86.53, "elapsed_time": "1 day, 1:54:30", "remaining_time": "4:01:58", "throughput": 1582.71, "total_tokens": 147619840} -{"current_steps": 18030, "total_steps": 20825, "loss": 0.9519, "learning_rate": 2.4123240548819955e-06, "epoch": 0.8657863145258103, "percentage": 86.58, "elapsed_time": "1 day, 1:55:16", "remaining_time": "4:01:05", "throughput": 1582.81, "total_tokens": 147701760} -{"current_steps": 18040, "total_steps": 20825, "loss": 0.7976, "learning_rate": 2.3953738275786565e-06, "epoch": 0.866266506602641, "percentage": 86.63, "elapsed_time": "1 day, 1:56:01", "remaining_time": "4:00:13", "throughput": 1582.92, "total_tokens": 147783680} -{"current_steps": 18050, "total_steps": 20825, "loss": 0.8773, "learning_rate": 2.3784803639616854e-06, "epoch": 0.8667466986794717, "percentage": 86.67, "elapsed_time": "1 day, 1:56:46", "remaining_time": "3:59:20", "throughput": 1583.03, "total_tokens": 147865600} -{"current_steps": 18060, "total_steps": 20825, "loss": 0.8026, "learning_rate": 2.361643706453151e-06, "epoch": 0.8672268907563025, "percentage": 86.72, "elapsed_time": "1 day, 1:57:31", "remaining_time": "3:58:27", "throughput": 1583.14, "total_tokens": 147947520} -{"current_steps": 18070, "total_steps": 20825, "loss": 0.8714, "learning_rate": 2.3448638973324833e-06, "epoch": 0.8677070828331332, "percentage": 86.77, "elapsed_time": "1 day, 1:58:17", "remaining_time": "3:57:34", "throughput": 1583.25, "total_tokens": 148029440} -{"current_steps": 18080, "total_steps": 20825, "loss": 1.224, "learning_rate": 2.328140978736365e-06, "epoch": 0.868187274909964, "percentage": 86.82, "elapsed_time": "1 day, 1:59:02", "remaining_time": "3:56:42", "throughput": 1583.36, "total_tokens": 148111360} -{"current_steps": 18090, "total_steps": 20825, "loss": 0.8576, "learning_rate": 2.311474992658613e-06, "epoch": 0.8686674669867948, "percentage": 86.87, "elapsed_time": "1 day, 1:59:48", "remaining_time": "3:55:49", "throughput": 1583.46, "total_tokens": 148193280} -{"current_steps": 18100, "total_steps": 20825, "loss": 0.7746, "learning_rate": 2.29486598095007e-06, "epoch": 0.8691476590636255, "percentage": 86.91, "elapsed_time": "1 day, 2:00:33", "remaining_time": "3:54:56", "throughput": 1583.56, "total_tokens": 148275200} -{"current_steps": 18110, "total_steps": 20825, "loss": 0.9388, "learning_rate": 2.278313985318517e-06, "epoch": 0.8696278511404562, "percentage": 86.96, "elapsed_time": "1 day, 2:01:19", "remaining_time": "3:54:04", "throughput": 1583.67, "total_tokens": 148357120} -{"current_steps": 18120, "total_steps": 20825, "loss": 0.8536, "learning_rate": 2.261819047328562e-06, "epoch": 0.870108043217287, "percentage": 87.01, "elapsed_time": "1 day, 2:02:05", "remaining_time": "3:53:11", "throughput": 1583.77, "total_tokens": 148439040} -{"current_steps": 18130, "total_steps": 20825, "loss": 0.9051, "learning_rate": 2.2453812084015175e-06, "epoch": 0.8705882352941177, "percentage": 87.06, "elapsed_time": "1 day, 2:02:50", "remaining_time": "3:52:18", "throughput": 1583.88, "total_tokens": 148520960} -{"current_steps": 18140, "total_steps": 20825, "loss": 1.2451, "learning_rate": 2.2290005098153296e-06, "epoch": 0.8710684273709484, "percentage": 87.11, "elapsed_time": "1 day, 2:03:35", "remaining_time": "3:51:26", "throughput": 1583.99, "total_tokens": 148602880} -{"current_steps": 18150, "total_steps": 20825, "loss": 0.9271, "learning_rate": 2.212676992704435e-06, "epoch": 0.8715486194477791, "percentage": 87.15, "elapsed_time": "1 day, 2:04:20", "remaining_time": "3:50:33", "throughput": 1584.1, "total_tokens": 148684800} -{"current_steps": 18160, "total_steps": 20825, "loss": 0.6553, "learning_rate": 2.1964106980597034e-06, "epoch": 0.8720288115246099, "percentage": 87.2, "elapsed_time": "1 day, 2:05:06", "remaining_time": "3:49:40", "throughput": 1584.2, "total_tokens": 148766720} -{"current_steps": 18170, "total_steps": 20825, "loss": 0.8742, "learning_rate": 2.1802016667282847e-06, "epoch": 0.8725090036014406, "percentage": 87.25, "elapsed_time": "1 day, 2:05:51", "remaining_time": "3:48:48", "throughput": 1584.31, "total_tokens": 148848640} -{"current_steps": 18180, "total_steps": 20825, "loss": 0.8704, "learning_rate": 2.1640499394135595e-06, "epoch": 0.8729891956782713, "percentage": 87.3, "elapsed_time": "1 day, 2:06:37", "remaining_time": "3:47:55", "throughput": 1584.42, "total_tokens": 148930560} -{"current_steps": 18190, "total_steps": 20825, "loss": 0.9272, "learning_rate": 2.1479555566749825e-06, "epoch": 0.8734693877551021, "percentage": 87.35, "elapsed_time": "1 day, 2:07:22", "remaining_time": "3:47:03", "throughput": 1584.52, "total_tokens": 149012480} -{"current_steps": 18200, "total_steps": 20825, "loss": 0.9053, "learning_rate": 2.131918558928023e-06, "epoch": 0.8739495798319328, "percentage": 87.39, "elapsed_time": "1 day, 2:08:08", "remaining_time": "3:46:10", "throughput": 1584.62, "total_tokens": 149094400} -{"current_steps": 18210, "total_steps": 20825, "loss": 0.8871, "learning_rate": 2.1159389864440495e-06, "epoch": 0.8744297719087635, "percentage": 87.44, "elapsed_time": "1 day, 2:08:53", "remaining_time": "3:45:17", "throughput": 1584.73, "total_tokens": 149176320} -{"current_steps": 18220, "total_steps": 20825, "loss": 0.7591, "learning_rate": 2.100016879350214e-06, "epoch": 0.8749099639855943, "percentage": 87.49, "elapsed_time": "1 day, 2:09:39", "remaining_time": "3:44:25", "throughput": 1584.84, "total_tokens": 149258240} -{"current_steps": 18230, "total_steps": 20825, "loss": 0.8473, "learning_rate": 2.0841522776293725e-06, "epoch": 0.875390156062425, "percentage": 87.54, "elapsed_time": "1 day, 2:10:24", "remaining_time": "3:43:32", "throughput": 1584.94, "total_tokens": 149340160} -{"current_steps": 18240, "total_steps": 20825, "loss": 1.118, "learning_rate": 2.0683452211199854e-06, "epoch": 0.8758703481392557, "percentage": 87.59, "elapsed_time": "1 day, 2:11:09", "remaining_time": "3:42:40", "throughput": 1585.04, "total_tokens": 149422080} -{"current_steps": 18250, "total_steps": 20825, "loss": 0.8301, "learning_rate": 2.052595749515987e-06, "epoch": 0.8763505402160864, "percentage": 87.64, "elapsed_time": "1 day, 2:11:55", "remaining_time": "3:41:47", "throughput": 1585.15, "total_tokens": 149504000} -{"current_steps": 18260, "total_steps": 20825, "loss": 0.9347, "learning_rate": 2.0369039023667215e-06, "epoch": 0.8768307322929172, "percentage": 87.68, "elapsed_time": "1 day, 2:12:40", "remaining_time": "3:40:54", "throughput": 1585.26, "total_tokens": 149585920} -{"current_steps": 18270, "total_steps": 20825, "loss": 0.9084, "learning_rate": 2.0212697190768263e-06, "epoch": 0.8773109243697479, "percentage": 87.73, "elapsed_time": "1 day, 2:13:26", "remaining_time": "3:40:02", "throughput": 1585.35, "total_tokens": 149667840} -{"current_steps": 18280, "total_steps": 20825, "loss": 0.8173, "learning_rate": 2.0056932389061338e-06, "epoch": 0.8777911164465786, "percentage": 87.78, "elapsed_time": "1 day, 2:14:14", "remaining_time": "3:39:10", "throughput": 1585.42, "total_tokens": 149749760} -{"current_steps": 18290, "total_steps": 20825, "loss": 0.9435, "learning_rate": 1.9901745009695773e-06, "epoch": 0.8782713085234094, "percentage": 87.83, "elapsed_time": "1 day, 2:15:02", "remaining_time": "3:38:18", "throughput": 1585.48, "total_tokens": 149831680} -{"current_steps": 18300, "total_steps": 20825, "loss": 0.8976, "learning_rate": 1.9747135442370946e-06, "epoch": 0.8787515006002401, "percentage": 87.88, "elapsed_time": "1 day, 2:15:49", "remaining_time": "3:37:25", "throughput": 1585.56, "total_tokens": 149913600} -{"current_steps": 18310, "total_steps": 20825, "loss": 0.762, "learning_rate": 1.9593104075335158e-06, "epoch": 0.8792316926770708, "percentage": 87.92, "elapsed_time": "1 day, 2:16:37", "remaining_time": "3:36:33", "throughput": 1585.62, "total_tokens": 149995520} -{"current_steps": 18320, "total_steps": 20825, "loss": 0.8791, "learning_rate": 1.943965129538483e-06, "epoch": 0.8797118847539016, "percentage": 87.97, "elapsed_time": "1 day, 2:17:26", "remaining_time": "3:35:41", "throughput": 1585.66, "total_tokens": 150077440} -{"current_steps": 18330, "total_steps": 20825, "loss": 0.8332, "learning_rate": 1.9286777487863477e-06, "epoch": 0.8801920768307323, "percentage": 88.02, "elapsed_time": "1 day, 2:18:16", "remaining_time": "3:34:49", "throughput": 1585.7, "total_tokens": 150159360} -{"current_steps": 18340, "total_steps": 20825, "loss": 0.999, "learning_rate": 1.913448303666071e-06, "epoch": 0.880672268907563, "percentage": 88.07, "elapsed_time": "1 day, 2:19:05", "remaining_time": "3:33:57", "throughput": 1585.74, "total_tokens": 150241280} -{"current_steps": 18350, "total_steps": 20825, "loss": 0.9294, "learning_rate": 1.8982768324211197e-06, "epoch": 0.8811524609843937, "percentage": 88.12, "elapsed_time": "1 day, 2:19:53", "remaining_time": "3:33:05", "throughput": 1585.79, "total_tokens": 150323200} -{"current_steps": 18360, "total_steps": 20825, "loss": 0.9785, "learning_rate": 1.8831633731493963e-06, "epoch": 0.8816326530612245, "percentage": 88.16, "elapsed_time": "1 day, 2:20:41", "remaining_time": "3:32:13", "throughput": 1585.87, "total_tokens": 150405120} -{"current_steps": 18370, "total_steps": 20825, "loss": 0.8177, "learning_rate": 1.8681079638031062e-06, "epoch": 0.8821128451380552, "percentage": 88.21, "elapsed_time": "1 day, 2:21:28", "remaining_time": "3:31:21", "throughput": 1585.93, "total_tokens": 150487040} -{"current_steps": 18380, "total_steps": 20825, "loss": 0.8862, "learning_rate": 1.8531106421887017e-06, "epoch": 0.8825930372148859, "percentage": 88.26, "elapsed_time": "1 day, 2:22:14", "remaining_time": "3:30:28", "throughput": 1586.03, "total_tokens": 150568960} -{"current_steps": 18390, "total_steps": 20825, "loss": 0.7221, "learning_rate": 1.8381714459667603e-06, "epoch": 0.8830732292917167, "percentage": 88.31, "elapsed_time": "1 day, 2:23:01", "remaining_time": "3:29:36", "throughput": 1586.12, "total_tokens": 150650880} -{"current_steps": 18400, "total_steps": 20825, "loss": 1.0007, "learning_rate": 1.823290412651893e-06, "epoch": 0.8835534213685474, "percentage": 88.36, "elapsed_time": "1 day, 2:23:46", "remaining_time": "3:28:43", "throughput": 1586.21, "total_tokens": 150732800} -{"current_steps": 18410, "total_steps": 20825, "loss": 1.1891, "learning_rate": 1.8084675796126576e-06, "epoch": 0.8840336134453781, "percentage": 88.4, "elapsed_time": "1 day, 2:24:33", "remaining_time": "3:27:51", "throughput": 1586.3, "total_tokens": 150814720} -{"current_steps": 18420, "total_steps": 20825, "loss": 1.0123, "learning_rate": 1.7937029840714715e-06, "epoch": 0.8845138055222089, "percentage": 88.45, "elapsed_time": "1 day, 2:25:21", "remaining_time": "3:26:59", "throughput": 1586.35, "total_tokens": 150896640} -{"current_steps": 18430, "total_steps": 20825, "loss": 0.8358, "learning_rate": 1.778996663104493e-06, "epoch": 0.8849939975990396, "percentage": 88.5, "elapsed_time": "1 day, 2:26:08", "remaining_time": "3:26:07", "throughput": 1586.43, "total_tokens": 150978560} -{"current_steps": 18440, "total_steps": 20825, "loss": 0.9354, "learning_rate": 1.7643486536415537e-06, "epoch": 0.8854741896758703, "percentage": 88.55, "elapsed_time": "1 day, 2:26:54", "remaining_time": "3:25:14", "throughput": 1586.53, "total_tokens": 151060480} -{"current_steps": 18450, "total_steps": 20825, "loss": 0.8802, "learning_rate": 1.7497589924660552e-06, "epoch": 0.885954381752701, "percentage": 88.6, "elapsed_time": "1 day, 2:27:41", "remaining_time": "3:24:22", "throughput": 1586.6, "total_tokens": 151142400} -{"current_steps": 18460, "total_steps": 20825, "loss": 0.8142, "learning_rate": 1.7352277162148712e-06, "epoch": 0.8864345738295318, "percentage": 88.64, "elapsed_time": "1 day, 2:28:28", "remaining_time": "3:23:30", "throughput": 1586.68, "total_tokens": 151224320} -{"current_steps": 18470, "total_steps": 20825, "loss": 0.8752, "learning_rate": 1.7207548613782709e-06, "epoch": 0.8869147659063625, "percentage": 88.69, "elapsed_time": "1 day, 2:29:15", "remaining_time": "3:22:38", "throughput": 1586.76, "total_tokens": 151306240} -{"current_steps": 18480, "total_steps": 20825, "loss": 1.0158, "learning_rate": 1.7063404642998186e-06, "epoch": 0.8873949579831932, "percentage": 88.74, "elapsed_time": "1 day, 2:30:01", "remaining_time": "3:21:45", "throughput": 1586.86, "total_tokens": 151388160} -{"current_steps": 18490, "total_steps": 20825, "loss": 0.9463, "learning_rate": 1.6919845611762714e-06, "epoch": 0.887875150060024, "percentage": 88.79, "elapsed_time": "1 day, 2:30:49", "remaining_time": "3:20:53", "throughput": 1586.91, "total_tokens": 151470080} -{"current_steps": 18500, "total_steps": 20825, "loss": 1.0312, "learning_rate": 1.6776871880575084e-06, "epoch": 0.8883553421368547, "percentage": 88.84, "elapsed_time": "1 day, 2:31:37", "remaining_time": "3:20:01", "throughput": 1586.97, "total_tokens": 151552000} -{"current_steps": 18510, "total_steps": 20825, "loss": 0.841, "learning_rate": 1.663448380846433e-06, "epoch": 0.8888355342136854, "percentage": 88.88, "elapsed_time": "1 day, 2:32:23", "remaining_time": "3:19:09", "throughput": 1587.06, "total_tokens": 151633920} -{"current_steps": 18520, "total_steps": 20825, "loss": 0.819, "learning_rate": 1.649268175298868e-06, "epoch": 0.8893157262905163, "percentage": 88.93, "elapsed_time": "1 day, 2:33:11", "remaining_time": "3:18:17", "throughput": 1587.13, "total_tokens": 151715840} -{"current_steps": 18530, "total_steps": 20825, "loss": 1.1654, "learning_rate": 1.6351466070234882e-06, "epoch": 0.889795918367347, "percentage": 88.98, "elapsed_time": "1 day, 2:33:59", "remaining_time": "3:17:25", "throughput": 1587.19, "total_tokens": 151797760} -{"current_steps": 18540, "total_steps": 20825, "loss": 0.8883, "learning_rate": 1.6210837114817272e-06, "epoch": 0.8902761104441776, "percentage": 89.03, "elapsed_time": "1 day, 2:34:45", "remaining_time": "3:16:33", "throughput": 1587.27, "total_tokens": 151879680} -{"current_steps": 18550, "total_steps": 20825, "loss": 0.785, "learning_rate": 1.6070795239876618e-06, "epoch": 0.8907563025210085, "percentage": 89.08, "elapsed_time": "1 day, 2:35:33", "remaining_time": "3:15:40", "throughput": 1587.33, "total_tokens": 151961600} -{"current_steps": 18560, "total_steps": 20825, "loss": 0.7937, "learning_rate": 1.5931340797079613e-06, "epoch": 0.8912364945978392, "percentage": 89.12, "elapsed_time": "1 day, 2:36:23", "remaining_time": "3:14:49", "throughput": 1587.37, "total_tokens": 152043520} -{"current_steps": 18570, "total_steps": 20825, "loss": 0.8338, "learning_rate": 1.5792474136617858e-06, "epoch": 0.8917166866746699, "percentage": 89.17, "elapsed_time": "1 day, 2:37:11", "remaining_time": "3:13:57", "throughput": 1587.42, "total_tokens": 152125440} -{"current_steps": 18580, "total_steps": 20825, "loss": 0.8318, "learning_rate": 1.5654195607206712e-06, "epoch": 0.8921968787515006, "percentage": 89.22, "elapsed_time": "1 day, 2:37:59", "remaining_time": "3:13:05", "throughput": 1587.49, "total_tokens": 152207360} -{"current_steps": 18590, "total_steps": 20825, "loss": 0.8587, "learning_rate": 1.5516505556084888e-06, "epoch": 0.8926770708283314, "percentage": 89.27, "elapsed_time": "1 day, 2:38:48", "remaining_time": "3:12:13", "throughput": 1587.53, "total_tokens": 152289280} -{"current_steps": 18600, "total_steps": 20825, "loss": 1.0141, "learning_rate": 1.5379404329013246e-06, "epoch": 0.8931572629051621, "percentage": 89.32, "elapsed_time": "1 day, 2:39:36", "remaining_time": "3:11:21", "throughput": 1587.58, "total_tokens": 152371200} -{"current_steps": 18610, "total_steps": 20825, "loss": 0.8301, "learning_rate": 1.5242892270273951e-06, "epoch": 0.8936374549819928, "percentage": 89.36, "elapsed_time": "1 day, 2:40:24", "remaining_time": "3:10:29", "throughput": 1587.64, "total_tokens": 152453120} -{"current_steps": 18620, "total_steps": 20825, "loss": 0.9144, "learning_rate": 1.5106969722669812e-06, "epoch": 0.8941176470588236, "percentage": 89.41, "elapsed_time": "1 day, 2:41:14", "remaining_time": "3:09:37", "throughput": 1587.68, "total_tokens": 152535040} -{"current_steps": 18630, "total_steps": 20825, "loss": 1.1305, "learning_rate": 1.4971637027523106e-06, "epoch": 0.8945978391356543, "percentage": 89.46, "elapsed_time": "1 day, 2:42:03", "remaining_time": "3:08:45", "throughput": 1587.72, "total_tokens": 152616960} -{"current_steps": 18640, "total_steps": 20825, "loss": 0.9489, "learning_rate": 1.4836894524675126e-06, "epoch": 0.895078031212485, "percentage": 89.51, "elapsed_time": "1 day, 2:42:49", "remaining_time": "3:07:53", "throughput": 1587.8, "total_tokens": 152698880} -{"current_steps": 18650, "total_steps": 20825, "loss": 1.1124, "learning_rate": 1.4702742552484884e-06, "epoch": 0.8955582232893158, "percentage": 89.56, "elapsed_time": "1 day, 2:43:38", "remaining_time": "3:07:01", "throughput": 1587.85, "total_tokens": 152780800} -{"current_steps": 18660, "total_steps": 20825, "loss": 0.836, "learning_rate": 1.4569181447828623e-06, "epoch": 0.8960384153661465, "percentage": 89.6, "elapsed_time": "1 day, 2:44:26", "remaining_time": "3:06:09", "throughput": 1587.9, "total_tokens": 152862720} -{"current_steps": 18670, "total_steps": 20825, "loss": 1.0544, "learning_rate": 1.4436211546098782e-06, "epoch": 0.8965186074429772, "percentage": 89.65, "elapsed_time": "1 day, 2:45:14", "remaining_time": "3:05:17", "throughput": 1587.97, "total_tokens": 152944640} -{"current_steps": 18680, "total_steps": 20825, "loss": 0.9155, "learning_rate": 1.430383318120318e-06, "epoch": 0.8969987995198079, "percentage": 89.7, "elapsed_time": "1 day, 2:46:01", "remaining_time": "3:04:25", "throughput": 1588.04, "total_tokens": 153026560} -{"current_steps": 18690, "total_steps": 20825, "loss": 0.862, "learning_rate": 1.4172046685564212e-06, "epoch": 0.8974789915966387, "percentage": 89.75, "elapsed_time": "1 day, 2:46:50", "remaining_time": "3:03:33", "throughput": 1588.09, "total_tokens": 153108480} -{"current_steps": 18700, "total_steps": 20825, "loss": 0.9023, "learning_rate": 1.4040852390118042e-06, "epoch": 0.8979591836734694, "percentage": 89.8, "elapsed_time": "1 day, 2:47:42", "remaining_time": "3:02:41", "throughput": 1588.09, "total_tokens": 153190400} -{"current_steps": 18710, "total_steps": 20825, "loss": 1.0013, "learning_rate": 1.3910250624313642e-06, "epoch": 0.8984393757503001, "percentage": 89.84, "elapsed_time": "1 day, 2:48:32", "remaining_time": "3:01:49", "throughput": 1588.12, "total_tokens": 153272320} -{"current_steps": 18720, "total_steps": 20825, "loss": 0.8953, "learning_rate": 1.3780241716112057e-06, "epoch": 0.8989195678271309, "percentage": 89.89, "elapsed_time": "1 day, 2:49:22", "remaining_time": "3:00:58", "throughput": 1588.13, "total_tokens": 153354240} -{"current_steps": 18730, "total_steps": 20825, "loss": 0.8403, "learning_rate": 1.3650825991985722e-06, "epoch": 0.8993997599039616, "percentage": 89.94, "elapsed_time": "1 day, 2:50:12", "remaining_time": "3:00:06", "throughput": 1588.16, "total_tokens": 153436160} -{"current_steps": 18740, "total_steps": 20825, "loss": 0.7954, "learning_rate": 1.3522003776917285e-06, "epoch": 0.8998799519807923, "percentage": 89.99, "elapsed_time": "1 day, 2:51:00", "remaining_time": "2:59:14", "throughput": 1588.23, "total_tokens": 153518080} -{"current_steps": 18750, "total_steps": 20825, "loss": 0.8046, "learning_rate": 1.3393775394399123e-06, "epoch": 0.9003601440576231, "percentage": 90.04, "elapsed_time": "1 day, 2:51:48", "remaining_time": "2:58:22", "throughput": 1588.29, "total_tokens": 153600000} -{"current_steps": 18760, "total_steps": 20825, "loss": 0.712, "learning_rate": 1.326614116643246e-06, "epoch": 0.9008403361344538, "percentage": 90.08, "elapsed_time": "1 day, 2:52:38", "remaining_time": "2:57:30", "throughput": 1588.31, "total_tokens": 153681920} -{"current_steps": 18770, "total_steps": 20825, "loss": 0.8778, "learning_rate": 1.3139101413526339e-06, "epoch": 0.9013205282112845, "percentage": 90.13, "elapsed_time": "1 day, 2:53:28", "remaining_time": "2:56:38", "throughput": 1588.33, "total_tokens": 153763840} -{"current_steps": 18780, "total_steps": 20825, "loss": 1.0348, "learning_rate": 1.3012656454697125e-06, "epoch": 0.9018007202881152, "percentage": 90.18, "elapsed_time": "1 day, 2:54:19", "remaining_time": "2:55:47", "throughput": 1588.34, "total_tokens": 153845760} -{"current_steps": 18790, "total_steps": 20825, "loss": 0.9589, "learning_rate": 1.2886806607467578e-06, "epoch": 0.902280912364946, "percentage": 90.23, "elapsed_time": "1 day, 2:55:08", "remaining_time": "2:54:55", "throughput": 1588.39, "total_tokens": 153927680} -{"current_steps": 18800, "total_steps": 20825, "loss": 0.9268, "learning_rate": 1.2761552187865899e-06, "epoch": 0.9027611044417767, "percentage": 90.28, "elapsed_time": "1 day, 2:55:59", "remaining_time": "2:54:03", "throughput": 1588.4, "total_tokens": 154009600} -{"current_steps": 18810, "total_steps": 20825, "loss": 0.8947, "learning_rate": 1.2636893510425186e-06, "epoch": 0.9032412965186074, "percentage": 90.32, "elapsed_time": "1 day, 2:56:48", "remaining_time": "2:53:11", "throughput": 1588.44, "total_tokens": 154091520} -{"current_steps": 18820, "total_steps": 20825, "loss": 0.9701, "learning_rate": 1.2512830888182531e-06, "epoch": 0.9037214885954382, "percentage": 90.37, "elapsed_time": "1 day, 2:57:40", "remaining_time": "2:52:20", "throughput": 1588.42, "total_tokens": 154173440} -{"current_steps": 18830, "total_steps": 20825, "loss": 0.9968, "learning_rate": 1.23893646326782e-06, "epoch": 0.9042016806722689, "percentage": 90.42, "elapsed_time": "1 day, 2:58:31", "remaining_time": "2:51:28", "throughput": 1588.44, "total_tokens": 154255360} -{"current_steps": 18840, "total_steps": 20825, "loss": 0.7056, "learning_rate": 1.2266495053954913e-06, "epoch": 0.9046818727490996, "percentage": 90.47, "elapsed_time": "1 day, 2:59:19", "remaining_time": "2:50:36", "throughput": 1588.49, "total_tokens": 154337280} -{"current_steps": 18850, "total_steps": 20825, "loss": 0.8708, "learning_rate": 1.2144222460557074e-06, "epoch": 0.9051620648259304, "percentage": 90.52, "elapsed_time": "1 day, 3:00:08", "remaining_time": "2:49:45", "throughput": 1588.53, "total_tokens": 154419200} -{"current_steps": 18860, "total_steps": 20825, "loss": 1.0057, "learning_rate": 1.2022547159529911e-06, "epoch": 0.9056422569027611, "percentage": 90.56, "elapsed_time": "1 day, 3:00:57", "remaining_time": "2:48:53", "throughput": 1588.57, "total_tokens": 154501120} -{"current_steps": 18870, "total_steps": 20825, "loss": 0.8827, "learning_rate": 1.190146945641879e-06, "epoch": 0.9061224489795918, "percentage": 90.61, "elapsed_time": "1 day, 3:01:46", "remaining_time": "2:48:01", "throughput": 1588.61, "total_tokens": 154583040} -{"current_steps": 18880, "total_steps": 20825, "loss": 0.9975, "learning_rate": 1.1780989655268415e-06, "epoch": 0.9066026410564225, "percentage": 90.66, "elapsed_time": "1 day, 3:02:35", "remaining_time": "2:47:09", "throughput": 1588.66, "total_tokens": 154664960} -{"current_steps": 18890, "total_steps": 20825, "loss": 0.8246, "learning_rate": 1.1661108058622082e-06, "epoch": 0.9070828331332533, "percentage": 90.71, "elapsed_time": "1 day, 3:03:24", "remaining_time": "2:46:17", "throughput": 1588.7, "total_tokens": 154746880} -{"current_steps": 18900, "total_steps": 20825, "loss": 0.7727, "learning_rate": 1.154182496752082e-06, "epoch": 0.907563025210084, "percentage": 90.76, "elapsed_time": "1 day, 3:04:12", "remaining_time": "2:45:25", "throughput": 1588.76, "total_tokens": 154828800} -{"current_steps": 18910, "total_steps": 20825, "loss": 1.0012, "learning_rate": 1.142314068150288e-06, "epoch": 0.9080432172869147, "percentage": 90.8, "elapsed_time": "1 day, 3:04:59", "remaining_time": "2:44:33", "throughput": 1588.83, "total_tokens": 154910720} -{"current_steps": 18920, "total_steps": 20825, "loss": 0.8584, "learning_rate": 1.1305055498602584e-06, "epoch": 0.9085234093637455, "percentage": 90.85, "elapsed_time": "1 day, 3:05:46", "remaining_time": "2:43:41", "throughput": 1588.91, "total_tokens": 154992640} -{"current_steps": 18930, "total_steps": 20825, "loss": 0.8211, "learning_rate": 1.1187569715350066e-06, "epoch": 0.9090036014405762, "percentage": 90.9, "elapsed_time": "1 day, 3:06:33", "remaining_time": "2:42:49", "throughput": 1588.98, "total_tokens": 155074560} -{"current_steps": 18940, "total_steps": 20825, "loss": 0.7993, "learning_rate": 1.1070683626770162e-06, "epoch": 0.9094837935174069, "percentage": 90.95, "elapsed_time": "1 day, 3:07:22", "remaining_time": "2:41:57", "throughput": 1589.03, "total_tokens": 155156480} -{"current_steps": 18950, "total_steps": 20825, "loss": 0.88, "learning_rate": 1.0954397526381694e-06, "epoch": 0.9099639855942377, "percentage": 91.0, "elapsed_time": "1 day, 3:08:13", "remaining_time": "2:41:06", "throughput": 1589.04, "total_tokens": 155238400} -{"current_steps": 18960, "total_steps": 20825, "loss": 0.9003, "learning_rate": 1.0838711706196992e-06, "epoch": 0.9104441776710684, "percentage": 91.04, "elapsed_time": "1 day, 3:09:13", "remaining_time": "2:40:15", "throughput": 1588.89, "total_tokens": 155320320} -{"current_steps": 18970, "total_steps": 20825, "loss": 0.9935, "learning_rate": 1.0723626456720925e-06, "epoch": 0.9109243697478991, "percentage": 91.09, "elapsed_time": "1 day, 3:10:03", "remaining_time": "2:39:23", "throughput": 1588.92, "total_tokens": 155402240} -{"current_steps": 18980, "total_steps": 20825, "loss": 1.0318, "learning_rate": 1.0609142066950157e-06, "epoch": 0.9114045618247298, "percentage": 91.14, "elapsed_time": "1 day, 3:11:01", "remaining_time": "2:38:32", "throughput": 1588.82, "total_tokens": 155484160} -{"current_steps": 18990, "total_steps": 20825, "loss": 0.837, "learning_rate": 1.0495258824372578e-06, "epoch": 0.9118847539015607, "percentage": 91.19, "elapsed_time": "1 day, 3:11:52", "remaining_time": "2:37:41", "throughput": 1588.82, "total_tokens": 155566080} -{"current_steps": 19000, "total_steps": 20825, "loss": 0.7732, "learning_rate": 1.0381977014966543e-06, "epoch": 0.9123649459783914, "percentage": 91.24, "elapsed_time": "1 day, 3:12:46", "remaining_time": "2:36:49", "throughput": 1588.79, "total_tokens": 155648000} -{"current_steps": 19010, "total_steps": 20825, "loss": 1.0176, "learning_rate": 1.0269296923199972e-06, "epoch": 0.912845138055222, "percentage": 91.28, "elapsed_time": "1 day, 3:13:40", "remaining_time": "2:35:58", "throughput": 1588.74, "total_tokens": 155729920} -{"current_steps": 19020, "total_steps": 20825, "loss": 1.012, "learning_rate": 1.0157218832029969e-06, "epoch": 0.9133253301320529, "percentage": 91.33, "elapsed_time": "1 day, 3:14:29", "remaining_time": "2:35:06", "throughput": 1588.79, "total_tokens": 155811840} -{"current_steps": 19030, "total_steps": 20825, "loss": 1.009, "learning_rate": 1.0045743022901787e-06, "epoch": 0.9138055222088836, "percentage": 91.38, "elapsed_time": "1 day, 3:15:17", "remaining_time": "2:34:14", "throughput": 1588.84, "total_tokens": 155893760} -{"current_steps": 19040, "total_steps": 20825, "loss": 0.7293, "learning_rate": 9.934869775748258e-07, "epoch": 0.9142857142857143, "percentage": 91.43, "elapsed_time": "1 day, 3:16:03", "remaining_time": "2:33:22", "throughput": 1588.94, "total_tokens": 155975680} -{"current_steps": 19050, "total_steps": 20825, "loss": 0.8924, "learning_rate": 9.824599368989163e-07, "epoch": 0.9147659063625451, "percentage": 91.48, "elapsed_time": "1 day, 3:16:50", "remaining_time": "2:32:30", "throughput": 1589.01, "total_tokens": 156057600} -{"current_steps": 19060, "total_steps": 20825, "loss": 0.8136, "learning_rate": 9.714932079530476e-07, "epoch": 0.9152460984393758, "percentage": 91.52, "elapsed_time": "1 day, 3:17:37", "remaining_time": "2:31:38", "throughput": 1589.09, "total_tokens": 156139520} -{"current_steps": 19070, "total_steps": 20825, "loss": 0.7444, "learning_rate": 9.60586818276349e-07, "epoch": 0.9157262905162065, "percentage": 91.57, "elapsed_time": "1 day, 3:18:23", "remaining_time": "2:30:46", "throughput": 1589.18, "total_tokens": 156221440} -{"current_steps": 19080, "total_steps": 20825, "loss": 0.7502, "learning_rate": 9.497407952564485e-07, "epoch": 0.9162064825930372, "percentage": 91.62, "elapsed_time": "1 day, 3:19:09", "remaining_time": "2:29:54", "throughput": 1589.27, "total_tokens": 156303360} -{"current_steps": 19090, "total_steps": 20825, "loss": 0.9223, "learning_rate": 9.389551661293683e-07, "epoch": 0.916686674669868, "percentage": 91.67, "elapsed_time": "1 day, 3:19:56", "remaining_time": "2:29:02", "throughput": 1589.34, "total_tokens": 156385280} -{"current_steps": 19100, "total_steps": 20825, "loss": 0.8431, "learning_rate": 9.282299579794789e-07, "epoch": 0.9171668667466987, "percentage": 91.72, "elapsed_time": "1 day, 3:20:43", "remaining_time": "2:28:10", "throughput": 1589.4, "total_tokens": 156467200} -{"current_steps": 19110, "total_steps": 20825, "loss": 0.8672, "learning_rate": 9.175651977394284e-07, "epoch": 0.9176470588235294, "percentage": 91.76, "elapsed_time": "1 day, 3:21:34", "remaining_time": "2:27:19", "throughput": 1589.42, "total_tokens": 156549120} -{"current_steps": 19120, "total_steps": 20825, "loss": 0.8328, "learning_rate": 9.069609121900663e-07, "epoch": 0.9181272509003602, "percentage": 91.81, "elapsed_time": "1 day, 3:22:24", "remaining_time": "2:26:27", "throughput": 1589.44, "total_tokens": 156631040} -{"current_steps": 19130, "total_steps": 20825, "loss": 0.7688, "learning_rate": 8.964171279603778e-07, "epoch": 0.9186074429771909, "percentage": 91.86, "elapsed_time": "1 day, 3:23:12", "remaining_time": "2:25:35", "throughput": 1589.5, "total_tokens": 156712960} -{"current_steps": 19140, "total_steps": 20825, "loss": 0.7694, "learning_rate": 8.859338715274279e-07, "epoch": 0.9190876350540216, "percentage": 91.91, "elapsed_time": "1 day, 3:24:02", "remaining_time": "2:24:44", "throughput": 1589.53, "total_tokens": 156794880} -{"current_steps": 19150, "total_steps": 20825, "loss": 0.9128, "learning_rate": 8.755111692162837e-07, "epoch": 0.9195678271308524, "percentage": 91.96, "elapsed_time": "1 day, 3:24:51", "remaining_time": "2:23:52", "throughput": 1589.57, "total_tokens": 156876800} -{"current_steps": 19160, "total_steps": 20825, "loss": 0.9739, "learning_rate": 8.651490471999424e-07, "epoch": 0.9200480192076831, "percentage": 92.0, "elapsed_time": "1 day, 3:25:38", "remaining_time": "2:23:00", "throughput": 1589.65, "total_tokens": 156958720} -{"current_steps": 19170, "total_steps": 20825, "loss": 0.9776, "learning_rate": 8.548475314992949e-07, "epoch": 0.9205282112845138, "percentage": 92.05, "elapsed_time": "1 day, 3:26:28", "remaining_time": "2:22:08", "throughput": 1589.66, "total_tokens": 157040640} -{"current_steps": 19180, "total_steps": 20825, "loss": 0.9048, "learning_rate": 8.446066479830206e-07, "epoch": 0.9210084033613445, "percentage": 92.1, "elapsed_time": "1 day, 3:27:16", "remaining_time": "2:21:16", "throughput": 1589.72, "total_tokens": 157122560} -{"current_steps": 19190, "total_steps": 20825, "loss": 0.8928, "learning_rate": 8.344264223675485e-07, "epoch": 0.9214885954381753, "percentage": 92.15, "elapsed_time": "1 day, 3:28:03", "remaining_time": "2:20:24", "throughput": 1589.8, "total_tokens": 157204480} -{"current_steps": 19200, "total_steps": 20825, "loss": 0.8414, "learning_rate": 8.243068802169906e-07, "epoch": 0.921968787515006, "percentage": 92.2, "elapsed_time": "1 day, 3:28:51", "remaining_time": "2:19:33", "throughput": 1589.85, "total_tokens": 157286400} -{"current_steps": 19210, "total_steps": 20825, "loss": 0.9802, "learning_rate": 8.14248046943078e-07, "epoch": 0.9224489795918367, "percentage": 92.24, "elapsed_time": "1 day, 3:29:41", "remaining_time": "2:18:41", "throughput": 1589.88, "total_tokens": 157368320} -{"current_steps": 19220, "total_steps": 20825, "loss": 0.7226, "learning_rate": 8.042499478050719e-07, "epoch": 0.9229291716686675, "percentage": 92.29, "elapsed_time": "1 day, 3:30:31", "remaining_time": "2:17:49", "throughput": 1589.9, "total_tokens": 157450240} -{"current_steps": 19230, "total_steps": 20825, "loss": 0.8491, "learning_rate": 7.943126079097418e-07, "epoch": 0.9234093637454982, "percentage": 92.34, "elapsed_time": "1 day, 3:31:25", "remaining_time": "2:16:58", "throughput": 1589.87, "total_tokens": 157532160} -{"current_steps": 19240, "total_steps": 20825, "loss": 0.9703, "learning_rate": 7.844360522112737e-07, "epoch": 0.9238895558223289, "percentage": 92.39, "elapsed_time": "1 day, 3:32:28", "remaining_time": "2:16:07", "throughput": 1589.68, "total_tokens": 157614080} -{"current_steps": 19250, "total_steps": 20825, "loss": 0.8683, "learning_rate": 7.746203055112145e-07, "epoch": 0.9243697478991597, "percentage": 92.44, "elapsed_time": "1 day, 3:33:28", "remaining_time": "2:15:17", "throughput": 1589.54, "total_tokens": 157696000} -{"current_steps": 19260, "total_steps": 20825, "loss": 0.9395, "learning_rate": 7.648653924584137e-07, "epoch": 0.9248499399759904, "percentage": 92.48, "elapsed_time": "1 day, 3:34:31", "remaining_time": "2:14:26", "throughput": 1589.35, "total_tokens": 157777920} -{"current_steps": 19270, "total_steps": 20825, "loss": 0.84, "learning_rate": 7.55171337548946e-07, "epoch": 0.9253301320528211, "percentage": 92.53, "elapsed_time": "1 day, 3:35:24", "remaining_time": "2:13:35", "throughput": 1589.34, "total_tokens": 157859840} -{"current_steps": 19280, "total_steps": 20825, "loss": 0.7814, "learning_rate": 7.455381651260807e-07, "epoch": 0.9258103241296518, "percentage": 92.58, "elapsed_time": "1 day, 3:36:11", "remaining_time": "2:12:43", "throughput": 1589.41, "total_tokens": 157941760} -{"current_steps": 19290, "total_steps": 20825, "loss": 0.954, "learning_rate": 7.359658993801894e-07, "epoch": 0.9262905162064826, "percentage": 92.63, "elapsed_time": "1 day, 3:36:58", "remaining_time": "2:11:51", "throughput": 1589.49, "total_tokens": 158023680} -{"current_steps": 19300, "total_steps": 20825, "loss": 0.9109, "learning_rate": 7.264545643486997e-07, "epoch": 0.9267707082833133, "percentage": 92.68, "elapsed_time": "1 day, 3:37:46", "remaining_time": "2:10:59", "throughput": 1589.53, "total_tokens": 158105600} -{"current_steps": 19310, "total_steps": 20825, "loss": 0.9779, "learning_rate": 7.170041839160368e-07, "epoch": 0.927250900360144, "percentage": 92.73, "elapsed_time": "1 day, 3:38:38", "remaining_time": "2:10:07", "throughput": 1589.52, "total_tokens": 158187520} -{"current_steps": 19320, "total_steps": 20825, "loss": 0.8145, "learning_rate": 7.076147818135537e-07, "epoch": 0.9277310924369748, "percentage": 92.77, "elapsed_time": "1 day, 3:39:31", "remaining_time": "2:09:16", "throughput": 1589.51, "total_tokens": 158269440} -{"current_steps": 19330, "total_steps": 20825, "loss": 0.7036, "learning_rate": 6.982863816194812e-07, "epoch": 0.9282112845138055, "percentage": 92.82, "elapsed_time": "1 day, 3:40:33", "remaining_time": "2:08:25", "throughput": 1589.34, "total_tokens": 158351360} -{"current_steps": 19340, "total_steps": 20825, "loss": 0.8395, "learning_rate": 6.890190067588648e-07, "epoch": 0.9286914765906362, "percentage": 92.87, "elapsed_time": "1 day, 3:41:21", "remaining_time": "2:07:33", "throughput": 1589.39, "total_tokens": 158433280} -{"current_steps": 19350, "total_steps": 20825, "loss": 0.9633, "learning_rate": 6.798126805035082e-07, "epoch": 0.929171668667467, "percentage": 92.92, "elapsed_time": "1 day, 3:42:09", "remaining_time": "2:06:42", "throughput": 1589.45, "total_tokens": 158515200} -{"current_steps": 19360, "total_steps": 20825, "loss": 0.9551, "learning_rate": 6.706674259719048e-07, "epoch": 0.9296518607442977, "percentage": 92.97, "elapsed_time": "1 day, 3:42:57", "remaining_time": "2:05:50", "throughput": 1589.51, "total_tokens": 158597120} -{"current_steps": 19370, "total_steps": 20825, "loss": 0.895, "learning_rate": 6.615832661291954e-07, "epoch": 0.9301320528211284, "percentage": 93.01, "elapsed_time": "1 day, 3:43:46", "remaining_time": "2:04:58", "throughput": 1589.54, "total_tokens": 158679040} -{"current_steps": 19380, "total_steps": 20825, "loss": 0.7502, "learning_rate": 6.525602237870993e-07, "epoch": 0.9306122448979591, "percentage": 93.06, "elapsed_time": "1 day, 3:44:32", "remaining_time": "2:04:06", "throughput": 1589.63, "total_tokens": 158760960} -{"current_steps": 19390, "total_steps": 20825, "loss": 0.693, "learning_rate": 6.435983216038583e-07, "epoch": 0.9310924369747899, "percentage": 93.11, "elapsed_time": "1 day, 3:45:18", "remaining_time": "2:03:14", "throughput": 1589.73, "total_tokens": 158842880} -{"current_steps": 19400, "total_steps": 20825, "loss": 0.8507, "learning_rate": 6.346975820841927e-07, "epoch": 0.9315726290516206, "percentage": 93.16, "elapsed_time": "1 day, 3:46:05", "remaining_time": "2:02:22", "throughput": 1589.8, "total_tokens": 158924800} -{"current_steps": 19410, "total_steps": 20825, "loss": 0.9174, "learning_rate": 6.258580275792153e-07, "epoch": 0.9320528211284513, "percentage": 93.21, "elapsed_time": "1 day, 3:46:51", "remaining_time": "2:01:30", "throughput": 1589.88, "total_tokens": 159006720} -{"current_steps": 19420, "total_steps": 20825, "loss": 0.7601, "learning_rate": 6.170796802864115e-07, "epoch": 0.9325330132052821, "percentage": 93.25, "elapsed_time": "1 day, 3:47:37", "remaining_time": "2:00:38", "throughput": 1589.97, "total_tokens": 159088640} -{"current_steps": 19430, "total_steps": 20825, "loss": 0.8922, "learning_rate": 6.083625622495565e-07, "epoch": 0.9330132052821128, "percentage": 93.3, "elapsed_time": "1 day, 3:48:25", "remaining_time": "1:59:47", "throughput": 1590.04, "total_tokens": 159170560} -{"current_steps": 19440, "total_steps": 20825, "loss": 0.8506, "learning_rate": 5.997066953586761e-07, "epoch": 0.9334933973589435, "percentage": 93.35, "elapsed_time": "1 day, 3:49:13", "remaining_time": "1:58:55", "throughput": 1590.08, "total_tokens": 159252480} -{"current_steps": 19450, "total_steps": 20825, "loss": 0.801, "learning_rate": 5.911121013499721e-07, "epoch": 0.9339735894357744, "percentage": 93.4, "elapsed_time": "1 day, 3:49:59", "remaining_time": "1:58:03", "throughput": 1590.16, "total_tokens": 159334400} -{"current_steps": 19460, "total_steps": 20825, "loss": 0.8358, "learning_rate": 5.825788018057971e-07, "epoch": 0.934453781512605, "percentage": 93.45, "elapsed_time": "1 day, 3:51:42", "remaining_time": "1:57:15", "throughput": 1589.35, "total_tokens": 159416320} -{"current_steps": 19470, "total_steps": 20825, "loss": 1.0555, "learning_rate": 5.741068181545684e-07, "epoch": 0.9349339735894358, "percentage": 93.49, "elapsed_time": "1 day, 3:52:49", "remaining_time": "1:56:25", "throughput": 1589.11, "total_tokens": 159498240} -{"current_steps": 19480, "total_steps": 20825, "loss": 1.184, "learning_rate": 5.656961716707459e-07, "epoch": 0.9354141656662666, "percentage": 93.54, "elapsed_time": "1 day, 3:54:05", "remaining_time": "1:55:35", "throughput": 1588.72, "total_tokens": 159580160} -{"current_steps": 19490, "total_steps": 20825, "loss": 0.8181, "learning_rate": 5.57346883474752e-07, "epoch": 0.9358943577430973, "percentage": 93.59, "elapsed_time": "1 day, 3:55:23", "remaining_time": "1:54:45", "throughput": 1588.3, "total_tokens": 159662080} -{"current_steps": 19500, "total_steps": 20825, "loss": 0.9217, "learning_rate": 5.490589745329261e-07, "epoch": 0.936374549819928, "percentage": 93.64, "elapsed_time": "1 day, 3:56:33", "remaining_time": "1:53:55", "throughput": 1588.01, "total_tokens": 159744000} -{"current_steps": 19510, "total_steps": 20825, "loss": 1.0929, "learning_rate": 5.408324656574842e-07, "epoch": 0.9368547418967587, "percentage": 93.69, "elapsed_time": "1 day, 3:57:37", "remaining_time": "1:53:04", "throughput": 1587.81, "total_tokens": 159825920} -{"current_steps": 19520, "total_steps": 20825, "loss": 0.9711, "learning_rate": 5.326673775064545e-07, "epoch": 0.9373349339735895, "percentage": 93.73, "elapsed_time": "1 day, 3:58:45", "remaining_time": "1:52:13", "throughput": 1587.57, "total_tokens": 159907840} -{"current_steps": 19530, "total_steps": 20825, "loss": 0.872, "learning_rate": 5.245637305836243e-07, "epoch": 0.9378151260504202, "percentage": 93.78, "elapsed_time": "1 day, 3:59:32", "remaining_time": "1:51:22", "throughput": 1587.64, "total_tokens": 159989760} -{"current_steps": 19540, "total_steps": 20825, "loss": 0.8849, "learning_rate": 5.165215452384936e-07, "epoch": 0.9382953181272509, "percentage": 93.83, "elapsed_time": "1 day, 4:00:19", "remaining_time": "1:50:30", "throughput": 1587.71, "total_tokens": 160071680} -{"current_steps": 19550, "total_steps": 20825, "loss": 0.8509, "learning_rate": 5.085408416662274e-07, "epoch": 0.9387755102040817, "percentage": 93.88, "elapsed_time": "1 day, 4:01:05", "remaining_time": "1:49:38", "throughput": 1587.79, "total_tokens": 160153600} -{"current_steps": 19560, "total_steps": 20825, "loss": 0.9798, "learning_rate": 5.006216399075947e-07, "epoch": 0.9392557022809124, "percentage": 93.93, "elapsed_time": "1 day, 4:01:52", "remaining_time": "1:48:46", "throughput": 1587.86, "total_tokens": 160235520} -{"current_steps": 19570, "total_steps": 20825, "loss": 0.8332, "learning_rate": 4.92763959848927e-07, "epoch": 0.9397358943577431, "percentage": 93.97, "elapsed_time": "1 day, 4:02:39", "remaining_time": "1:47:54", "throughput": 1587.94, "total_tokens": 160317440} -{"current_steps": 19580, "total_steps": 20825, "loss": 0.9557, "learning_rate": 4.849678212220682e-07, "epoch": 0.9402160864345739, "percentage": 94.02, "elapsed_time": "1 day, 4:03:24", "remaining_time": "1:47:02", "throughput": 1588.04, "total_tokens": 160399360} -{"current_steps": 19590, "total_steps": 20825, "loss": 0.7306, "learning_rate": 4.772332436043165e-07, "epoch": 0.9406962785114046, "percentage": 94.07, "elapsed_time": "1 day, 4:04:11", "remaining_time": "1:46:10", "throughput": 1588.12, "total_tokens": 160481280} -{"current_steps": 19600, "total_steps": 20825, "loss": 0.9514, "learning_rate": 4.6956024641838237e-07, "epoch": 0.9411764705882353, "percentage": 94.12, "elapsed_time": "1 day, 4:04:57", "remaining_time": "1:45:18", "throughput": 1588.21, "total_tokens": 160563200} -{"current_steps": 19610, "total_steps": 20825, "loss": 0.9364, "learning_rate": 4.619488489323448e-07, "epoch": 0.941656662665066, "percentage": 94.17, "elapsed_time": "1 day, 4:05:44", "remaining_time": "1:44:26", "throughput": 1588.28, "total_tokens": 160645120} -{"current_steps": 19620, "total_steps": 20825, "loss": 1.0067, "learning_rate": 4.5439907025958405e-07, "epoch": 0.9421368547418968, "percentage": 94.21, "elapsed_time": "1 day, 4:06:31", "remaining_time": "1:43:34", "throughput": 1588.34, "total_tokens": 160727040} -{"current_steps": 19630, "total_steps": 20825, "loss": 0.985, "learning_rate": 4.4691092935876256e-07, "epoch": 0.9426170468187275, "percentage": 94.26, "elapsed_time": "1 day, 4:07:18", "remaining_time": "1:42:43", "throughput": 1588.41, "total_tokens": 160808960} -{"current_steps": 19640, "total_steps": 20825, "loss": 1.1212, "learning_rate": 4.394844450337443e-07, "epoch": 0.9430972388955582, "percentage": 94.31, "elapsed_time": "1 day, 4:08:05", "remaining_time": "1:41:51", "throughput": 1588.5, "total_tokens": 160890880} -{"current_steps": 19650, "total_steps": 20825, "loss": 1.0098, "learning_rate": 4.3211963593357275e-07, "epoch": 0.943577430972389, "percentage": 94.36, "elapsed_time": "1 day, 4:08:51", "remaining_time": "1:40:59", "throughput": 1588.57, "total_tokens": 160972800} -{"current_steps": 19660, "total_steps": 20825, "loss": 0.8137, "learning_rate": 4.248165205524152e-07, "epoch": 0.9440576230492197, "percentage": 94.41, "elapsed_time": "1 day, 4:09:39", "remaining_time": "1:40:07", "throughput": 1588.64, "total_tokens": 161054720} -{"current_steps": 19670, "total_steps": 20825, "loss": 0.9042, "learning_rate": 4.175751172295156e-07, "epoch": 0.9445378151260504, "percentage": 94.45, "elapsed_time": "1 day, 4:10:25", "remaining_time": "1:39:15", "throughput": 1588.71, "total_tokens": 161136640} -{"current_steps": 19680, "total_steps": 20825, "loss": 0.8619, "learning_rate": 4.1039544414914753e-07, "epoch": 0.9450180072028812, "percentage": 94.5, "elapsed_time": "1 day, 4:11:12", "remaining_time": "1:38:23", "throughput": 1588.8, "total_tokens": 161218560} -{"current_steps": 19690, "total_steps": 20825, "loss": 0.8915, "learning_rate": 4.032775193405752e-07, "epoch": 0.9454981992797119, "percentage": 94.55, "elapsed_time": "1 day, 4:11:59", "remaining_time": "1:37:31", "throughput": 1588.86, "total_tokens": 161300480} -{"current_steps": 19700, "total_steps": 20825, "loss": 0.815, "learning_rate": 3.96221360677998e-07, "epoch": 0.9459783913565426, "percentage": 94.6, "elapsed_time": "1 day, 4:12:47", "remaining_time": "1:36:40", "throughput": 1588.92, "total_tokens": 161382400} -{"current_steps": 19710, "total_steps": 20825, "loss": 0.9076, "learning_rate": 3.892269858805142e-07, "epoch": 0.9464585834333733, "percentage": 94.65, "elapsed_time": "1 day, 4:13:35", "remaining_time": "1:35:48", "throughput": 1588.97, "total_tokens": 161464320} -{"current_steps": 19720, "total_steps": 20825, "loss": 0.8012, "learning_rate": 3.82294412512077e-07, "epoch": 0.9469387755102041, "percentage": 94.69, "elapsed_time": "1 day, 4:14:24", "remaining_time": "1:34:56", "throughput": 1589.02, "total_tokens": 161546240} -{"current_steps": 19730, "total_steps": 20825, "loss": 0.8382, "learning_rate": 3.7542365798143573e-07, "epoch": 0.9474189675870348, "percentage": 94.74, "elapsed_time": "1 day, 4:15:11", "remaining_time": "1:34:04", "throughput": 1589.08, "total_tokens": 161628160} -{"current_steps": 19740, "total_steps": 20825, "loss": 1.0418, "learning_rate": 3.6861473954210855e-07, "epoch": 0.9478991596638655, "percentage": 94.79, "elapsed_time": "1 day, 4:15:58", "remaining_time": "1:33:13", "throughput": 1589.16, "total_tokens": 161710080} -{"current_steps": 19750, "total_steps": 20825, "loss": 0.7393, "learning_rate": 3.6186767429234323e-07, "epoch": 0.9483793517406963, "percentage": 94.84, "elapsed_time": "1 day, 4:16:45", "remaining_time": "1:32:21", "throughput": 1589.23, "total_tokens": 161792000} -{"current_steps": 19760, "total_steps": 20825, "loss": 0.8615, "learning_rate": 3.5518247917505077e-07, "epoch": 0.948859543817527, "percentage": 94.89, "elapsed_time": "1 day, 4:17:30", "remaining_time": "1:31:29", "throughput": 1589.32, "total_tokens": 161873920} -{"current_steps": 19770, "total_steps": 20825, "loss": 1.041, "learning_rate": 3.485591709777802e-07, "epoch": 0.9493397358943577, "percentage": 94.93, "elapsed_time": "1 day, 4:18:16", "remaining_time": "1:30:37", "throughput": 1589.41, "total_tokens": 161955840} -{"current_steps": 19780, "total_steps": 20825, "loss": 0.813, "learning_rate": 3.419977663326801e-07, "epoch": 0.9498199279711885, "percentage": 94.98, "elapsed_time": "1 day, 4:19:02", "remaining_time": "1:29:45", "throughput": 1589.5, "total_tokens": 162037760} -{"current_steps": 19790, "total_steps": 20825, "loss": 1.2698, "learning_rate": 3.3549828171644537e-07, "epoch": 0.9503001200480192, "percentage": 95.03, "elapsed_time": "1 day, 4:19:47", "remaining_time": "1:28:53", "throughput": 1589.6, "total_tokens": 162119680} -{"current_steps": 19800, "total_steps": 20825, "loss": 0.8896, "learning_rate": 3.29060733450276e-07, "epoch": 0.9507803121248499, "percentage": 95.08, "elapsed_time": "1 day, 4:20:34", "remaining_time": "1:28:02", "throughput": 1589.68, "total_tokens": 162201600} -{"current_steps": 19810, "total_steps": 20825, "loss": 1.0284, "learning_rate": 3.2268513769984634e-07, "epoch": 0.9512605042016806, "percentage": 95.13, "elapsed_time": "1 day, 4:21:20", "remaining_time": "1:27:10", "throughput": 1589.76, "total_tokens": 162283520} -{"current_steps": 19820, "total_steps": 20825, "loss": 0.9543, "learning_rate": 3.163715104752524e-07, "epoch": 0.9517406962785114, "percentage": 95.17, "elapsed_time": "1 day, 4:22:06", "remaining_time": "1:26:18", "throughput": 1589.85, "total_tokens": 162365440} -{"current_steps": 19830, "total_steps": 20825, "loss": 0.9059, "learning_rate": 3.101198676309841e-07, "epoch": 0.9522208883553421, "percentage": 95.22, "elapsed_time": "1 day, 4:22:51", "remaining_time": "1:25:26", "throughput": 1589.94, "total_tokens": 162447360} -{"current_steps": 19840, "total_steps": 20825, "loss": 0.9259, "learning_rate": 3.039302248658754e-07, "epoch": 0.9527010804321728, "percentage": 95.27, "elapsed_time": "1 day, 4:23:37", "remaining_time": "1:24:34", "throughput": 1590.03, "total_tokens": 162529280} -{"current_steps": 19850, "total_steps": 20825, "loss": 1.0082, "learning_rate": 2.978025977230736e-07, "epoch": 0.9531812725090036, "percentage": 95.32, "elapsed_time": "1 day, 4:24:25", "remaining_time": "1:23:43", "throughput": 1590.09, "total_tokens": 162611200} -{"current_steps": 19860, "total_steps": 20825, "loss": 0.9153, "learning_rate": 2.91737001589984e-07, "epoch": 0.9536614645858343, "percentage": 95.37, "elapsed_time": "1 day, 4:25:16", "remaining_time": "1:22:51", "throughput": 1590.1, "total_tokens": 162693120} -{"current_steps": 19870, "total_steps": 20825, "loss": 0.9446, "learning_rate": 2.8573345169825296e-07, "epoch": 0.954141656662665, "percentage": 95.41, "elapsed_time": "1 day, 4:26:04", "remaining_time": "1:21:59", "throughput": 1590.15, "total_tokens": 162775040} -{"current_steps": 19880, "total_steps": 20825, "loss": 0.7736, "learning_rate": 2.797919631237156e-07, "epoch": 0.9546218487394958, "percentage": 95.46, "elapsed_time": "1 day, 4:26:50", "remaining_time": "1:21:08", "throughput": 1590.24, "total_tokens": 162856960} -{"current_steps": 19890, "total_steps": 20825, "loss": 0.9343, "learning_rate": 2.739125507863649e-07, "epoch": 0.9551020408163265, "percentage": 95.51, "elapsed_time": "1 day, 4:27:40", "remaining_time": "1:20:16", "throughput": 1590.26, "total_tokens": 162938880} -{"current_steps": 19900, "total_steps": 20825, "loss": 0.9554, "learning_rate": 2.680952294503075e-07, "epoch": 0.9555822328931572, "percentage": 95.56, "elapsed_time": "1 day, 4:28:33", "remaining_time": "1:19:25", "throughput": 1590.24, "total_tokens": 163020800} -{"current_steps": 19910, "total_steps": 20825, "loss": 0.9323, "learning_rate": 2.6234001372372194e-07, "epoch": 0.956062424969988, "percentage": 95.61, "elapsed_time": "1 day, 4:29:21", "remaining_time": "1:18:33", "throughput": 1590.29, "total_tokens": 163102720} -{"current_steps": 19920, "total_steps": 20825, "loss": 0.9947, "learning_rate": 2.5664691805884767e-07, "epoch": 0.9565426170468188, "percentage": 95.65, "elapsed_time": "1 day, 4:30:09", "remaining_time": "1:17:41", "throughput": 1590.35, "total_tokens": 163184640} -{"current_steps": 19930, "total_steps": 20825, "loss": 0.9797, "learning_rate": 2.5101595675191827e-07, "epoch": 0.9570228091236495, "percentage": 95.7, "elapsed_time": "1 day, 4:30:56", "remaining_time": "1:16:49", "throughput": 1590.42, "total_tokens": 163266560} -{"current_steps": 19940, "total_steps": 20825, "loss": 0.9892, "learning_rate": 2.4544714394314215e-07, "epoch": 0.9575030012004802, "percentage": 95.75, "elapsed_time": "1 day, 4:31:41", "remaining_time": "1:15:58", "throughput": 1590.51, "total_tokens": 163348480} -{"current_steps": 19950, "total_steps": 20825, "loss": 1.171, "learning_rate": 2.399404936166638e-07, "epoch": 0.957983193277311, "percentage": 95.8, "elapsed_time": "1 day, 4:32:28", "remaining_time": "1:15:06", "throughput": 1590.58, "total_tokens": 163430400} -{"current_steps": 19960, "total_steps": 20825, "loss": 0.7551, "learning_rate": 2.3449601960052746e-07, "epoch": 0.9584633853541417, "percentage": 95.85, "elapsed_time": "1 day, 4:33:13", "remaining_time": "1:14:14", "throughput": 1590.68, "total_tokens": 163512320} -{"current_steps": 19970, "total_steps": 20825, "loss": 0.7974, "learning_rate": 2.2911373556664118e-07, "epoch": 0.9589435774309724, "percentage": 95.89, "elapsed_time": "1 day, 4:34:01", "remaining_time": "1:13:23", "throughput": 1590.75, "total_tokens": 163594240} -{"current_steps": 19980, "total_steps": 20825, "loss": 0.8963, "learning_rate": 2.23793655030749e-07, "epoch": 0.9594237695078032, "percentage": 95.94, "elapsed_time": "1 day, 4:34:46", "remaining_time": "1:12:31", "throughput": 1590.84, "total_tokens": 163676160} -{"current_steps": 19990, "total_steps": 20825, "loss": 0.9377, "learning_rate": 2.1853579135238667e-07, "epoch": 0.9599039615846339, "percentage": 95.99, "elapsed_time": "1 day, 4:35:32", "remaining_time": "1:11:39", "throughput": 1590.92, "total_tokens": 163758080} -{"current_steps": 20000, "total_steps": 20825, "loss": 1.0792, "learning_rate": 2.1334015773486203e-07, "epoch": 0.9603841536614646, "percentage": 96.04, "elapsed_time": "1 day, 4:36:19", "remaining_time": "1:10:47", "throughput": 1590.99, "total_tokens": 163840000} -{"current_steps": 20010, "total_steps": 20825, "loss": 0.7725, "learning_rate": 2.0820676722520526e-07, "epoch": 0.9608643457382953, "percentage": 96.09, "elapsed_time": "1 day, 4:37:10", "remaining_time": "1:09:56", "throughput": 1591.01, "total_tokens": 163921920} -{"current_steps": 20020, "total_steps": 20825, "loss": 0.8982, "learning_rate": 2.0313563271414927e-07, "epoch": 0.9613445378151261, "percentage": 96.13, "elapsed_time": "1 day, 4:37:55", "remaining_time": "1:09:04", "throughput": 1591.1, "total_tokens": 164003840} -{"current_steps": 20030, "total_steps": 20825, "loss": 0.7376, "learning_rate": 1.9812676693608812e-07, "epoch": 0.9618247298919568, "percentage": 96.18, "elapsed_time": "1 day, 4:38:42", "remaining_time": "1:08:12", "throughput": 1591.18, "total_tokens": 164085760} -{"current_steps": 20040, "total_steps": 20825, "loss": 0.8378, "learning_rate": 1.9318018246905488e-07, "epoch": 0.9623049219687875, "percentage": 96.23, "elapsed_time": "1 day, 4:39:27", "remaining_time": "1:07:21", "throughput": 1591.27, "total_tokens": 164167680} -{"current_steps": 20050, "total_steps": 20825, "loss": 0.8883, "learning_rate": 1.8829589173468552e-07, "epoch": 0.9627851140456183, "percentage": 96.28, "elapsed_time": "1 day, 4:40:13", "remaining_time": "1:06:29", "throughput": 1591.36, "total_tokens": 164249600} -{"current_steps": 20060, "total_steps": 20825, "loss": 0.7442, "learning_rate": 1.8347390699817724e-07, "epoch": 0.963265306122449, "percentage": 96.33, "elapsed_time": "1 day, 4:40:59", "remaining_time": "1:05:37", "throughput": 1591.45, "total_tokens": 164331520} -{"current_steps": 20070, "total_steps": 20825, "loss": 0.9274, "learning_rate": 1.7871424036828288e-07, "epoch": 0.9637454981992797, "percentage": 96.37, "elapsed_time": "1 day, 4:41:44", "remaining_time": "1:04:46", "throughput": 1591.54, "total_tokens": 164413440} -{"current_steps": 20080, "total_steps": 20825, "loss": 0.9755, "learning_rate": 1.7401690379724722e-07, "epoch": 0.9642256902761105, "percentage": 96.42, "elapsed_time": "1 day, 4:42:30", "remaining_time": "1:03:54", "throughput": 1591.62, "total_tokens": 164495360} -{"current_steps": 20090, "total_steps": 20825, "loss": 0.8417, "learning_rate": 1.6938190908080688e-07, "epoch": 0.9647058823529412, "percentage": 96.47, "elapsed_time": "1 day, 4:43:16", "remaining_time": "1:03:02", "throughput": 1591.71, "total_tokens": 164577280} -{"current_steps": 20100, "total_steps": 20825, "loss": 0.7835, "learning_rate": 1.6480926785814866e-07, "epoch": 0.9651860744297719, "percentage": 96.52, "elapsed_time": "1 day, 4:44:01", "remaining_time": "1:02:11", "throughput": 1591.81, "total_tokens": 164659200} -{"current_steps": 20110, "total_steps": 20825, "loss": 1.0117, "learning_rate": 1.6029899161187079e-07, "epoch": 0.9656662665066026, "percentage": 96.57, "elapsed_time": "1 day, 4:44:46", "remaining_time": "1:01:19", "throughput": 1591.91, "total_tokens": 164741120} -{"current_steps": 20120, "total_steps": 20825, "loss": 0.7976, "learning_rate": 1.5585109166796896e-07, "epoch": 0.9661464585834334, "percentage": 96.61, "elapsed_time": "1 day, 4:45:31", "remaining_time": "1:00:27", "throughput": 1592.0, "total_tokens": 164823040} -{"current_steps": 20130, "total_steps": 20825, "loss": 0.9373, "learning_rate": 1.5146557919581138e-07, "epoch": 0.9666266506602641, "percentage": 96.66, "elapsed_time": "1 day, 4:46:16", "remaining_time": "0:59:36", "throughput": 1592.11, "total_tokens": 164904960} -{"current_steps": 20140, "total_steps": 20825, "loss": 0.717, "learning_rate": 1.4714246520808328e-07, "epoch": 0.9671068427370948, "percentage": 96.71, "elapsed_time": "1 day, 4:47:01", "remaining_time": "0:58:44", "throughput": 1592.2, "total_tokens": 164986880} -{"current_steps": 20150, "total_steps": 20825, "loss": 0.8526, "learning_rate": 1.4288176056079238e-07, "epoch": 0.9675870348139256, "percentage": 96.76, "elapsed_time": "1 day, 4:47:48", "remaining_time": "0:57:52", "throughput": 1592.28, "total_tokens": 165068800} -{"current_steps": 20160, "total_steps": 20825, "loss": 0.8959, "learning_rate": 1.3868347595322184e-07, "epoch": 0.9680672268907563, "percentage": 96.81, "elapsed_time": "1 day, 4:48:33", "remaining_time": "0:57:01", "throughput": 1592.38, "total_tokens": 165150720} -{"current_steps": 20170, "total_steps": 20825, "loss": 1.1636, "learning_rate": 1.3454762192790794e-07, "epoch": 0.968547418967587, "percentage": 96.85, "elapsed_time": "1 day, 4:49:18", "remaining_time": "0:56:09", "throughput": 1592.47, "total_tokens": 165232640} -{"current_steps": 20180, "total_steps": 20825, "loss": 1.0033, "learning_rate": 1.3047420887061513e-07, "epoch": 0.9690276110444178, "percentage": 96.9, "elapsed_time": "1 day, 4:50:04", "remaining_time": "0:55:17", "throughput": 1592.56, "total_tokens": 165314560} -{"current_steps": 20190, "total_steps": 20825, "loss": 0.8926, "learning_rate": 1.264632470103111e-07, "epoch": 0.9695078031212485, "percentage": 96.95, "elapsed_time": "1 day, 4:50:49", "remaining_time": "0:54:26", "throughput": 1592.65, "total_tokens": 165396480} -{"current_steps": 20200, "total_steps": 20825, "loss": 0.9251, "learning_rate": 1.225147464191334e-07, "epoch": 0.9699879951980792, "percentage": 97.0, "elapsed_time": "1 day, 4:51:35", "remaining_time": "0:53:34", "throughput": 1592.74, "total_tokens": 165478400} -{"current_steps": 20210, "total_steps": 20825, "loss": 0.754, "learning_rate": 1.1862871701237288e-07, "epoch": 0.9704681872749099, "percentage": 97.05, "elapsed_time": "1 day, 4:52:21", "remaining_time": "0:52:42", "throughput": 1592.83, "total_tokens": 165560320} -{"current_steps": 20220, "total_steps": 20825, "loss": 0.799, "learning_rate": 1.1480516854844858e-07, "epoch": 0.9709483793517407, "percentage": 97.09, "elapsed_time": "1 day, 4:53:07", "remaining_time": "0:51:51", "throughput": 1592.9, "total_tokens": 165642240} -{"current_steps": 20230, "total_steps": 20825, "loss": 0.797, "learning_rate": 1.1104411062887732e-07, "epoch": 0.9714285714285714, "percentage": 97.14, "elapsed_time": "1 day, 4:53:54", "remaining_time": "0:50:59", "throughput": 1592.98, "total_tokens": 165724160} -{"current_steps": 20240, "total_steps": 20825, "loss": 0.7708, "learning_rate": 1.0734555269825141e-07, "epoch": 0.9719087635054021, "percentage": 97.19, "elapsed_time": "1 day, 4:54:41", "remaining_time": "0:50:08", "throughput": 1593.05, "total_tokens": 165806080} -{"current_steps": 20250, "total_steps": 20825, "loss": 0.7448, "learning_rate": 1.0370950404421931e-07, "epoch": 0.9723889555822329, "percentage": 97.24, "elapsed_time": "1 day, 4:55:29", "remaining_time": "0:49:16", "throughput": 1593.09, "total_tokens": 165888000} -{"current_steps": 20260, "total_steps": 20825, "loss": 0.8983, "learning_rate": 1.0013597379745776e-07, "epoch": 0.9728691476590636, "percentage": 97.29, "elapsed_time": "1 day, 4:56:17", "remaining_time": "0:48:25", "throughput": 1593.15, "total_tokens": 165969920} -{"current_steps": 20270, "total_steps": 20825, "loss": 0.7648, "learning_rate": 9.662497093164691e-08, "epoch": 0.9733493397358943, "percentage": 97.33, "elapsed_time": "1 day, 4:57:04", "remaining_time": "0:47:33", "throughput": 1593.22, "total_tokens": 166051840} -{"current_steps": 20280, "total_steps": 20825, "loss": 0.9752, "learning_rate": 9.317650426345637e-08, "epoch": 0.9738295318127251, "percentage": 97.38, "elapsed_time": "1 day, 4:57:50", "remaining_time": "0:46:42", "throughput": 1593.29, "total_tokens": 166133760} -{"current_steps": 20290, "total_steps": 20825, "loss": 0.8632, "learning_rate": 8.979058245251193e-08, "epoch": 0.9743097238895558, "percentage": 97.43, "elapsed_time": "1 day, 4:58:36", "remaining_time": "0:45:50", "throughput": 1593.38, "total_tokens": 166215680} -{"current_steps": 20300, "total_steps": 20825, "loss": 1.0177, "learning_rate": 8.646721400138724e-08, "epoch": 0.9747899159663865, "percentage": 97.48, "elapsed_time": "1 day, 4:59:22", "remaining_time": "0:44:59", "throughput": 1593.46, "total_tokens": 166297600} -{"current_steps": 20310, "total_steps": 20825, "loss": 0.9075, "learning_rate": 8.320640725556773e-08, "epoch": 0.9752701080432172, "percentage": 97.53, "elapsed_time": "1 day, 5:00:08", "remaining_time": "0:44:07", "throughput": 1593.54, "total_tokens": 166379520} -{"current_steps": 20320, "total_steps": 20825, "loss": 0.9434, "learning_rate": 8.000817040344222e-08, "epoch": 0.975750300120048, "percentage": 97.58, "elapsed_time": "1 day, 5:00:54", "remaining_time": "0:43:15", "throughput": 1593.63, "total_tokens": 166461440} -{"current_steps": 20330, "total_steps": 20825, "loss": 0.8307, "learning_rate": 7.687251147627251e-08, "epoch": 0.9762304921968787, "percentage": 97.62, "elapsed_time": "1 day, 5:01:39", "remaining_time": "0:42:24", "throughput": 1593.72, "total_tokens": 166543360} -{"current_steps": 20340, "total_steps": 20825, "loss": 0.7942, "learning_rate": 7.379943834818214e-08, "epoch": 0.9767106842737094, "percentage": 97.67, "elapsed_time": "1 day, 5:02:25", "remaining_time": "0:41:32", "throughput": 1593.8, "total_tokens": 166625280} -{"current_steps": 20350, "total_steps": 20825, "loss": 0.6887, "learning_rate": 7.0788958736126e-08, "epoch": 0.9771908763505402, "percentage": 97.72, "elapsed_time": "1 day, 5:03:11", "remaining_time": "0:40:41", "throughput": 1593.89, "total_tokens": 166707200} -{"current_steps": 20360, "total_steps": 20825, "loss": 0.8574, "learning_rate": 6.784108019988189e-08, "epoch": 0.977671068427371, "percentage": 97.77, "elapsed_time": "1 day, 5:03:59", "remaining_time": "0:39:49", "throughput": 1593.94, "total_tokens": 166789120} -{"current_steps": 20370, "total_steps": 20825, "loss": 0.7726, "learning_rate": 6.495581014202556e-08, "epoch": 0.9781512605042016, "percentage": 97.82, "elapsed_time": "1 day, 5:04:46", "remaining_time": "0:38:58", "throughput": 1594.0, "total_tokens": 166871040} -{"current_steps": 20380, "total_steps": 20825, "loss": 0.9247, "learning_rate": 6.213315580791135e-08, "epoch": 0.9786314525810325, "percentage": 97.86, "elapsed_time": "1 day, 5:05:35", "remaining_time": "0:38:06", "throughput": 1594.04, "total_tokens": 166952960} -{"current_steps": 20390, "total_steps": 20825, "loss": 0.8177, "learning_rate": 5.9373124285661e-08, "epoch": 0.9791116446578632, "percentage": 97.91, "elapsed_time": "1 day, 5:06:23", "remaining_time": "0:37:15", "throughput": 1594.1, "total_tokens": 167034880} -{"current_steps": 20400, "total_steps": 20825, "loss": 0.8603, "learning_rate": 5.6675722506135956e-08, "epoch": 0.9795918367346939, "percentage": 97.96, "elapsed_time": "1 day, 5:07:09", "remaining_time": "0:36:23", "throughput": 1594.17, "total_tokens": 167116800} -{"current_steps": 20410, "total_steps": 20825, "loss": 0.9751, "learning_rate": 5.404095724292346e-08, "epoch": 0.9800720288115247, "percentage": 98.01, "elapsed_time": "1 day, 5:08:09", "remaining_time": "0:35:32", "throughput": 1594.05, "total_tokens": 167198720} -{"current_steps": 20420, "total_steps": 20825, "loss": 0.9047, "learning_rate": 5.146883511232825e-08, "epoch": 0.9805522208883554, "percentage": 98.06, "elapsed_time": "1 day, 5:09:06", "remaining_time": "0:34:41", "throughput": 1593.96, "total_tokens": 167280640} -{"current_steps": 20430, "total_steps": 20825, "loss": 0.8816, "learning_rate": 4.8959362573341995e-08, "epoch": 0.9810324129651861, "percentage": 98.1, "elapsed_time": "1 day, 5:09:58", "remaining_time": "0:33:50", "throughput": 1593.95, "total_tokens": 167362560} -{"current_steps": 20440, "total_steps": 20825, "loss": 0.8182, "learning_rate": 4.6512545927632213e-08, "epoch": 0.9815126050420168, "percentage": 98.15, "elapsed_time": "1 day, 5:10:53", "remaining_time": "0:32:58", "throughput": 1593.9, "total_tokens": 167444480} -{"current_steps": 20450, "total_steps": 20825, "loss": 0.8999, "learning_rate": 4.412839131953395e-08, "epoch": 0.9819927971188476, "percentage": 98.2, "elapsed_time": "1 day, 5:11:41", "remaining_time": "0:32:07", "throughput": 1593.95, "total_tokens": 167526400} -{"current_steps": 20460, "total_steps": 20825, "loss": 0.9972, "learning_rate": 4.180690473602755e-08, "epoch": 0.9824729891956783, "percentage": 98.25, "elapsed_time": "1 day, 5:12:31", "remaining_time": "0:31:15", "throughput": 1593.96, "total_tokens": 167608320} -{"current_steps": 20470, "total_steps": 20825, "loss": 0.7583, "learning_rate": 3.9548092006719275e-08, "epoch": 0.982953181272509, "percentage": 98.3, "elapsed_time": "1 day, 5:13:19", "remaining_time": "0:30:24", "throughput": 1594.02, "total_tokens": 167690240} -{"current_steps": 20480, "total_steps": 20825, "loss": 1.0416, "learning_rate": 3.7351958803835685e-08, "epoch": 0.9834333733493398, "percentage": 98.34, "elapsed_time": "1 day, 5:14:08", "remaining_time": "0:29:32", "throughput": 1594.06, "total_tokens": 167772160} -{"current_steps": 20490, "total_steps": 20825, "loss": 1.1318, "learning_rate": 3.5218510642201496e-08, "epoch": 0.9839135654261705, "percentage": 98.39, "elapsed_time": "1 day, 5:14:54", "remaining_time": "0:28:41", "throughput": 1594.14, "total_tokens": 167854080} -{"current_steps": 20500, "total_steps": 20825, "loss": 1.0568, "learning_rate": 3.314775287923677e-08, "epoch": 0.9843937575030012, "percentage": 98.44, "elapsed_time": "1 day, 5:15:44", "remaining_time": "0:27:50", "throughput": 1594.16, "total_tokens": 167936000} -{"current_steps": 20510, "total_steps": 20825, "loss": 0.9061, "learning_rate": 3.1139690714931945e-08, "epoch": 0.984873949579832, "percentage": 98.49, "elapsed_time": "1 day, 5:16:34", "remaining_time": "0:26:58", "throughput": 1594.18, "total_tokens": 168017920} -{"current_steps": 20520, "total_steps": 20825, "loss": 0.7413, "learning_rate": 2.919432919183396e-08, "epoch": 0.9853541416566627, "percentage": 98.54, "elapsed_time": "1 day, 5:17:22", "remaining_time": "0:26:07", "throughput": 1594.23, "total_tokens": 168099840} -{"current_steps": 20530, "total_steps": 20825, "loss": 0.7303, "learning_rate": 2.731167319505179e-08, "epoch": 0.9858343337334934, "percentage": 98.58, "elapsed_time": "1 day, 5:18:09", "remaining_time": "0:25:15", "throughput": 1594.3, "total_tokens": 168181760} -{"current_steps": 20540, "total_steps": 20825, "loss": 0.763, "learning_rate": 2.5491727452217616e-08, "epoch": 0.9863145258103241, "percentage": 98.63, "elapsed_time": "1 day, 5:18:56", "remaining_time": "0:24:24", "throughput": 1594.36, "total_tokens": 168263680} -{"current_steps": 20550, "total_steps": 20825, "loss": 0.9044, "learning_rate": 2.3734496533497907e-08, "epoch": 0.9867947178871549, "percentage": 98.68, "elapsed_time": "1 day, 5:19:44", "remaining_time": "0:23:32", "throughput": 1594.42, "total_tokens": 168345600} -{"current_steps": 20560, "total_steps": 20825, "loss": 0.9609, "learning_rate": 2.203998485156844e-08, "epoch": 0.9872749099639856, "percentage": 98.73, "elapsed_time": "1 day, 5:20:30", "remaining_time": "0:22:41", "throughput": 1594.49, "total_tokens": 168427520} -{"current_steps": 20570, "total_steps": 20825, "loss": 1.0561, "learning_rate": 2.040819666160876e-08, "epoch": 0.9877551020408163, "percentage": 98.78, "elapsed_time": "1 day, 5:21:16", "remaining_time": "0:21:50", "throughput": 1594.58, "total_tokens": 168509440} -{"current_steps": 20580, "total_steps": 20825, "loss": 1.0402, "learning_rate": 1.8839136061288288e-08, "epoch": 0.9882352941176471, "percentage": 98.82, "elapsed_time": "1 day, 5:22:02", "remaining_time": "0:20:58", "throughput": 1594.66, "total_tokens": 168591360} -{"current_steps": 20590, "total_steps": 20825, "loss": 1.1063, "learning_rate": 1.7332806990758012e-08, "epoch": 0.9887154861944778, "percentage": 98.87, "elapsed_time": "1 day, 5:22:48", "remaining_time": "0:20:07", "throughput": 1594.74, "total_tokens": 168673280} -{"current_steps": 20600, "total_steps": 20825, "loss": 0.8762, "learning_rate": 1.5889213232644917e-08, "epoch": 0.9891956782713085, "percentage": 98.92, "elapsed_time": "1 day, 5:23:34", "remaining_time": "0:19:15", "throughput": 1594.82, "total_tokens": 168755200} -{"current_steps": 20610, "total_steps": 20825, "loss": 1.2618, "learning_rate": 1.4508358412032575e-08, "epoch": 0.9896758703481393, "percentage": 98.97, "elapsed_time": "1 day, 5:24:19", "remaining_time": "0:18:24", "throughput": 1594.91, "total_tokens": 168837120} -{"current_steps": 20620, "total_steps": 20825, "loss": 0.959, "learning_rate": 1.319024599645835e-08, "epoch": 0.99015606242497, "percentage": 99.02, "elapsed_time": "1 day, 5:25:05", "remaining_time": "0:17:32", "throughput": 1595.0, "total_tokens": 168919040} -{"current_steps": 20630, "total_steps": 20825, "loss": 0.7467, "learning_rate": 1.1934879295905089e-08, "epoch": 0.9906362545018007, "percentage": 99.06, "elapsed_time": "1 day, 5:25:51", "remaining_time": "0:16:41", "throughput": 1595.08, "total_tokens": 169000960} -{"current_steps": 20640, "total_steps": 20825, "loss": 1.0644, "learning_rate": 1.074226146279278e-08, "epoch": 0.9911164465786314, "percentage": 99.11, "elapsed_time": "1 day, 5:26:36", "remaining_time": "0:15:50", "throughput": 1595.18, "total_tokens": 169082880} -{"current_steps": 20650, "total_steps": 20825, "loss": 1.036, "learning_rate": 9.612395491970239e-09, "epoch": 0.9915966386554622, "percentage": 99.16, "elapsed_time": "1 day, 5:27:21", "remaining_time": "0:14:58", "throughput": 1595.26, "total_tokens": 169164800} -{"current_steps": 20660, "total_steps": 20825, "loss": 0.8798, "learning_rate": 8.545284220698446e-09, "epoch": 0.9920768307322929, "percentage": 99.21, "elapsed_time": "1 day, 5:28:06", "remaining_time": "0:14:07", "throughput": 1595.36, "total_tokens": 169246720} -{"current_steps": 20670, "total_steps": 20825, "loss": 0.848, "learning_rate": 7.540930328658879e-09, "epoch": 0.9925570228091236, "percentage": 99.26, "elapsed_time": "1 day, 5:28:51", "remaining_time": "0:13:15", "throughput": 1595.45, "total_tokens": 169328640} -{"current_steps": 20680, "total_steps": 20825, "loss": 1.0114, "learning_rate": 6.599336337942408e-09, "epoch": 0.9930372148859544, "percentage": 99.3, "elapsed_time": "1 day, 5:29:37", "remaining_time": "0:12:24", "throughput": 1595.54, "total_tokens": 169410560} -{"current_steps": 20690, "total_steps": 20825, "loss": 0.7468, "learning_rate": 5.720504613035416e-09, "epoch": 0.9935174069627851, "percentage": 99.35, "elapsed_time": "1 day, 5:30:22", "remaining_time": "0:11:33", "throughput": 1595.63, "total_tokens": 169492480} -{"current_steps": 20700, "total_steps": 20825, "loss": 0.8409, "learning_rate": 4.904437360814252e-09, "epoch": 0.9939975990396158, "percentage": 99.4, "elapsed_time": "1 day, 5:31:08", "remaining_time": "0:10:41", "throughput": 1595.72, "total_tokens": 169574400} -{"current_steps": 20710, "total_steps": 20825, "loss": 1.024, "learning_rate": 4.151136630553554e-09, "epoch": 0.9944777911164466, "percentage": 99.45, "elapsed_time": "1 day, 5:31:53", "remaining_time": "0:09:50", "throughput": 1595.81, "total_tokens": 169656320} -{"current_steps": 20720, "total_steps": 20825, "loss": 1.1108, "learning_rate": 3.4606043139068234e-09, "epoch": 0.9949579831932773, "percentage": 99.5, "elapsed_time": "1 day, 5:32:39", "remaining_time": "0:08:58", "throughput": 1595.9, "total_tokens": 169738240} -{"current_steps": 20730, "total_steps": 20825, "loss": 0.9724, "learning_rate": 2.832842144903647e-09, "epoch": 0.995438175270108, "percentage": 99.54, "elapsed_time": "1 day, 5:33:24", "remaining_time": "0:08:07", "throughput": 1595.99, "total_tokens": 169820160} -{"current_steps": 20740, "total_steps": 20825, "loss": 0.7679, "learning_rate": 2.2678516999552478e-09, "epoch": 0.9959183673469387, "percentage": 99.59, "elapsed_time": "1 day, 5:34:09", "remaining_time": "0:07:16", "throughput": 1596.07, "total_tokens": 169902080} -{"current_steps": 20750, "total_steps": 20825, "loss": 0.9723, "learning_rate": 1.7656343978378342e-09, "epoch": 0.9963985594237695, "percentage": 99.64, "elapsed_time": "1 day, 5:34:55", "remaining_time": "0:06:24", "throughput": 1596.16, "total_tokens": 169984000} -{"current_steps": 20760, "total_steps": 20825, "loss": 1.1212, "learning_rate": 1.3261914996953728e-09, "epoch": 0.9968787515006002, "percentage": 99.69, "elapsed_time": "1 day, 5:35:40", "remaining_time": "0:05:33", "throughput": 1596.26, "total_tokens": 170065920} -{"current_steps": 20770, "total_steps": 20825, "loss": 0.9877, "learning_rate": 9.49524109034039e-10, "epoch": 0.9973589435774309, "percentage": 99.74, "elapsed_time": "1 day, 5:36:25", "remaining_time": "0:04:42", "throughput": 1596.35, "total_tokens": 170147840} -{"current_steps": 20780, "total_steps": 20825, "loss": 0.8818, "learning_rate": 6.356331717305431e-10, "epoch": 0.9978391356542617, "percentage": 99.78, "elapsed_time": "1 day, 5:37:10", "remaining_time": "0:03:50", "throughput": 1596.44, "total_tokens": 170229760} -{"current_steps": 20790, "total_steps": 20825, "loss": 0.9168, "learning_rate": 3.8451947600437466e-10, "epoch": 0.9983193277310924, "percentage": 99.83, "elapsed_time": "1 day, 5:37:55", "remaining_time": "0:02:59", "throughput": 1596.53, "total_tokens": 170311680} -{"current_steps": 20800, "total_steps": 20825, "loss": 0.8026, "learning_rate": 1.9618365244833404e-10, "epoch": 0.9987995198079231, "percentage": 99.88, "elapsed_time": "1 day, 5:38:41", "remaining_time": "0:02:08", "throughput": 1596.62, "total_tokens": 170393600} -{"current_steps": 20810, "total_steps": 20825, "loss": 0.9025, "learning_rate": 7.062617399800075e-11, "epoch": 0.999279711884754, "percentage": 99.93, "elapsed_time": "1 day, 5:39:26", "remaining_time": "0:01:16", "throughput": 1596.71, "total_tokens": 170475520} -{"current_steps": 20820, "total_steps": 20825, "loss": 0.9373, "learning_rate": 7.847355951162705e-12, "epoch": 0.9997599039615847, "percentage": 99.98, "elapsed_time": "1 day, 5:40:11", "remaining_time": "0:00:25", "throughput": 1596.8, "total_tokens": 170557440} -{"current_steps": 20825, "total_steps": 20825, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "1 day, 5:40:37", "remaining_time": "0:00:00", "throughput": 1596.8, "total_tokens": 170598400} +{"current_steps": 10, "total_steps": 20825, "loss": 1.3449, "learning_rate": 5.000000000000001e-07, "epoch": 0.0004801920768307323, "percentage": 0.05, "elapsed_time": "0:00:54", "remaining_time": "1 day, 7:39:43", "throughput": 1495.98, "total_tokens": 81920} +{"current_steps": 20, "total_steps": 20825, "loss": 1.339, "learning_rate": 1.0000000000000002e-06, "epoch": 0.0009603841536614646, "percentage": 0.1, "elapsed_time": "0:01:40", "remaining_time": "1 day, 5:01:07", "throughput": 1631.46, "total_tokens": 163840} +{"current_steps": 30, "total_steps": 20825, "loss": 1.3256, "learning_rate": 1.5e-06, "epoch": 0.0014405762304921968, "percentage": 0.14, "elapsed_time": "0:02:25", "remaining_time": "1 day, 4:06:41", "throughput": 1683.31, "total_tokens": 245760} +{"current_steps": 40, "total_steps": 20825, "loss": 1.4026, "learning_rate": 2.0000000000000003e-06, "epoch": 0.0019207683073229293, "percentage": 0.19, "elapsed_time": "0:03:10", "remaining_time": "1 day, 3:32:10", "throughput": 1717.64, "total_tokens": 327680} +{"current_steps": 50, "total_steps": 20825, "loss": 1.1825, "learning_rate": 2.5e-06, "epoch": 0.0024009603841536613, "percentage": 0.24, "elapsed_time": "0:03:59", "remaining_time": "1 day, 3:35:19", "throughput": 1713.55, "total_tokens": 409600} +{"current_steps": 60, "total_steps": 20825, "loss": 1.0617, "learning_rate": 3e-06, "epoch": 0.0028811524609843936, "percentage": 0.29, "elapsed_time": "0:04:45", "remaining_time": "1 day, 3:24:18", "throughput": 1724.19, "total_tokens": 491520} +{"current_steps": 70, "total_steps": 20825, "loss": 1.2085, "learning_rate": 3.5000000000000004e-06, "epoch": 0.0033613445378151263, "percentage": 0.34, "elapsed_time": "0:05:30", "remaining_time": "1 day, 3:14:55", "throughput": 1733.26, "total_tokens": 573440} +{"current_steps": 80, "total_steps": 20825, "loss": 1.2014, "learning_rate": 4.000000000000001e-06, "epoch": 0.0038415366146458585, "percentage": 0.38, "elapsed_time": "0:06:16", "remaining_time": "1 day, 3:05:35", "throughput": 1742.37, "total_tokens": 655360} +{"current_steps": 90, "total_steps": 20825, "loss": 1.2691, "learning_rate": 4.5e-06, "epoch": 0.004321728691476591, "percentage": 0.43, "elapsed_time": "0:07:01", "remaining_time": "1 day, 2:58:16", "throughput": 1749.41, "total_tokens": 737280} +{"current_steps": 100, "total_steps": 20825, "loss": 1.1872, "learning_rate": 5e-06, "epoch": 0.004801920768307323, "percentage": 0.48, "elapsed_time": "0:07:47", "remaining_time": "1 day, 2:53:17", "throughput": 1753.97, "total_tokens": 819200} +{"current_steps": 110, "total_steps": 20825, "loss": 1.2103, "learning_rate": 5.500000000000001e-06, "epoch": 0.005282112845138055, "percentage": 0.53, "elapsed_time": "0:08:32", "remaining_time": "1 day, 2:48:09", "throughput": 1758.7, "total_tokens": 901120} +{"current_steps": 120, "total_steps": 20825, "loss": 1.4538, "learning_rate": 6e-06, "epoch": 0.005762304921968787, "percentage": 0.58, "elapsed_time": "0:09:17", "remaining_time": "1 day, 2:43:37", "throughput": 1762.83, "total_tokens": 983040} +{"current_steps": 130, "total_steps": 20825, "loss": 1.3365, "learning_rate": 6.5000000000000004e-06, "epoch": 0.00624249699879952, "percentage": 0.62, "elapsed_time": "0:10:02", "remaining_time": "1 day, 2:39:41", "throughput": 1766.31, "total_tokens": 1064960} +{"current_steps": 140, "total_steps": 20825, "loss": 1.0837, "learning_rate": 7.000000000000001e-06, "epoch": 0.0067226890756302525, "percentage": 0.67, "elapsed_time": "0:10:48", "remaining_time": "1 day, 2:36:06", "throughput": 1769.42, "total_tokens": 1146880} +{"current_steps": 150, "total_steps": 20825, "loss": 1.0649, "learning_rate": 7.5e-06, "epoch": 0.007202881152460984, "percentage": 0.72, "elapsed_time": "0:11:33", "remaining_time": "1 day, 2:32:43", "throughput": 1772.32, "total_tokens": 1228800} +{"current_steps": 160, "total_steps": 20825, "loss": 1.3666, "learning_rate": 8.000000000000001e-06, "epoch": 0.007683073229291717, "percentage": 0.77, "elapsed_time": "0:12:18", "remaining_time": "1 day, 2:29:45", "throughput": 1774.78, "total_tokens": 1310720} +{"current_steps": 170, "total_steps": 20825, "loss": 1.2506, "learning_rate": 8.500000000000002e-06, "epoch": 0.00816326530612245, "percentage": 0.82, "elapsed_time": "0:13:03", "remaining_time": "1 day, 2:27:04", "throughput": 1776.91, "total_tokens": 1392640} +{"current_steps": 180, "total_steps": 20825, "loss": 1.0234, "learning_rate": 9e-06, "epoch": 0.008643457382953182, "percentage": 0.86, "elapsed_time": "0:13:48", "remaining_time": "1 day, 2:24:13", "throughput": 1779.26, "total_tokens": 1474560} +{"current_steps": 190, "total_steps": 20825, "loss": 0.9989, "learning_rate": 9.5e-06, "epoch": 0.009123649459783913, "percentage": 0.91, "elapsed_time": "0:14:33", "remaining_time": "1 day, 2:21:58", "throughput": 1780.93, "total_tokens": 1556480} +{"current_steps": 200, "total_steps": 20825, "loss": 0.8422, "learning_rate": 1e-05, "epoch": 0.009603841536614645, "percentage": 0.96, "elapsed_time": "0:15:19", "remaining_time": "1 day, 2:20:29", "throughput": 1781.73, "total_tokens": 1638400} +{"current_steps": 210, "total_steps": 20825, "loss": 1.0182, "learning_rate": 1.05e-05, "epoch": 0.010084033613445379, "percentage": 1.01, "elapsed_time": "0:16:04", "remaining_time": "1 day, 2:18:30", "throughput": 1783.1, "total_tokens": 1720320} +{"current_steps": 220, "total_steps": 20825, "loss": 0.8848, "learning_rate": 1.1000000000000001e-05, "epoch": 0.01056422569027611, "percentage": 1.06, "elapsed_time": "0:16:49", "remaining_time": "1 day, 2:16:28", "throughput": 1784.54, "total_tokens": 1802240} +{"current_steps": 230, "total_steps": 20825, "loss": 1.1464, "learning_rate": 1.1500000000000002e-05, "epoch": 0.011044417767106842, "percentage": 1.1, "elapsed_time": "0:17:35", "remaining_time": "1 day, 2:15:02", "throughput": 1785.28, "total_tokens": 1884160} +{"current_steps": 240, "total_steps": 20825, "loss": 1.0084, "learning_rate": 1.2e-05, "epoch": 0.011524609843937574, "percentage": 1.15, "elapsed_time": "0:18:20", "remaining_time": "1 day, 2:13:16", "throughput": 1786.43, "total_tokens": 1966080} +{"current_steps": 250, "total_steps": 20825, "loss": 1.0096, "learning_rate": 1.25e-05, "epoch": 0.012004801920768308, "percentage": 1.2, "elapsed_time": "0:19:05", "remaining_time": "1 day, 2:11:40", "throughput": 1787.37, "total_tokens": 2048000} +{"current_steps": 260, "total_steps": 20825, "loss": 0.9685, "learning_rate": 1.3000000000000001e-05, "epoch": 0.01248499399759904, "percentage": 1.25, "elapsed_time": "0:19:51", "remaining_time": "1 day, 2:10:18", "throughput": 1788.06, "total_tokens": 2129920} +{"current_steps": 270, "total_steps": 20825, "loss": 1.109, "learning_rate": 1.3500000000000001e-05, "epoch": 0.012965186074429771, "percentage": 1.3, "elapsed_time": "0:20:36", "remaining_time": "1 day, 2:09:06", "throughput": 1788.55, "total_tokens": 2211840} +{"current_steps": 280, "total_steps": 20825, "loss": 1.079, "learning_rate": 1.4000000000000001e-05, "epoch": 0.013445378151260505, "percentage": 1.34, "elapsed_time": "0:21:21", "remaining_time": "1 day, 2:07:34", "throughput": 1789.43, "total_tokens": 2293760} +{"current_steps": 290, "total_steps": 20825, "loss": 1.0842, "learning_rate": 1.45e-05, "epoch": 0.013925570228091237, "percentage": 1.39, "elapsed_time": "0:22:07", "remaining_time": "1 day, 2:06:12", "throughput": 1790.12, "total_tokens": 2375680} +{"current_steps": 300, "total_steps": 20825, "loss": 1.0287, "learning_rate": 1.5e-05, "epoch": 0.014405762304921969, "percentage": 1.44, "elapsed_time": "0:22:52", "remaining_time": "1 day, 2:04:42", "throughput": 1790.96, "total_tokens": 2457600} +{"current_steps": 310, "total_steps": 20825, "loss": 1.1743, "learning_rate": 1.55e-05, "epoch": 0.0148859543817527, "percentage": 1.49, "elapsed_time": "0:23:37", "remaining_time": "1 day, 2:03:52", "throughput": 1791.05, "total_tokens": 2539520} +{"current_steps": 320, "total_steps": 20825, "loss": 1.1558, "learning_rate": 1.6000000000000003e-05, "epoch": 0.015366146458583434, "percentage": 1.54, "elapsed_time": "0:24:23", "remaining_time": "1 day, 2:02:33", "throughput": 1791.69, "total_tokens": 2621440} +{"current_steps": 330, "total_steps": 20825, "loss": 1.0934, "learning_rate": 1.65e-05, "epoch": 0.015846338535414166, "percentage": 1.58, "elapsed_time": "0:25:08", "remaining_time": "1 day, 2:01:21", "throughput": 1792.19, "total_tokens": 2703360} +{"current_steps": 340, "total_steps": 20825, "loss": 1.0637, "learning_rate": 1.7000000000000003e-05, "epoch": 0.0163265306122449, "percentage": 1.63, "elapsed_time": "0:25:53", "remaining_time": "1 day, 2:00:23", "throughput": 1792.42, "total_tokens": 2785280} +{"current_steps": 350, "total_steps": 20825, "loss": 1.1708, "learning_rate": 1.75e-05, "epoch": 0.01680672268907563, "percentage": 1.68, "elapsed_time": "0:26:39", "remaining_time": "1 day, 1:59:22", "throughput": 1792.71, "total_tokens": 2867200} +{"current_steps": 360, "total_steps": 20825, "loss": 0.9425, "learning_rate": 1.8e-05, "epoch": 0.017286914765906363, "percentage": 1.73, "elapsed_time": "0:27:24", "remaining_time": "1 day, 1:58:08", "throughput": 1793.26, "total_tokens": 2949120} +{"current_steps": 370, "total_steps": 20825, "loss": 0.9716, "learning_rate": 1.85e-05, "epoch": 0.017767106842737093, "percentage": 1.78, "elapsed_time": "0:28:09", "remaining_time": "1 day, 1:56:43", "throughput": 1794.02, "total_tokens": 3031040} +{"current_steps": 380, "total_steps": 20825, "loss": 1.0748, "learning_rate": 1.9e-05, "epoch": 0.018247298919567827, "percentage": 1.82, "elapsed_time": "0:28:54", "remaining_time": "1 day, 1:55:22", "throughput": 1794.69, "total_tokens": 3112960} +{"current_steps": 390, "total_steps": 20825, "loss": 0.9879, "learning_rate": 1.9500000000000003e-05, "epoch": 0.01872749099639856, "percentage": 1.87, "elapsed_time": "0:29:39", "remaining_time": "1 day, 1:54:10", "throughput": 1795.2, "total_tokens": 3194880} +{"current_steps": 400, "total_steps": 20825, "loss": 1.1051, "learning_rate": 2e-05, "epoch": 0.01920768307322929, "percentage": 1.92, "elapsed_time": "0:30:24", "remaining_time": "1 day, 1:52:53", "throughput": 1795.8, "total_tokens": 3276800} +{"current_steps": 410, "total_steps": 20825, "loss": 1.1197, "learning_rate": 2.05e-05, "epoch": 0.019687875150060024, "percentage": 1.97, "elapsed_time": "0:31:10", "remaining_time": "1 day, 1:51:59", "throughput": 1795.97, "total_tokens": 3358720} +{"current_steps": 420, "total_steps": 20825, "loss": 1.046, "learning_rate": 2.1e-05, "epoch": 0.020168067226890758, "percentage": 2.02, "elapsed_time": "0:31:55", "remaining_time": "1 day, 1:50:57", "throughput": 1796.29, "total_tokens": 3440640} +{"current_steps": 430, "total_steps": 20825, "loss": 1.0229, "learning_rate": 2.15e-05, "epoch": 0.020648259303721488, "percentage": 2.06, "elapsed_time": "0:32:40", "remaining_time": "1 day, 1:50:03", "throughput": 1796.45, "total_tokens": 3522560} +{"current_steps": 440, "total_steps": 20825, "loss": 1.138, "learning_rate": 2.2000000000000003e-05, "epoch": 0.02112845138055222, "percentage": 2.11, "elapsed_time": "0:33:25", "remaining_time": "1 day, 1:48:55", "throughput": 1796.88, "total_tokens": 3604480} +{"current_steps": 450, "total_steps": 20825, "loss": 0.9448, "learning_rate": 2.25e-05, "epoch": 0.021608643457382955, "percentage": 2.16, "elapsed_time": "0:34:11", "remaining_time": "1 day, 1:47:46", "throughput": 1797.32, "total_tokens": 3686400} +{"current_steps": 460, "total_steps": 20825, "loss": 0.9858, "learning_rate": 2.3000000000000003e-05, "epoch": 0.022088835534213685, "percentage": 2.21, "elapsed_time": "0:34:56", "remaining_time": "1 day, 1:46:47", "throughput": 1797.6, "total_tokens": 3768320} +{"current_steps": 470, "total_steps": 20825, "loss": 1.242, "learning_rate": 2.35e-05, "epoch": 0.02256902761104442, "percentage": 2.26, "elapsed_time": "0:35:41", "remaining_time": "1 day, 1:45:38", "throughput": 1798.05, "total_tokens": 3850240} +{"current_steps": 480, "total_steps": 20825, "loss": 1.046, "learning_rate": 2.4e-05, "epoch": 0.02304921968787515, "percentage": 2.3, "elapsed_time": "0:36:26", "remaining_time": "1 day, 1:44:33", "throughput": 1798.42, "total_tokens": 3932160} +{"current_steps": 490, "total_steps": 20825, "loss": 1.0759, "learning_rate": 2.45e-05, "epoch": 0.023529411764705882, "percentage": 2.35, "elapsed_time": "0:37:11", "remaining_time": "1 day, 1:43:32", "throughput": 1798.72, "total_tokens": 4014080} +{"current_steps": 500, "total_steps": 20825, "loss": 1.0796, "learning_rate": 2.5e-05, "epoch": 0.024009603841536616, "percentage": 2.4, "elapsed_time": "0:37:57", "remaining_time": "1 day, 1:42:44", "throughput": 1798.78, "total_tokens": 4096000} +{"current_steps": 510, "total_steps": 20825, "loss": 1.0057, "learning_rate": 2.5500000000000003e-05, "epoch": 0.024489795918367346, "percentage": 2.45, "elapsed_time": "0:38:42", "remaining_time": "1 day, 1:41:43", "throughput": 1799.08, "total_tokens": 4177920} +{"current_steps": 520, "total_steps": 20825, "loss": 0.9161, "learning_rate": 2.6000000000000002e-05, "epoch": 0.02496998799519808, "percentage": 2.5, "elapsed_time": "0:39:27", "remaining_time": "1 day, 1:40:39", "throughput": 1799.43, "total_tokens": 4259840} +{"current_steps": 530, "total_steps": 20825, "loss": 1.0109, "learning_rate": 2.6500000000000004e-05, "epoch": 0.025450180072028813, "percentage": 2.55, "elapsed_time": "0:40:12", "remaining_time": "1 day, 1:39:38", "throughput": 1799.73, "total_tokens": 4341760} +{"current_steps": 540, "total_steps": 20825, "loss": 0.9605, "learning_rate": 2.7000000000000002e-05, "epoch": 0.025930372148859543, "percentage": 2.59, "elapsed_time": "0:40:57", "remaining_time": "1 day, 1:38:43", "throughput": 1799.91, "total_tokens": 4423680} +{"current_steps": 550, "total_steps": 20825, "loss": 1.0826, "learning_rate": 2.7500000000000004e-05, "epoch": 0.026410564225690276, "percentage": 2.64, "elapsed_time": "0:41:42", "remaining_time": "1 day, 1:37:49", "throughput": 1800.09, "total_tokens": 4505600} +{"current_steps": 560, "total_steps": 20825, "loss": 1.2013, "learning_rate": 2.8000000000000003e-05, "epoch": 0.02689075630252101, "percentage": 2.69, "elapsed_time": "0:42:28", "remaining_time": "1 day, 1:36:59", "throughput": 1800.16, "total_tokens": 4587520} +{"current_steps": 570, "total_steps": 20825, "loss": 1.0361, "learning_rate": 2.8499999999999998e-05, "epoch": 0.02737094837935174, "percentage": 2.74, "elapsed_time": "0:43:13", "remaining_time": "1 day, 1:36:00", "throughput": 1800.43, "total_tokens": 4669440} +{"current_steps": 580, "total_steps": 20825, "loss": 1.1374, "learning_rate": 2.9e-05, "epoch": 0.027851140456182474, "percentage": 2.79, "elapsed_time": "0:43:58", "remaining_time": "1 day, 1:35:04", "throughput": 1800.63, "total_tokens": 4751360} +{"current_steps": 590, "total_steps": 20825, "loss": 1.1363, "learning_rate": 2.95e-05, "epoch": 0.028331332533013204, "percentage": 2.83, "elapsed_time": "0:44:43", "remaining_time": "1 day, 1:34:09", "throughput": 1800.82, "total_tokens": 4833280} +{"current_steps": 600, "total_steps": 20825, "loss": 0.8576, "learning_rate": 3e-05, "epoch": 0.028811524609843937, "percentage": 2.88, "elapsed_time": "0:45:29", "remaining_time": "1 day, 1:33:14", "throughput": 1801.02, "total_tokens": 4915200} +{"current_steps": 610, "total_steps": 20825, "loss": 1.2395, "learning_rate": 3.05e-05, "epoch": 0.02929171668667467, "percentage": 2.93, "elapsed_time": "0:46:14", "remaining_time": "1 day, 1:32:25", "throughput": 1801.09, "total_tokens": 4997120} +{"current_steps": 620, "total_steps": 20825, "loss": 0.9339, "learning_rate": 3.1e-05, "epoch": 0.0297719087635054, "percentage": 2.98, "elapsed_time": "0:46:59", "remaining_time": "1 day, 1:31:25", "throughput": 1801.37, "total_tokens": 5079040} +{"current_steps": 630, "total_steps": 20825, "loss": 0.9699, "learning_rate": 3.15e-05, "epoch": 0.030252100840336135, "percentage": 3.03, "elapsed_time": "0:47:44", "remaining_time": "1 day, 1:30:25", "throughput": 1801.65, "total_tokens": 5160960} +{"current_steps": 640, "total_steps": 20825, "loss": 0.9722, "learning_rate": 3.2000000000000005e-05, "epoch": 0.030732292917166868, "percentage": 3.07, "elapsed_time": "0:48:29", "remaining_time": "1 day, 1:29:28", "throughput": 1801.87, "total_tokens": 5242880} +{"current_steps": 650, "total_steps": 20825, "loss": 0.9991, "learning_rate": 3.2500000000000004e-05, "epoch": 0.031212484993997598, "percentage": 3.12, "elapsed_time": "0:49:15", "remaining_time": "1 day, 1:28:42", "throughput": 1801.89, "total_tokens": 5324800} +{"current_steps": 660, "total_steps": 20825, "loss": 0.8745, "learning_rate": 3.3e-05, "epoch": 0.03169267707082833, "percentage": 3.17, "elapsed_time": "0:50:00", "remaining_time": "1 day, 1:27:55", "throughput": 1801.91, "total_tokens": 5406720} +{"current_steps": 670, "total_steps": 20825, "loss": 0.8664, "learning_rate": 3.35e-05, "epoch": 0.032172869147659065, "percentage": 3.22, "elapsed_time": "0:50:45", "remaining_time": "1 day, 1:27:00", "throughput": 1802.1, "total_tokens": 5488640} +{"current_steps": 680, "total_steps": 20825, "loss": 0.88, "learning_rate": 3.4000000000000007e-05, "epoch": 0.0326530612244898, "percentage": 3.27, "elapsed_time": "0:51:31", "remaining_time": "1 day, 1:26:14", "throughput": 1802.12, "total_tokens": 5570560} +{"current_steps": 690, "total_steps": 20825, "loss": 1.0718, "learning_rate": 3.45e-05, "epoch": 0.033133253301320525, "percentage": 3.31, "elapsed_time": "0:52:16", "remaining_time": "1 day, 1:25:29", "throughput": 1802.11, "total_tokens": 5652480} +{"current_steps": 700, "total_steps": 20825, "loss": 1.0753, "learning_rate": 3.5e-05, "epoch": 0.03361344537815126, "percentage": 3.36, "elapsed_time": "0:53:01", "remaining_time": "1 day, 1:24:38", "throughput": 1802.21, "total_tokens": 5734400} +{"current_steps": 710, "total_steps": 20825, "loss": 0.9675, "learning_rate": 3.55e-05, "epoch": 0.03409363745498199, "percentage": 3.41, "elapsed_time": "0:53:47", "remaining_time": "1 day, 1:23:51", "throughput": 1802.26, "total_tokens": 5816320} +{"current_steps": 720, "total_steps": 20825, "loss": 0.9765, "learning_rate": 3.6e-05, "epoch": 0.034573829531812726, "percentage": 3.46, "elapsed_time": "0:54:32", "remaining_time": "1 day, 1:22:56", "throughput": 1802.44, "total_tokens": 5898240} +{"current_steps": 730, "total_steps": 20825, "loss": 0.9347, "learning_rate": 3.65e-05, "epoch": 0.03505402160864346, "percentage": 3.51, "elapsed_time": "0:55:17", "remaining_time": "1 day, 1:22:03", "throughput": 1802.59, "total_tokens": 5980160} +{"current_steps": 740, "total_steps": 20825, "loss": 0.9209, "learning_rate": 3.7e-05, "epoch": 0.035534213685474186, "percentage": 3.55, "elapsed_time": "0:56:02", "remaining_time": "1 day, 1:21:13", "throughput": 1802.68, "total_tokens": 6062080} +{"current_steps": 750, "total_steps": 20825, "loss": 1.0337, "learning_rate": 3.7500000000000003e-05, "epoch": 0.03601440576230492, "percentage": 3.6, "elapsed_time": "0:56:48", "remaining_time": "1 day, 1:20:21", "throughput": 1802.79, "total_tokens": 6144000} +{"current_steps": 760, "total_steps": 20825, "loss": 1.051, "learning_rate": 3.8e-05, "epoch": 0.036494597839135653, "percentage": 3.65, "elapsed_time": "0:57:33", "remaining_time": "1 day, 1:19:27", "throughput": 1802.97, "total_tokens": 6225920} +{"current_steps": 770, "total_steps": 20825, "loss": 0.9995, "learning_rate": 3.85e-05, "epoch": 0.03697478991596639, "percentage": 3.7, "elapsed_time": "0:58:18", "remaining_time": "1 day, 1:18:39", "throughput": 1803.02, "total_tokens": 6307840} +{"current_steps": 780, "total_steps": 20825, "loss": 1.0438, "learning_rate": 3.9000000000000006e-05, "epoch": 0.03745498199279712, "percentage": 3.75, "elapsed_time": "0:59:03", "remaining_time": "1 day, 1:17:45", "throughput": 1803.18, "total_tokens": 6389760} +{"current_steps": 790, "total_steps": 20825, "loss": 1.0693, "learning_rate": 3.9500000000000005e-05, "epoch": 0.037935174069627854, "percentage": 3.79, "elapsed_time": "0:59:48", "remaining_time": "1 day, 1:16:51", "throughput": 1803.36, "total_tokens": 6471680} +{"current_steps": 800, "total_steps": 20825, "loss": 0.9723, "learning_rate": 4e-05, "epoch": 0.03841536614645858, "percentage": 3.84, "elapsed_time": "1:00:33", "remaining_time": "1 day, 1:15:57", "throughput": 1803.54, "total_tokens": 6553600} +{"current_steps": 810, "total_steps": 20825, "loss": 1.1387, "learning_rate": 4.05e-05, "epoch": 0.038895558223289314, "percentage": 3.89, "elapsed_time": "1:01:18", "remaining_time": "1 day, 1:15:05", "throughput": 1803.66, "total_tokens": 6635520} +{"current_steps": 820, "total_steps": 20825, "loss": 1.0296, "learning_rate": 4.1e-05, "epoch": 0.03937575030012005, "percentage": 3.94, "elapsed_time": "1:02:03", "remaining_time": "1 day, 1:14:10", "throughput": 1803.85, "total_tokens": 6717440} +{"current_steps": 830, "total_steps": 20825, "loss": 0.9731, "learning_rate": 4.15e-05, "epoch": 0.03985594237695078, "percentage": 3.99, "elapsed_time": "1:02:49", "remaining_time": "1 day, 1:13:21", "throughput": 1803.93, "total_tokens": 6799360} +{"current_steps": 840, "total_steps": 20825, "loss": 0.9446, "learning_rate": 4.2e-05, "epoch": 0.040336134453781515, "percentage": 4.03, "elapsed_time": "1:03:34", "remaining_time": "1 day, 1:12:33", "throughput": 1803.97, "total_tokens": 6881280} +{"current_steps": 850, "total_steps": 20825, "loss": 0.9918, "learning_rate": 4.25e-05, "epoch": 0.04081632653061224, "percentage": 4.08, "elapsed_time": "1:04:19", "remaining_time": "1 day, 1:11:41", "throughput": 1804.1, "total_tokens": 6963200} +{"current_steps": 860, "total_steps": 20825, "loss": 0.9964, "learning_rate": 4.3e-05, "epoch": 0.041296518607442975, "percentage": 4.13, "elapsed_time": "1:05:04", "remaining_time": "1 day, 1:10:50", "throughput": 1804.21, "total_tokens": 7045120} +{"current_steps": 870, "total_steps": 20825, "loss": 1.0334, "learning_rate": 4.35e-05, "epoch": 0.04177671068427371, "percentage": 4.18, "elapsed_time": "1:05:49", "remaining_time": "1 day, 1:09:59", "throughput": 1804.34, "total_tokens": 7127040} +{"current_steps": 880, "total_steps": 20825, "loss": 0.8306, "learning_rate": 4.4000000000000006e-05, "epoch": 0.04225690276110444, "percentage": 4.23, "elapsed_time": "1:06:35", "remaining_time": "1 day, 1:09:10", "throughput": 1804.41, "total_tokens": 7208960} +{"current_steps": 890, "total_steps": 20825, "loss": 1.3483, "learning_rate": 4.4500000000000004e-05, "epoch": 0.042737094837935176, "percentage": 4.27, "elapsed_time": "1:07:20", "remaining_time": "1 day, 1:08:20", "throughput": 1804.49, "total_tokens": 7290880} +{"current_steps": 900, "total_steps": 20825, "loss": 1.1189, "learning_rate": 4.5e-05, "epoch": 0.04321728691476591, "percentage": 4.32, "elapsed_time": "1:08:05", "remaining_time": "1 day, 1:07:29", "throughput": 1804.61, "total_tokens": 7372800} +{"current_steps": 910, "total_steps": 20825, "loss": 1.1789, "learning_rate": 4.55e-05, "epoch": 0.043697478991596636, "percentage": 4.37, "elapsed_time": "1:08:51", "remaining_time": "1 day, 1:06:47", "throughput": 1804.54, "total_tokens": 7454720} +{"current_steps": 920, "total_steps": 20825, "loss": 1.0259, "learning_rate": 4.600000000000001e-05, "epoch": 0.04417767106842737, "percentage": 4.42, "elapsed_time": "1:09:36", "remaining_time": "1 day, 1:05:55", "throughput": 1804.67, "total_tokens": 7536640} +{"current_steps": 930, "total_steps": 20825, "loss": 1.0611, "learning_rate": 4.6500000000000005e-05, "epoch": 0.0446578631452581, "percentage": 4.47, "elapsed_time": "1:10:21", "remaining_time": "1 day, 1:05:07", "throughput": 1804.72, "total_tokens": 7618560} +{"current_steps": 940, "total_steps": 20825, "loss": 0.9896, "learning_rate": 4.7e-05, "epoch": 0.04513805522208884, "percentage": 4.51, "elapsed_time": "1:11:06", "remaining_time": "1 day, 1:04:17", "throughput": 1804.82, "total_tokens": 7700480} +{"current_steps": 950, "total_steps": 20825, "loss": 0.9137, "learning_rate": 4.75e-05, "epoch": 0.04561824729891957, "percentage": 4.56, "elapsed_time": "1:11:51", "remaining_time": "1 day, 1:03:26", "throughput": 1804.93, "total_tokens": 7782400} +{"current_steps": 960, "total_steps": 20825, "loss": 0.875, "learning_rate": 4.8e-05, "epoch": 0.0460984393757503, "percentage": 4.61, "elapsed_time": "1:12:36", "remaining_time": "1 day, 1:02:37", "throughput": 1804.99, "total_tokens": 7864320} +{"current_steps": 970, "total_steps": 20825, "loss": 1.0156, "learning_rate": 4.85e-05, "epoch": 0.04657863145258103, "percentage": 4.66, "elapsed_time": "1:13:22", "remaining_time": "1 day, 1:01:46", "throughput": 1805.11, "total_tokens": 7946240} +{"current_steps": 980, "total_steps": 20825, "loss": 0.8589, "learning_rate": 4.9e-05, "epoch": 0.047058823529411764, "percentage": 4.71, "elapsed_time": "1:14:07", "remaining_time": "1 day, 1:00:55", "throughput": 1805.22, "total_tokens": 8028160} +{"current_steps": 990, "total_steps": 20825, "loss": 0.8402, "learning_rate": 4.9500000000000004e-05, "epoch": 0.0475390156062425, "percentage": 4.75, "elapsed_time": "1:14:52", "remaining_time": "1 day, 1:00:10", "throughput": 1805.22, "total_tokens": 8110080} +{"current_steps": 1000, "total_steps": 20825, "loss": 0.8892, "learning_rate": 5e-05, "epoch": 0.04801920768307323, "percentage": 4.8, "elapsed_time": "1:15:37", "remaining_time": "1 day, 0:59:20", "throughput": 1805.31, "total_tokens": 8192000} +{"current_steps": 1010, "total_steps": 20825, "loss": 1.0213, "learning_rate": 4.9999968610581127e-05, "epoch": 0.048499399759903965, "percentage": 4.85, "elapsed_time": "1:16:38", "remaining_time": "1 day, 1:03:28", "throughput": 1799.43, "total_tokens": 8273920} +{"current_steps": 1020, "total_steps": 20825, "loss": 1.0984, "learning_rate": 4.9999874442403314e-05, "epoch": 0.04897959183673469, "percentage": 4.9, "elapsed_time": "1:17:23", "remaining_time": "1 day, 1:02:36", "throughput": 1799.56, "total_tokens": 8355840} +{"current_steps": 1030, "total_steps": 20825, "loss": 1.167, "learning_rate": 4.999971749570305e-05, "epoch": 0.049459783913565425, "percentage": 4.95, "elapsed_time": "1:18:08", "remaining_time": "1 day, 1:01:52", "throughput": 1799.54, "total_tokens": 8437760} +{"current_steps": 1040, "total_steps": 20825, "loss": 0.9767, "learning_rate": 4.999949777087444e-05, "epoch": 0.04993997599039616, "percentage": 4.99, "elapsed_time": "1:18:54", "remaining_time": "1 day, 1:01:03", "throughput": 1799.61, "total_tokens": 8519680} +{"current_steps": 1050, "total_steps": 20825, "loss": 0.8419, "learning_rate": 4.999921526846925e-05, "epoch": 0.05042016806722689, "percentage": 5.04, "elapsed_time": "1:19:39", "remaining_time": "1 day, 1:00:12", "throughput": 1799.71, "total_tokens": 8601600} +{"current_steps": 1060, "total_steps": 20825, "loss": 0.9681, "learning_rate": 4.9998869989196885e-05, "epoch": 0.050900360144057626, "percentage": 5.09, "elapsed_time": "1:20:24", "remaining_time": "1 day, 0:59:23", "throughput": 1799.78, "total_tokens": 8683520} +{"current_steps": 1070, "total_steps": 20825, "loss": 0.9462, "learning_rate": 4.99984619339244e-05, "epoch": 0.05138055222088835, "percentage": 5.14, "elapsed_time": "1:21:10", "remaining_time": "1 day, 0:58:34", "throughput": 1799.86, "total_tokens": 8765440} +{"current_steps": 1080, "total_steps": 20825, "loss": 1.0044, "learning_rate": 4.999799110367648e-05, "epoch": 0.051860744297719086, "percentage": 5.19, "elapsed_time": "1:21:55", "remaining_time": "1 day, 0:57:47", "throughput": 1799.89, "total_tokens": 8847360} +{"current_steps": 1090, "total_steps": 20825, "loss": 1.0218, "learning_rate": 4.999745749963545e-05, "epoch": 0.05234093637454982, "percentage": 5.23, "elapsed_time": "1:22:40", "remaining_time": "1 day, 0:56:59", "throughput": 1799.93, "total_tokens": 8929280} +{"current_steps": 1100, "total_steps": 20825, "loss": 0.8808, "learning_rate": 4.999686112314127e-05, "epoch": 0.05282112845138055, "percentage": 5.28, "elapsed_time": "1:23:26", "remaining_time": "1 day, 0:56:07", "throughput": 1800.07, "total_tokens": 9011200} +{"current_steps": 1110, "total_steps": 20825, "loss": 1.1594, "learning_rate": 4.999620197569155e-05, "epoch": 0.053301320528211286, "percentage": 5.33, "elapsed_time": "1:24:11", "remaining_time": "1 day, 0:55:17", "throughput": 1800.15, "total_tokens": 9093120} +{"current_steps": 1120, "total_steps": 20825, "loss": 0.8905, "learning_rate": 4.9995480058941483e-05, "epoch": 0.05378151260504202, "percentage": 5.38, "elapsed_time": "1:24:56", "remaining_time": "1 day, 0:54:27", "throughput": 1800.24, "total_tokens": 9175040} +{"current_steps": 1130, "total_steps": 20825, "loss": 0.9875, "learning_rate": 4.9994695374703934e-05, "epoch": 0.05426170468187275, "percentage": 5.43, "elapsed_time": "1:25:41", "remaining_time": "1 day, 0:53:36", "throughput": 1800.35, "total_tokens": 9256960} +{"current_steps": 1140, "total_steps": 20825, "loss": 0.8852, "learning_rate": 4.9993847924949364e-05, "epoch": 0.05474189675870348, "percentage": 5.47, "elapsed_time": "1:26:27", "remaining_time": "1 day, 0:52:46", "throughput": 1800.44, "total_tokens": 9338880} +{"current_steps": 1150, "total_steps": 20825, "loss": 0.91, "learning_rate": 4.999293771180584e-05, "epoch": 0.055222088835534214, "percentage": 5.52, "elapsed_time": "1:27:12", "remaining_time": "1 day, 0:51:55", "throughput": 1800.55, "total_tokens": 9420800} +{"current_steps": 1160, "total_steps": 20825, "loss": 1.0214, "learning_rate": 4.999196473755905e-05, "epoch": 0.05570228091236495, "percentage": 5.57, "elapsed_time": "1:27:57", "remaining_time": "1 day, 0:51:03", "throughput": 1800.68, "total_tokens": 9502720} +{"current_steps": 1170, "total_steps": 20825, "loss": 1.0768, "learning_rate": 4.9990929004652287e-05, "epoch": 0.05618247298919568, "percentage": 5.62, "elapsed_time": "1:28:42", "remaining_time": "1 day, 0:50:14", "throughput": 1800.76, "total_tokens": 9584640} +{"current_steps": 1180, "total_steps": 20825, "loss": 0.9418, "learning_rate": 4.9989830515686434e-05, "epoch": 0.05666266506602641, "percentage": 5.67, "elapsed_time": "1:29:27", "remaining_time": "1 day, 0:49:27", "throughput": 1800.8, "total_tokens": 9666560} +{"current_steps": 1190, "total_steps": 20825, "loss": 1.0168, "learning_rate": 4.998866927341995e-05, "epoch": 0.05714285714285714, "percentage": 5.71, "elapsed_time": "1:30:12", "remaining_time": "1 day, 0:48:33", "throughput": 1800.95, "total_tokens": 9748480} +{"current_steps": 1200, "total_steps": 20825, "loss": 0.9405, "learning_rate": 4.9987445280768916e-05, "epoch": 0.057623049219687875, "percentage": 5.76, "elapsed_time": "1:30:58", "remaining_time": "1 day, 0:47:50", "throughput": 1800.91, "total_tokens": 9830400} +{"current_steps": 1210, "total_steps": 20825, "loss": 1.0905, "learning_rate": 4.998615854080695e-05, "epoch": 0.05810324129651861, "percentage": 5.81, "elapsed_time": "1:31:43", "remaining_time": "1 day, 0:47:00", "throughput": 1801.0, "total_tokens": 9912320} +{"current_steps": 1220, "total_steps": 20825, "loss": 0.9024, "learning_rate": 4.998480905676527e-05, "epoch": 0.05858343337334934, "percentage": 5.86, "elapsed_time": "1:32:28", "remaining_time": "1 day, 0:46:10", "throughput": 1801.1, "total_tokens": 9994240} +{"current_steps": 1230, "total_steps": 20825, "loss": 1.2022, "learning_rate": 4.998339683203261e-05, "epoch": 0.059063625450180075, "percentage": 5.91, "elapsed_time": "1:33:13", "remaining_time": "1 day, 0:45:16", "throughput": 1801.26, "total_tokens": 10076160} +{"current_steps": 1240, "total_steps": 20825, "loss": 1.0539, "learning_rate": 4.9981921870155314e-05, "epoch": 0.0595438175270108, "percentage": 5.95, "elapsed_time": "1:33:58", "remaining_time": "1 day, 0:44:22", "throughput": 1801.44, "total_tokens": 10158080} +{"current_steps": 1250, "total_steps": 20825, "loss": 1.0482, "learning_rate": 4.998038417483721e-05, "epoch": 0.060024009603841535, "percentage": 6.0, "elapsed_time": "1:34:44", "remaining_time": "1 day, 0:43:39", "throughput": 1801.38, "total_tokens": 10240000} +{"current_steps": 1260, "total_steps": 20825, "loss": 1.0175, "learning_rate": 4.9978783749939705e-05, "epoch": 0.06050420168067227, "percentage": 6.05, "elapsed_time": "1:35:29", "remaining_time": "1 day, 0:42:53", "throughput": 1801.4, "total_tokens": 10321920} +{"current_steps": 1270, "total_steps": 20825, "loss": 0.902, "learning_rate": 4.997712059948171e-05, "epoch": 0.060984393757503, "percentage": 6.1, "elapsed_time": "1:36:15", "remaining_time": "1 day, 0:42:06", "throughput": 1801.43, "total_tokens": 10403840} +{"current_steps": 1280, "total_steps": 20825, "loss": 0.8692, "learning_rate": 4.997539472763964e-05, "epoch": 0.061464585834333736, "percentage": 6.15, "elapsed_time": "1:37:00", "remaining_time": "1 day, 0:41:15", "throughput": 1801.54, "total_tokens": 10485760} +{"current_steps": 1290, "total_steps": 20825, "loss": 1.1472, "learning_rate": 4.9973606138747434e-05, "epoch": 0.06194477791116446, "percentage": 6.19, "elapsed_time": "1:37:45", "remaining_time": "1 day, 0:40:30", "throughput": 1801.53, "total_tokens": 10567680} +{"current_steps": 1300, "total_steps": 20825, "loss": 0.8769, "learning_rate": 4.9971754837296516e-05, "epoch": 0.062424969987995196, "percentage": 6.24, "elapsed_time": "1:38:30", "remaining_time": "1 day, 0:39:38", "throughput": 1801.66, "total_tokens": 10649600} +{"current_steps": 1310, "total_steps": 20825, "loss": 1.2477, "learning_rate": 4.9969840827935776e-05, "epoch": 0.06290516206482594, "percentage": 6.29, "elapsed_time": "1:39:17", "remaining_time": "1 day, 0:39:01", "throughput": 1801.49, "total_tokens": 10731520} +{"current_steps": 1320, "total_steps": 20825, "loss": 0.674, "learning_rate": 4.99678641154716e-05, "epoch": 0.06338535414165666, "percentage": 6.34, "elapsed_time": "1:40:02", "remaining_time": "1 day, 0:38:21", "throughput": 1801.38, "total_tokens": 10813440} +{"current_steps": 1330, "total_steps": 20825, "loss": 1.063, "learning_rate": 4.9965824704867806e-05, "epoch": 0.06386554621848739, "percentage": 6.39, "elapsed_time": "1:40:48", "remaining_time": "1 day, 0:37:35", "throughput": 1801.38, "total_tokens": 10895360} +{"current_steps": 1340, "total_steps": 20825, "loss": 0.8696, "learning_rate": 4.996372260124567e-05, "epoch": 0.06434573829531813, "percentage": 6.43, "elapsed_time": "1:41:33", "remaining_time": "1 day, 0:36:52", "throughput": 1801.33, "total_tokens": 10977280} +{"current_steps": 1350, "total_steps": 20825, "loss": 0.7504, "learning_rate": 4.996155780988389e-05, "epoch": 0.06482593037214886, "percentage": 6.48, "elapsed_time": "1:42:19", "remaining_time": "1 day, 0:36:07", "throughput": 1801.33, "total_tokens": 11059200} +{"current_steps": 1360, "total_steps": 20825, "loss": 0.8579, "learning_rate": 4.9959330336218605e-05, "epoch": 0.0653061224489796, "percentage": 6.53, "elapsed_time": "1:43:04", "remaining_time": "1 day, 0:35:15", "throughput": 1801.46, "total_tokens": 11141120} +{"current_steps": 1370, "total_steps": 20825, "loss": 0.9259, "learning_rate": 4.995704018584334e-05, "epoch": 0.06578631452581032, "percentage": 6.58, "elapsed_time": "1:43:49", "remaining_time": "1 day, 0:34:29", "throughput": 1801.47, "total_tokens": 11223040} +{"current_steps": 1380, "total_steps": 20825, "loss": 0.7141, "learning_rate": 4.9954687364508996e-05, "epoch": 0.06626650660264105, "percentage": 6.63, "elapsed_time": "1:44:35", "remaining_time": "1 day, 0:33:44", "throughput": 1801.46, "total_tokens": 11304960} +{"current_steps": 1390, "total_steps": 20825, "loss": 0.8471, "learning_rate": 4.995227187812389e-05, "epoch": 0.06674669867947179, "percentage": 6.67, "elapsed_time": "1:45:20", "remaining_time": "1 day, 0:32:52", "throughput": 1801.6, "total_tokens": 11386880} +{"current_steps": 1400, "total_steps": 20825, "loss": 1.0521, "learning_rate": 4.9949793732753656e-05, "epoch": 0.06722689075630252, "percentage": 6.72, "elapsed_time": "1:46:05", "remaining_time": "1 day, 0:32:01", "throughput": 1801.72, "total_tokens": 11468800} +{"current_steps": 1410, "total_steps": 20825, "loss": 0.9402, "learning_rate": 4.994725293462132e-05, "epoch": 0.06770708283313326, "percentage": 6.77, "elapsed_time": "1:46:50", "remaining_time": "1 day, 0:31:10", "throughput": 1801.83, "total_tokens": 11550720} +{"current_steps": 1420, "total_steps": 20825, "loss": 0.9594, "learning_rate": 4.994464949010722e-05, "epoch": 0.06818727490996399, "percentage": 6.82, "elapsed_time": "1:47:35", "remaining_time": "1 day, 0:30:19", "throughput": 1801.93, "total_tokens": 11632640} +{"current_steps": 1430, "total_steps": 20825, "loss": 0.9039, "learning_rate": 4.994198340574898e-05, "epoch": 0.06866746698679471, "percentage": 6.87, "elapsed_time": "1:48:20", "remaining_time": "1 day, 0:29:31", "throughput": 1801.99, "total_tokens": 11714560} +{"current_steps": 1440, "total_steps": 20825, "loss": 0.8399, "learning_rate": 4.993925468824156e-05, "epoch": 0.06914765906362545, "percentage": 6.91, "elapsed_time": "1:49:06", "remaining_time": "1 day, 0:28:42", "throughput": 1802.06, "total_tokens": 11796480} +{"current_steps": 1450, "total_steps": 20825, "loss": 0.9013, "learning_rate": 4.99364633444372e-05, "epoch": 0.06962785114045618, "percentage": 6.96, "elapsed_time": "1:49:51", "remaining_time": "1 day, 0:27:55", "throughput": 1802.1, "total_tokens": 11878400} +{"current_steps": 1460, "total_steps": 20825, "loss": 0.9985, "learning_rate": 4.993360938134537e-05, "epoch": 0.07010804321728692, "percentage": 7.01, "elapsed_time": "1:50:36", "remaining_time": "1 day, 0:27:09", "throughput": 1802.11, "total_tokens": 11960320} +{"current_steps": 1470, "total_steps": 20825, "loss": 1.0197, "learning_rate": 4.993069280613282e-05, "epoch": 0.07058823529411765, "percentage": 7.06, "elapsed_time": "1:51:22", "remaining_time": "1 day, 0:26:24", "throughput": 1802.1, "total_tokens": 12042240} +{"current_steps": 1480, "total_steps": 20825, "loss": 0.964, "learning_rate": 4.9927713626123524e-05, "epoch": 0.07106842737094837, "percentage": 7.11, "elapsed_time": "1:52:07", "remaining_time": "1 day, 0:25:33", "throughput": 1802.2, "total_tokens": 12124160} +{"current_steps": 1490, "total_steps": 20825, "loss": 0.9385, "learning_rate": 4.992467184879865e-05, "epoch": 0.07154861944777911, "percentage": 7.15, "elapsed_time": "1:52:53", "remaining_time": "1 day, 0:24:51", "throughput": 1802.14, "total_tokens": 12206080} +{"current_steps": 1500, "total_steps": 20825, "loss": 1.0057, "learning_rate": 4.9921567481796585e-05, "epoch": 0.07202881152460984, "percentage": 7.2, "elapsed_time": "1:53:38", "remaining_time": "1 day, 0:24:00", "throughput": 1802.24, "total_tokens": 12288000} +{"current_steps": 1510, "total_steps": 20825, "loss": 0.955, "learning_rate": 4.9918400532912845e-05, "epoch": 0.07250900360144058, "percentage": 7.25, "elapsed_time": "1:54:23", "remaining_time": "1 day, 0:23:12", "throughput": 1802.3, "total_tokens": 12369920} +{"current_steps": 1520, "total_steps": 20825, "loss": 0.9024, "learning_rate": 4.991517101010015e-05, "epoch": 0.07298919567827131, "percentage": 7.3, "elapsed_time": "1:55:09", "remaining_time": "1 day, 0:22:30", "throughput": 1802.23, "total_tokens": 12451840} +{"current_steps": 1530, "total_steps": 20825, "loss": 1.0432, "learning_rate": 4.9911878921468304e-05, "epoch": 0.07346938775510205, "percentage": 7.35, "elapsed_time": "1:55:54", "remaining_time": "1 day, 0:21:43", "throughput": 1802.26, "total_tokens": 12533760} +{"current_steps": 1540, "total_steps": 20825, "loss": 0.9204, "learning_rate": 4.990852427528427e-05, "epoch": 0.07394957983193277, "percentage": 7.39, "elapsed_time": "1:56:39", "remaining_time": "1 day, 0:20:55", "throughput": 1802.32, "total_tokens": 12615680} +{"current_steps": 1550, "total_steps": 20825, "loss": 0.9548, "learning_rate": 4.9905107079972064e-05, "epoch": 0.0744297719087635, "percentage": 7.44, "elapsed_time": "1:57:25", "remaining_time": "1 day, 0:20:10", "throughput": 1802.3, "total_tokens": 12697600} +{"current_steps": 1560, "total_steps": 20825, "loss": 0.9657, "learning_rate": 4.990162734411279e-05, "epoch": 0.07490996398559424, "percentage": 7.49, "elapsed_time": "1:58:10", "remaining_time": "1 day, 0:19:21", "throughput": 1802.37, "total_tokens": 12779520} +{"current_steps": 1570, "total_steps": 20825, "loss": 1.0059, "learning_rate": 4.989808507644461e-05, "epoch": 0.07539015606242497, "percentage": 7.54, "elapsed_time": "1:58:55", "remaining_time": "1 day, 0:18:33", "throughput": 1802.43, "total_tokens": 12861440} +{"current_steps": 1580, "total_steps": 20825, "loss": 0.9245, "learning_rate": 4.989448028586269e-05, "epoch": 0.07587034813925571, "percentage": 7.59, "elapsed_time": "1:59:40", "remaining_time": "1 day, 0:17:43", "throughput": 1802.53, "total_tokens": 12943360} +{"current_steps": 1590, "total_steps": 20825, "loss": 0.8293, "learning_rate": 4.989081298141921e-05, "epoch": 0.07635054021608643, "percentage": 7.64, "elapsed_time": "2:00:26", "remaining_time": "1 day, 0:16:57", "throughput": 1802.53, "total_tokens": 13025280} +{"current_steps": 1600, "total_steps": 20825, "loss": 0.8068, "learning_rate": 4.988708317232334e-05, "epoch": 0.07683073229291716, "percentage": 7.68, "elapsed_time": "2:01:11", "remaining_time": "1 day, 0:16:10", "throughput": 1802.56, "total_tokens": 13107200} +{"current_steps": 1610, "total_steps": 20825, "loss": 0.8037, "learning_rate": 4.988329086794122e-05, "epoch": 0.0773109243697479, "percentage": 7.73, "elapsed_time": "2:01:56", "remaining_time": "1 day, 0:15:26", "throughput": 1802.54, "total_tokens": 13189120} +{"current_steps": 1620, "total_steps": 20825, "loss": 1.1678, "learning_rate": 4.9879436077795884e-05, "epoch": 0.07779111644657863, "percentage": 7.78, "elapsed_time": "2:02:42", "remaining_time": "1 day, 0:14:44", "throughput": 1802.47, "total_tokens": 13271040} +{"current_steps": 1630, "total_steps": 20825, "loss": 0.946, "learning_rate": 4.98755188115673e-05, "epoch": 0.07827130852340937, "percentage": 7.83, "elapsed_time": "2:03:28", "remaining_time": "1 day, 0:13:58", "throughput": 1802.48, "total_tokens": 13352960} +{"current_steps": 1640, "total_steps": 20825, "loss": 0.9426, "learning_rate": 4.9871539079092344e-05, "epoch": 0.0787515006002401, "percentage": 7.88, "elapsed_time": "2:04:13", "remaining_time": "1 day, 0:13:08", "throughput": 1802.56, "total_tokens": 13434880} +{"current_steps": 1650, "total_steps": 20825, "loss": 1.0174, "learning_rate": 4.9867496890364726e-05, "epoch": 0.07923169267707082, "percentage": 7.92, "elapsed_time": "2:04:58", "remaining_time": "1 day, 0:12:21", "throughput": 1802.61, "total_tokens": 13516800} +{"current_steps": 1660, "total_steps": 20825, "loss": 1.1374, "learning_rate": 4.9863392255535e-05, "epoch": 0.07971188475390156, "percentage": 7.97, "elapsed_time": "2:05:44", "remaining_time": "1 day, 0:11:41", "throughput": 1802.48, "total_tokens": 13598720} +{"current_steps": 1670, "total_steps": 20825, "loss": 0.9507, "learning_rate": 4.985922518491054e-05, "epoch": 0.08019207683073229, "percentage": 8.02, "elapsed_time": "2:06:29", "remaining_time": "1 day, 0:10:54", "throughput": 1802.52, "total_tokens": 13680640} +{"current_steps": 1680, "total_steps": 20825, "loss": 1.0419, "learning_rate": 4.9854995688955494e-05, "epoch": 0.08067226890756303, "percentage": 8.07, "elapsed_time": "2:07:14", "remaining_time": "1 day, 0:10:06", "throughput": 1802.57, "total_tokens": 13762560} +{"current_steps": 1690, "total_steps": 20825, "loss": 1.1634, "learning_rate": 4.9850703778290784e-05, "epoch": 0.08115246098439376, "percentage": 8.12, "elapsed_time": "2:08:00", "remaining_time": "1 day, 0:09:19", "throughput": 1802.61, "total_tokens": 13844480} +{"current_steps": 1700, "total_steps": 20825, "loss": 1.0925, "learning_rate": 4.984634946369404e-05, "epoch": 0.08163265306122448, "percentage": 8.16, "elapsed_time": "2:08:45", "remaining_time": "1 day, 0:08:36", "throughput": 1802.56, "total_tokens": 13926400} +{"current_steps": 1710, "total_steps": 20825, "loss": 1.2723, "learning_rate": 4.984193275609964e-05, "epoch": 0.08211284513805522, "percentage": 8.21, "elapsed_time": "2:09:31", "remaining_time": "1 day, 0:07:47", "throughput": 1802.63, "total_tokens": 14008320} +{"current_steps": 1720, "total_steps": 20825, "loss": 0.9903, "learning_rate": 4.983745366659859e-05, "epoch": 0.08259303721488595, "percentage": 8.26, "elapsed_time": "2:10:16", "remaining_time": "1 day, 0:06:59", "throughput": 1802.69, "total_tokens": 14090240} +{"current_steps": 1730, "total_steps": 20825, "loss": 0.9931, "learning_rate": 4.983291220643858e-05, "epoch": 0.08307322929171669, "percentage": 8.31, "elapsed_time": "2:11:01", "remaining_time": "1 day, 0:06:10", "throughput": 1802.75, "total_tokens": 14172160} +{"current_steps": 1740, "total_steps": 20825, "loss": 1.0356, "learning_rate": 4.982830838702392e-05, "epoch": 0.08355342136854742, "percentage": 8.36, "elapsed_time": "2:11:46", "remaining_time": "1 day, 0:05:22", "throughput": 1802.82, "total_tokens": 14254080} +{"current_steps": 1750, "total_steps": 20825, "loss": 0.9048, "learning_rate": 4.98236422199155e-05, "epoch": 0.08403361344537816, "percentage": 8.4, "elapsed_time": "2:12:31", "remaining_time": "1 day, 0:04:33", "throughput": 1802.89, "total_tokens": 14336000} +{"current_steps": 1760, "total_steps": 20825, "loss": 0.9876, "learning_rate": 4.9818913716830784e-05, "epoch": 0.08451380552220888, "percentage": 8.45, "elapsed_time": "2:13:17", "remaining_time": "1 day, 0:03:49", "throughput": 1802.86, "total_tokens": 14417920} +{"current_steps": 1770, "total_steps": 20825, "loss": 1.0288, "learning_rate": 4.981412288964377e-05, "epoch": 0.08499399759903961, "percentage": 8.5, "elapsed_time": "2:14:02", "remaining_time": "1 day, 0:03:01", "throughput": 1802.91, "total_tokens": 14499840} +{"current_steps": 1780, "total_steps": 20825, "loss": 1.0098, "learning_rate": 4.9809269750384956e-05, "epoch": 0.08547418967587035, "percentage": 8.55, "elapsed_time": "2:14:47", "remaining_time": "1 day, 0:02:15", "throughput": 1802.93, "total_tokens": 14581760} +{"current_steps": 1790, "total_steps": 20825, "loss": 1.1153, "learning_rate": 4.980435431124133e-05, "epoch": 0.08595438175270108, "percentage": 8.6, "elapsed_time": "2:15:33", "remaining_time": "1 day, 0:01:30", "throughput": 1802.91, "total_tokens": 14663680} +{"current_steps": 1800, "total_steps": 20825, "loss": 0.9484, "learning_rate": 4.97993765845563e-05, "epoch": 0.08643457382953182, "percentage": 8.64, "elapsed_time": "2:16:18", "remaining_time": "1 day, 0:00:44", "throughput": 1802.92, "total_tokens": 14745600} +{"current_steps": 1810, "total_steps": 20825, "loss": 0.9613, "learning_rate": 4.9794336582829714e-05, "epoch": 0.08691476590636255, "percentage": 8.69, "elapsed_time": "2:17:03", "remaining_time": "23:59:55", "throughput": 1803.0, "total_tokens": 14827520} +{"current_steps": 1820, "total_steps": 20825, "loss": 1.0271, "learning_rate": 4.9789234318717784e-05, "epoch": 0.08739495798319327, "percentage": 8.74, "elapsed_time": "2:17:48", "remaining_time": "23:59:06", "throughput": 1803.06, "total_tokens": 14909440} +{"current_steps": 1830, "total_steps": 20825, "loss": 1.0182, "learning_rate": 4.978406980503308e-05, "epoch": 0.08787515006002401, "percentage": 8.79, "elapsed_time": "2:18:34", "remaining_time": "23:58:18", "throughput": 1803.13, "total_tokens": 14991360} +{"current_steps": 1840, "total_steps": 20825, "loss": 0.9922, "learning_rate": 4.9778843054744494e-05, "epoch": 0.08835534213685474, "percentage": 8.84, "elapsed_time": "2:19:19", "remaining_time": "23:57:33", "throughput": 1803.12, "total_tokens": 15073280} +{"current_steps": 1850, "total_steps": 20825, "loss": 0.9673, "learning_rate": 4.977355408097719e-05, "epoch": 0.08883553421368548, "percentage": 8.88, "elapsed_time": "2:20:04", "remaining_time": "23:56:44", "throughput": 1803.2, "total_tokens": 15155200} +{"current_steps": 1860, "total_steps": 20825, "loss": 0.8494, "learning_rate": 4.9768202897012595e-05, "epoch": 0.0893157262905162, "percentage": 8.93, "elapsed_time": "2:20:49", "remaining_time": "23:55:55", "throughput": 1803.26, "total_tokens": 15237120} +{"current_steps": 1870, "total_steps": 20825, "loss": 1.0266, "learning_rate": 4.9762789516288354e-05, "epoch": 0.08979591836734693, "percentage": 8.98, "elapsed_time": "2:21:34", "remaining_time": "23:55:08", "throughput": 1803.31, "total_tokens": 15319040} +{"current_steps": 1880, "total_steps": 20825, "loss": 0.9799, "learning_rate": 4.97573139523983e-05, "epoch": 0.09027611044417767, "percentage": 9.03, "elapsed_time": "2:22:20", "remaining_time": "23:54:21", "throughput": 1803.34, "total_tokens": 15400960} +{"current_steps": 1890, "total_steps": 20825, "loss": 1.0606, "learning_rate": 4.9751776219092405e-05, "epoch": 0.0907563025210084, "percentage": 9.08, "elapsed_time": "2:23:05", "remaining_time": "23:53:35", "throughput": 1803.34, "total_tokens": 15482880} +{"current_steps": 1900, "total_steps": 20825, "loss": 0.8944, "learning_rate": 4.9746176330276783e-05, "epoch": 0.09123649459783914, "percentage": 9.12, "elapsed_time": "2:23:51", "remaining_time": "23:52:52", "throughput": 1803.3, "total_tokens": 15564800} +{"current_steps": 1910, "total_steps": 20825, "loss": 1.0702, "learning_rate": 4.97405143000136e-05, "epoch": 0.09171668667466987, "percentage": 9.17, "elapsed_time": "2:24:36", "remaining_time": "23:52:04", "throughput": 1803.34, "total_tokens": 15646720} +{"current_steps": 1920, "total_steps": 20825, "loss": 1.0714, "learning_rate": 4.9734790142521096e-05, "epoch": 0.0921968787515006, "percentage": 9.22, "elapsed_time": "2:25:22", "remaining_time": "23:51:21", "throughput": 1803.29, "total_tokens": 15728640} +{"current_steps": 1930, "total_steps": 20825, "loss": 1.1282, "learning_rate": 4.9729003872173494e-05, "epoch": 0.09267707082833133, "percentage": 9.27, "elapsed_time": "2:26:07", "remaining_time": "23:50:37", "throughput": 1803.27, "total_tokens": 15810560} +{"current_steps": 1940, "total_steps": 20825, "loss": 0.9172, "learning_rate": 4.972315550350102e-05, "epoch": 0.09315726290516206, "percentage": 9.32, "elapsed_time": "2:26:53", "remaining_time": "23:49:53", "throughput": 1803.24, "total_tokens": 15892480} +{"current_steps": 1950, "total_steps": 20825, "loss": 0.9888, "learning_rate": 4.971724505118982e-05, "epoch": 0.0936374549819928, "percentage": 9.36, "elapsed_time": "2:27:38", "remaining_time": "23:49:05", "throughput": 1803.3, "total_tokens": 15974400} +{"current_steps": 1960, "total_steps": 20825, "loss": 1.052, "learning_rate": 4.971127253008194e-05, "epoch": 0.09411764705882353, "percentage": 9.41, "elapsed_time": "2:28:24", "remaining_time": "23:48:21", "throughput": 1803.26, "total_tokens": 16056320} +{"current_steps": 1970, "total_steps": 20825, "loss": 1.0703, "learning_rate": 4.970523795517532e-05, "epoch": 0.09459783913565427, "percentage": 9.46, "elapsed_time": "2:29:09", "remaining_time": "23:47:34", "throughput": 1803.29, "total_tokens": 16138240} +{"current_steps": 1980, "total_steps": 20825, "loss": 0.8602, "learning_rate": 4.969914134162368e-05, "epoch": 0.095078031212485, "percentage": 9.51, "elapsed_time": "2:29:54", "remaining_time": "23:46:49", "throughput": 1803.28, "total_tokens": 16220160} +{"current_steps": 1990, "total_steps": 20825, "loss": 0.914, "learning_rate": 4.9692982704736566e-05, "epoch": 0.09555822328931572, "percentage": 9.56, "elapsed_time": "2:30:40", "remaining_time": "23:46:03", "throughput": 1803.29, "total_tokens": 16302080} +{"current_steps": 2000, "total_steps": 20825, "loss": 0.8096, "learning_rate": 4.968676205997925e-05, "epoch": 0.09603841536614646, "percentage": 9.6, "elapsed_time": "2:31:25", "remaining_time": "23:45:17", "throughput": 1803.3, "total_tokens": 16384000} +{"current_steps": 2010, "total_steps": 20825, "loss": 1.0233, "learning_rate": 4.9680479422972735e-05, "epoch": 0.09651860744297719, "percentage": 9.65, "elapsed_time": "2:32:14", "remaining_time": "23:45:04", "throughput": 1802.63, "total_tokens": 16465920} +{"current_steps": 2020, "total_steps": 20825, "loss": 0.9492, "learning_rate": 4.9674134809493686e-05, "epoch": 0.09699879951980793, "percentage": 9.7, "elapsed_time": "2:32:59", "remaining_time": "23:44:15", "throughput": 1802.7, "total_tokens": 16547840} +{"current_steps": 2030, "total_steps": 20825, "loss": 0.9868, "learning_rate": 4.9667728235474396e-05, "epoch": 0.09747899159663866, "percentage": 9.75, "elapsed_time": "2:33:44", "remaining_time": "23:43:27", "throughput": 1802.75, "total_tokens": 16629760} +{"current_steps": 2040, "total_steps": 20825, "loss": 0.8727, "learning_rate": 4.9661259717002764e-05, "epoch": 0.09795918367346938, "percentage": 9.8, "elapsed_time": "2:34:30", "remaining_time": "23:42:42", "throughput": 1802.73, "total_tokens": 16711680} +{"current_steps": 2050, "total_steps": 20825, "loss": 1.0359, "learning_rate": 4.9654729270322234e-05, "epoch": 0.09843937575030012, "percentage": 9.84, "elapsed_time": "2:35:15", "remaining_time": "23:41:54", "throughput": 1802.8, "total_tokens": 16793600} +{"current_steps": 2060, "total_steps": 20825, "loss": 0.9957, "learning_rate": 4.964813691183174e-05, "epoch": 0.09891956782713085, "percentage": 9.89, "elapsed_time": "2:36:00", "remaining_time": "23:41:06", "throughput": 1802.86, "total_tokens": 16875520} +{"current_steps": 2070, "total_steps": 20825, "loss": 0.8838, "learning_rate": 4.964148265808573e-05, "epoch": 0.09939975990396159, "percentage": 9.94, "elapsed_time": "2:36:45", "remaining_time": "23:40:16", "throughput": 1802.94, "total_tokens": 16957440} +{"current_steps": 2080, "total_steps": 20825, "loss": 0.8697, "learning_rate": 4.963476652579404e-05, "epoch": 0.09987995198079232, "percentage": 9.99, "elapsed_time": "2:37:30", "remaining_time": "23:39:28", "throughput": 1803.01, "total_tokens": 17039360} +{"current_steps": 2090, "total_steps": 20825, "loss": 1.1534, "learning_rate": 4.962798853182192e-05, "epoch": 0.10036014405762304, "percentage": 10.04, "elapsed_time": "2:38:16", "remaining_time": "23:38:43", "throughput": 1802.99, "total_tokens": 17121280} +{"current_steps": 2100, "total_steps": 20825, "loss": 1.1309, "learning_rate": 4.9621148693189954e-05, "epoch": 0.10084033613445378, "percentage": 10.08, "elapsed_time": "2:39:01", "remaining_time": "23:37:57", "throughput": 1803.01, "total_tokens": 17203200} +{"current_steps": 2110, "total_steps": 20825, "loss": 1.208, "learning_rate": 4.9614247027074024e-05, "epoch": 0.10132052821128451, "percentage": 10.13, "elapsed_time": "2:39:46", "remaining_time": "23:37:09", "throughput": 1803.06, "total_tokens": 17285120} +{"current_steps": 2120, "total_steps": 20825, "loss": 0.8207, "learning_rate": 4.960728355080527e-05, "epoch": 0.10180072028811525, "percentage": 10.18, "elapsed_time": "2:40:31", "remaining_time": "23:36:20", "throughput": 1803.14, "total_tokens": 17367040} +{"current_steps": 2130, "total_steps": 20825, "loss": 0.914, "learning_rate": 4.9600258281870046e-05, "epoch": 0.10228091236494598, "percentage": 10.23, "elapsed_time": "2:41:16", "remaining_time": "23:35:34", "throughput": 1803.14, "total_tokens": 17448960} +{"current_steps": 2140, "total_steps": 20825, "loss": 0.9198, "learning_rate": 4.959317123790988e-05, "epoch": 0.1027611044417767, "percentage": 10.28, "elapsed_time": "2:42:02", "remaining_time": "23:34:48", "throughput": 1803.16, "total_tokens": 17530880} +{"current_steps": 2150, "total_steps": 20825, "loss": 0.9969, "learning_rate": 4.958602243672145e-05, "epoch": 0.10324129651860744, "percentage": 10.32, "elapsed_time": "2:42:47", "remaining_time": "23:33:59", "throughput": 1803.23, "total_tokens": 17612800} +{"current_steps": 2160, "total_steps": 20825, "loss": 0.9702, "learning_rate": 4.9578811896256475e-05, "epoch": 0.10372148859543817, "percentage": 10.37, "elapsed_time": "2:43:32", "remaining_time": "23:33:11", "throughput": 1803.29, "total_tokens": 17694720} +{"current_steps": 2170, "total_steps": 20825, "loss": 0.9843, "learning_rate": 4.957153963462172e-05, "epoch": 0.10420168067226891, "percentage": 10.42, "elapsed_time": "2:44:17", "remaining_time": "23:32:23", "throughput": 1803.35, "total_tokens": 17776640} +{"current_steps": 2180, "total_steps": 20825, "loss": 0.9514, "learning_rate": 4.9564205670078965e-05, "epoch": 0.10468187274909964, "percentage": 10.47, "elapsed_time": "2:45:03", "remaining_time": "23:31:40", "throughput": 1803.29, "total_tokens": 17858560} +{"current_steps": 2190, "total_steps": 20825, "loss": 0.9166, "learning_rate": 4.955681002104492e-05, "epoch": 0.10516206482593037, "percentage": 10.52, "elapsed_time": "2:45:48", "remaining_time": "23:30:53", "throughput": 1803.33, "total_tokens": 17940480} +{"current_steps": 2200, "total_steps": 20825, "loss": 0.9447, "learning_rate": 4.954935270609119e-05, "epoch": 0.1056422569027611, "percentage": 10.56, "elapsed_time": "2:46:33", "remaining_time": "23:30:05", "throughput": 1803.37, "total_tokens": 18022400} +{"current_steps": 2210, "total_steps": 20825, "loss": 1.0235, "learning_rate": 4.9541833743944244e-05, "epoch": 0.10612244897959183, "percentage": 10.61, "elapsed_time": "2:47:19", "remaining_time": "23:29:19", "throughput": 1803.4, "total_tokens": 18104320} +{"current_steps": 2220, "total_steps": 20825, "loss": 0.9329, "learning_rate": 4.953425315348534e-05, "epoch": 0.10660264105642257, "percentage": 10.66, "elapsed_time": "2:48:04", "remaining_time": "23:28:30", "throughput": 1803.47, "total_tokens": 18186240} +{"current_steps": 2230, "total_steps": 20825, "loss": 1.0003, "learning_rate": 4.952661095375051e-05, "epoch": 0.1070828331332533, "percentage": 10.71, "elapsed_time": "2:48:49", "remaining_time": "23:27:42", "throughput": 1803.52, "total_tokens": 18268160} +{"current_steps": 2240, "total_steps": 20825, "loss": 0.852, "learning_rate": 4.95189071639305e-05, "epoch": 0.10756302521008404, "percentage": 10.76, "elapsed_time": "2:49:34", "remaining_time": "23:26:55", "throughput": 1803.55, "total_tokens": 18350080} +{"current_steps": 2250, "total_steps": 20825, "loss": 0.8421, "learning_rate": 4.951114180337069e-05, "epoch": 0.10804321728691477, "percentage": 10.8, "elapsed_time": "2:50:19", "remaining_time": "23:26:11", "throughput": 1803.52, "total_tokens": 18432000} +{"current_steps": 2260, "total_steps": 20825, "loss": 0.7993, "learning_rate": 4.95033148915711e-05, "epoch": 0.1085234093637455, "percentage": 10.85, "elapsed_time": "2:51:05", "remaining_time": "23:25:25", "throughput": 1803.53, "total_tokens": 18513920} +{"current_steps": 2270, "total_steps": 20825, "loss": 0.8758, "learning_rate": 4.949542644818631e-05, "epoch": 0.10900360144057623, "percentage": 10.9, "elapsed_time": "2:51:50", "remaining_time": "23:24:38", "throughput": 1803.57, "total_tokens": 18595840} +{"current_steps": 2280, "total_steps": 20825, "loss": 1.0688, "learning_rate": 4.948747649302542e-05, "epoch": 0.10948379351740696, "percentage": 10.95, "elapsed_time": "2:52:35", "remaining_time": "23:23:49", "throughput": 1803.64, "total_tokens": 18677760} +{"current_steps": 2290, "total_steps": 20825, "loss": 0.9846, "learning_rate": 4.947946504605198e-05, "epoch": 0.1099639855942377, "percentage": 11.0, "elapsed_time": "2:53:20", "remaining_time": "23:23:01", "throughput": 1803.7, "total_tokens": 18759680} +{"current_steps": 2300, "total_steps": 20825, "loss": 0.9205, "learning_rate": 4.947139212738395e-05, "epoch": 0.11044417767106843, "percentage": 11.04, "elapsed_time": "2:54:05", "remaining_time": "23:22:13", "throughput": 1803.75, "total_tokens": 18841600} +{"current_steps": 2310, "total_steps": 20825, "loss": 1.0461, "learning_rate": 4.946325775729368e-05, "epoch": 0.11092436974789915, "percentage": 11.09, "elapsed_time": "2:54:51", "remaining_time": "23:21:30", "throughput": 1803.71, "total_tokens": 18923520} +{"current_steps": 2320, "total_steps": 20825, "loss": 0.9106, "learning_rate": 4.945506195620784e-05, "epoch": 0.1114045618247299, "percentage": 11.14, "elapsed_time": "2:55:36", "remaining_time": "23:20:43", "throughput": 1803.74, "total_tokens": 19005440} +{"current_steps": 2330, "total_steps": 20825, "loss": 0.9038, "learning_rate": 4.944680474470731e-05, "epoch": 0.11188475390156062, "percentage": 11.19, "elapsed_time": "2:56:21", "remaining_time": "23:19:57", "throughput": 1803.76, "total_tokens": 19087360} +{"current_steps": 2340, "total_steps": 20825, "loss": 1.1003, "learning_rate": 4.943848614352724e-05, "epoch": 0.11236494597839136, "percentage": 11.24, "elapsed_time": "2:57:07", "remaining_time": "23:19:10", "throughput": 1803.78, "total_tokens": 19169280} +{"current_steps": 2350, "total_steps": 20825, "loss": 0.8852, "learning_rate": 4.943010617355691e-05, "epoch": 0.11284513805522209, "percentage": 11.28, "elapsed_time": "2:57:52", "remaining_time": "23:18:23", "throughput": 1803.83, "total_tokens": 19251200} +{"current_steps": 2360, "total_steps": 20825, "loss": 0.9907, "learning_rate": 4.94216648558397e-05, "epoch": 0.11332533013205282, "percentage": 11.33, "elapsed_time": "2:58:37", "remaining_time": "23:17:34", "throughput": 1803.89, "total_tokens": 19333120} +{"current_steps": 2370, "total_steps": 20825, "loss": 0.8463, "learning_rate": 4.9413162211573075e-05, "epoch": 0.11380552220888356, "percentage": 11.38, "elapsed_time": "2:59:22", "remaining_time": "23:16:49", "throughput": 1803.9, "total_tokens": 19415040} +{"current_steps": 2380, "total_steps": 20825, "loss": 1.3157, "learning_rate": 4.9404598262108456e-05, "epoch": 0.11428571428571428, "percentage": 11.43, "elapsed_time": "3:00:08", "remaining_time": "23:16:04", "throughput": 1803.89, "total_tokens": 19496960} +{"current_steps": 2390, "total_steps": 20825, "loss": 1.0501, "learning_rate": 4.939597302895125e-05, "epoch": 0.11476590636254502, "percentage": 11.48, "elapsed_time": "3:00:53", "remaining_time": "23:15:17", "throughput": 1803.91, "total_tokens": 19578880} +{"current_steps": 2400, "total_steps": 20825, "loss": 0.9628, "learning_rate": 4.938728653376075e-05, "epoch": 0.11524609843937575, "percentage": 11.52, "elapsed_time": "3:01:38", "remaining_time": "23:14:29", "throughput": 1803.96, "total_tokens": 19660800} +{"current_steps": 2410, "total_steps": 20825, "loss": 0.8814, "learning_rate": 4.9378538798350046e-05, "epoch": 0.11572629051620648, "percentage": 11.57, "elapsed_time": "3:02:23", "remaining_time": "23:13:43", "throughput": 1803.99, "total_tokens": 19742720} +{"current_steps": 2420, "total_steps": 20825, "loss": 0.8009, "learning_rate": 4.936972984468608e-05, "epoch": 0.11620648259303722, "percentage": 11.62, "elapsed_time": "3:03:09", "remaining_time": "23:13:02", "throughput": 1803.88, "total_tokens": 19824640} +{"current_steps": 2430, "total_steps": 20825, "loss": 0.8686, "learning_rate": 4.936085969488947e-05, "epoch": 0.11668667466986794, "percentage": 11.67, "elapsed_time": "3:03:55", "remaining_time": "23:12:16", "throughput": 1803.91, "total_tokens": 19906560} +{"current_steps": 2440, "total_steps": 20825, "loss": 0.7769, "learning_rate": 4.9351928371234525e-05, "epoch": 0.11716686674669868, "percentage": 11.72, "elapsed_time": "3:04:40", "remaining_time": "23:11:30", "throughput": 1803.92, "total_tokens": 19988480} +{"current_steps": 2450, "total_steps": 20825, "loss": 0.8771, "learning_rate": 4.934293589614917e-05, "epoch": 0.11764705882352941, "percentage": 11.76, "elapsed_time": "3:05:25", "remaining_time": "23:10:43", "throughput": 1803.95, "total_tokens": 20070400} +{"current_steps": 2460, "total_steps": 20825, "loss": 1.0355, "learning_rate": 4.93338822922149e-05, "epoch": 0.11812725090036015, "percentage": 11.81, "elapsed_time": "3:06:11", "remaining_time": "23:09:58", "throughput": 1803.94, "total_tokens": 20152320} +{"current_steps": 2470, "total_steps": 20825, "loss": 0.9881, "learning_rate": 4.932476758216669e-05, "epoch": 0.11860744297719088, "percentage": 11.86, "elapsed_time": "3:06:56", "remaining_time": "23:09:11", "throughput": 1803.97, "total_tokens": 20234240} +{"current_steps": 2480, "total_steps": 20825, "loss": 0.9443, "learning_rate": 4.931559178889297e-05, "epoch": 0.1190876350540216, "percentage": 11.91, "elapsed_time": "3:07:41", "remaining_time": "23:08:24", "throughput": 1804.01, "total_tokens": 20316160} +{"current_steps": 2490, "total_steps": 20825, "loss": 1.0363, "learning_rate": 4.9306354935435594e-05, "epoch": 0.11956782713085234, "percentage": 11.96, "elapsed_time": "3:08:27", "remaining_time": "23:07:38", "throughput": 1804.02, "total_tokens": 20398080} +{"current_steps": 2500, "total_steps": 20825, "loss": 1.0079, "learning_rate": 4.929705704498969e-05, "epoch": 0.12004801920768307, "percentage": 12.0, "elapsed_time": "3:09:12", "remaining_time": "23:06:51", "throughput": 1804.05, "total_tokens": 20480000} +{"current_steps": 2510, "total_steps": 20825, "loss": 0.9076, "learning_rate": 4.928769814090371e-05, "epoch": 0.12052821128451381, "percentage": 12.05, "elapsed_time": "3:09:57", "remaining_time": "23:06:04", "throughput": 1804.09, "total_tokens": 20561920} +{"current_steps": 2520, "total_steps": 20825, "loss": 1.0913, "learning_rate": 4.927827824667929e-05, "epoch": 0.12100840336134454, "percentage": 12.1, "elapsed_time": "3:10:42", "remaining_time": "23:05:17", "throughput": 1804.13, "total_tokens": 20643840} +{"current_steps": 2530, "total_steps": 20825, "loss": 1.0558, "learning_rate": 4.926879738597122e-05, "epoch": 0.12148859543817526, "percentage": 12.15, "elapsed_time": "3:11:27", "remaining_time": "23:04:30", "throughput": 1804.17, "total_tokens": 20725760} +{"current_steps": 2540, "total_steps": 20825, "loss": 1.1955, "learning_rate": 4.925925558258741e-05, "epoch": 0.121968787515006, "percentage": 12.2, "elapsed_time": "3:12:13", "remaining_time": "23:03:47", "throughput": 1804.11, "total_tokens": 20807680} +{"current_steps": 2550, "total_steps": 20825, "loss": 0.9205, "learning_rate": 4.924965286048879e-05, "epoch": 0.12244897959183673, "percentage": 12.24, "elapsed_time": "3:12:58", "remaining_time": "23:03:01", "throughput": 1804.12, "total_tokens": 20889600} +{"current_steps": 2560, "total_steps": 20825, "loss": 1.0418, "learning_rate": 4.9239989243789275e-05, "epoch": 0.12292917166866747, "percentage": 12.29, "elapsed_time": "3:13:44", "remaining_time": "23:02:17", "throughput": 1804.09, "total_tokens": 20971520} +{"current_steps": 2570, "total_steps": 20825, "loss": 1.0242, "learning_rate": 4.9230264756755685e-05, "epoch": 0.1234093637454982, "percentage": 12.34, "elapsed_time": "3:14:29", "remaining_time": "23:01:31", "throughput": 1804.11, "total_tokens": 21053440} +{"current_steps": 2580, "total_steps": 20825, "loss": 0.9804, "learning_rate": 4.9220479423807694e-05, "epoch": 0.12388955582232893, "percentage": 12.39, "elapsed_time": "3:15:15", "remaining_time": "23:00:46", "throughput": 1804.09, "total_tokens": 21135360} +{"current_steps": 2590, "total_steps": 20825, "loss": 1.0083, "learning_rate": 4.9210633269517776e-05, "epoch": 0.12436974789915967, "percentage": 12.44, "elapsed_time": "3:16:00", "remaining_time": "22:59:58", "throughput": 1804.15, "total_tokens": 21217280} +{"current_steps": 2600, "total_steps": 20825, "loss": 0.9283, "learning_rate": 4.920072631861115e-05, "epoch": 0.12484993997599039, "percentage": 12.48, "elapsed_time": "3:16:45", "remaining_time": "22:59:12", "throughput": 1804.17, "total_tokens": 21299200} +{"current_steps": 2610, "total_steps": 20825, "loss": 1.1134, "learning_rate": 4.919075859596567e-05, "epoch": 0.12533013205282112, "percentage": 12.53, "elapsed_time": "3:17:30", "remaining_time": "22:58:25", "throughput": 1804.2, "total_tokens": 21381120} +{"current_steps": 2620, "total_steps": 20825, "loss": 1.1302, "learning_rate": 4.918073012661183e-05, "epoch": 0.12581032412965187, "percentage": 12.58, "elapsed_time": "3:18:15", "remaining_time": "22:57:38", "throughput": 1804.23, "total_tokens": 21463040} +{"current_steps": 2630, "total_steps": 20825, "loss": 1.0637, "learning_rate": 4.9170640935732654e-05, "epoch": 0.1262905162064826, "percentage": 12.63, "elapsed_time": "3:19:01", "remaining_time": "22:56:54", "throughput": 1804.21, "total_tokens": 21544960} +{"current_steps": 2640, "total_steps": 20825, "loss": 0.8478, "learning_rate": 4.916049104866365e-05, "epoch": 0.12677070828331333, "percentage": 12.68, "elapsed_time": "3:19:47", "remaining_time": "22:56:10", "throughput": 1804.18, "total_tokens": 21626880} +{"current_steps": 2650, "total_steps": 20825, "loss": 0.9934, "learning_rate": 4.915028049089274e-05, "epoch": 0.12725090036014405, "percentage": 12.73, "elapsed_time": "3:20:32", "remaining_time": "22:55:24", "throughput": 1804.19, "total_tokens": 21708800} +{"current_steps": 2660, "total_steps": 20825, "loss": 0.9332, "learning_rate": 4.914000928806021e-05, "epoch": 0.12773109243697478, "percentage": 12.77, "elapsed_time": "3:21:17", "remaining_time": "22:54:38", "throughput": 1804.2, "total_tokens": 21790720} +{"current_steps": 2670, "total_steps": 20825, "loss": 1.0782, "learning_rate": 4.912967746595861e-05, "epoch": 0.12821128451380553, "percentage": 12.82, "elapsed_time": "3:22:03", "remaining_time": "22:53:52", "throughput": 1804.2, "total_tokens": 21872640} +{"current_steps": 2680, "total_steps": 20825, "loss": 1.1305, "learning_rate": 4.911928505053275e-05, "epoch": 0.12869147659063626, "percentage": 12.87, "elapsed_time": "3:22:48", "remaining_time": "22:53:08", "throughput": 1804.19, "total_tokens": 21954560} +{"current_steps": 2690, "total_steps": 20825, "loss": 0.9965, "learning_rate": 4.9108832067879574e-05, "epoch": 0.129171668667467, "percentage": 12.92, "elapsed_time": "3:23:34", "remaining_time": "22:52:23", "throughput": 1804.18, "total_tokens": 22036480} +{"current_steps": 2700, "total_steps": 20825, "loss": 0.8051, "learning_rate": 4.909831854424812e-05, "epoch": 0.12965186074429771, "percentage": 12.97, "elapsed_time": "3:24:19", "remaining_time": "22:51:37", "throughput": 1804.18, "total_tokens": 22118400} +{"current_steps": 2710, "total_steps": 20825, "loss": 0.9556, "learning_rate": 4.908774450603946e-05, "epoch": 0.13013205282112844, "percentage": 13.01, "elapsed_time": "3:25:04", "remaining_time": "22:50:50", "throughput": 1804.21, "total_tokens": 22200320} +{"current_steps": 2720, "total_steps": 20825, "loss": 1.0562, "learning_rate": 4.907710997980664e-05, "epoch": 0.1306122448979592, "percentage": 13.06, "elapsed_time": "3:25:49", "remaining_time": "22:50:03", "throughput": 1804.25, "total_tokens": 22282240} +{"current_steps": 2730, "total_steps": 20825, "loss": 0.9203, "learning_rate": 4.906641499225457e-05, "epoch": 0.13109243697478992, "percentage": 13.11, "elapsed_time": "3:26:34", "remaining_time": "22:49:16", "throughput": 1804.29, "total_tokens": 22364160} +{"current_steps": 2740, "total_steps": 20825, "loss": 0.9196, "learning_rate": 4.905565957024003e-05, "epoch": 0.13157262905162065, "percentage": 13.16, "elapsed_time": "3:27:20", "remaining_time": "22:48:34", "throughput": 1804.21, "total_tokens": 22446080} +{"current_steps": 2750, "total_steps": 20825, "loss": 0.9674, "learning_rate": 4.9044843740771505e-05, "epoch": 0.13205282112845138, "percentage": 13.21, "elapsed_time": "3:28:06", "remaining_time": "22:47:48", "throughput": 1804.23, "total_tokens": 22528000} +{"current_steps": 2760, "total_steps": 20825, "loss": 1.1255, "learning_rate": 4.9033967531009225e-05, "epoch": 0.1325330132052821, "percentage": 13.25, "elapsed_time": "3:28:51", "remaining_time": "22:47:03", "throughput": 1804.23, "total_tokens": 22609920} +{"current_steps": 2770, "total_steps": 20825, "loss": 1.1679, "learning_rate": 4.902303096826502e-05, "epoch": 0.13301320528211286, "percentage": 13.3, "elapsed_time": "3:29:36", "remaining_time": "22:46:16", "throughput": 1804.26, "total_tokens": 22691840} +{"current_steps": 2780, "total_steps": 20825, "loss": 0.8948, "learning_rate": 4.901203408000227e-05, "epoch": 0.13349339735894358, "percentage": 13.35, "elapsed_time": "3:30:22", "remaining_time": "22:45:29", "throughput": 1804.28, "total_tokens": 22773760} +{"current_steps": 2790, "total_steps": 20825, "loss": 1.1007, "learning_rate": 4.9000976893835856e-05, "epoch": 0.1339735894357743, "percentage": 13.4, "elapsed_time": "3:31:07", "remaining_time": "22:44:43", "throughput": 1804.31, "total_tokens": 22855680} +{"current_steps": 2800, "total_steps": 20825, "loss": 0.9984, "learning_rate": 4.898985943753207e-05, "epoch": 0.13445378151260504, "percentage": 13.45, "elapsed_time": "3:31:53", "remaining_time": "22:44:00", "throughput": 1804.26, "total_tokens": 22937600} +{"current_steps": 2810, "total_steps": 20825, "loss": 0.7598, "learning_rate": 4.897868173900854e-05, "epoch": 0.13493397358943576, "percentage": 13.49, "elapsed_time": "3:32:38", "remaining_time": "22:43:13", "throughput": 1804.28, "total_tokens": 23019520} +{"current_steps": 2820, "total_steps": 20825, "loss": 1.0037, "learning_rate": 4.89674438263342e-05, "epoch": 0.13541416566626652, "percentage": 13.54, "elapsed_time": "3:33:23", "remaining_time": "22:42:28", "throughput": 1804.28, "total_tokens": 23101440} +{"current_steps": 2830, "total_steps": 20825, "loss": 0.9097, "learning_rate": 4.8956145727729156e-05, "epoch": 0.13589435774309724, "percentage": 13.59, "elapsed_time": "3:34:08", "remaining_time": "22:41:41", "throughput": 1804.3, "total_tokens": 23183360} +{"current_steps": 2840, "total_steps": 20825, "loss": 0.8392, "learning_rate": 4.8944787471564686e-05, "epoch": 0.13637454981992797, "percentage": 13.64, "elapsed_time": "3:34:54", "remaining_time": "22:40:55", "throughput": 1804.33, "total_tokens": 23265280} +{"current_steps": 2850, "total_steps": 20825, "loss": 0.8909, "learning_rate": 4.89333690863631e-05, "epoch": 0.1368547418967587, "percentage": 13.69, "elapsed_time": "3:35:39", "remaining_time": "22:40:07", "throughput": 1804.38, "total_tokens": 23347200} +{"current_steps": 2860, "total_steps": 20825, "loss": 0.908, "learning_rate": 4.892189060079773e-05, "epoch": 0.13733493397358942, "percentage": 13.73, "elapsed_time": "3:36:24", "remaining_time": "22:39:22", "throughput": 1804.37, "total_tokens": 23429120} +{"current_steps": 2870, "total_steps": 20825, "loss": 0.8255, "learning_rate": 4.8910352043692806e-05, "epoch": 0.13781512605042018, "percentage": 13.78, "elapsed_time": "3:37:10", "remaining_time": "22:38:40", "throughput": 1804.3, "total_tokens": 23511040} +{"current_steps": 2880, "total_steps": 20825, "loss": 0.9484, "learning_rate": 4.889875344402342e-05, "epoch": 0.1382953181272509, "percentage": 13.83, "elapsed_time": "3:37:55", "remaining_time": "22:37:52", "throughput": 1804.35, "total_tokens": 23592960} +{"current_steps": 2890, "total_steps": 20825, "loss": 1.0808, "learning_rate": 4.8887094830915427e-05, "epoch": 0.13877551020408163, "percentage": 13.88, "elapsed_time": "3:38:40", "remaining_time": "22:37:05", "throughput": 1804.38, "total_tokens": 23674880} +{"current_steps": 2900, "total_steps": 20825, "loss": 0.9569, "learning_rate": 4.8875376233645396e-05, "epoch": 0.13925570228091236, "percentage": 13.93, "elapsed_time": "3:39:25", "remaining_time": "22:36:19", "throughput": 1804.42, "total_tokens": 23756800} +{"current_steps": 2910, "total_steps": 20825, "loss": 0.9723, "learning_rate": 4.886359768164054e-05, "epoch": 0.13973589435774308, "percentage": 13.97, "elapsed_time": "3:40:11", "remaining_time": "22:35:32", "throughput": 1804.45, "total_tokens": 23838720} +{"current_steps": 2920, "total_steps": 20825, "loss": 0.9003, "learning_rate": 4.88517592044786e-05, "epoch": 0.14021608643457384, "percentage": 14.02, "elapsed_time": "3:40:56", "remaining_time": "22:34:45", "throughput": 1804.48, "total_tokens": 23920640} +{"current_steps": 2930, "total_steps": 20825, "loss": 1.0471, "learning_rate": 4.8839860831887805e-05, "epoch": 0.14069627851140457, "percentage": 14.07, "elapsed_time": "3:41:41", "remaining_time": "22:34:00", "throughput": 1804.48, "total_tokens": 24002560} +{"current_steps": 2940, "total_steps": 20825, "loss": 0.8685, "learning_rate": 4.882790259374681e-05, "epoch": 0.1411764705882353, "percentage": 14.12, "elapsed_time": "3:42:26", "remaining_time": "22:33:12", "throughput": 1804.52, "total_tokens": 24084480} +{"current_steps": 2950, "total_steps": 20825, "loss": 0.9955, "learning_rate": 4.881588452008456e-05, "epoch": 0.14165666266506602, "percentage": 14.17, "elapsed_time": "3:43:12", "remaining_time": "22:32:26", "throughput": 1804.53, "total_tokens": 24166400} +{"current_steps": 2960, "total_steps": 20825, "loss": 1.0356, "learning_rate": 4.880380664108032e-05, "epoch": 0.14213685474189675, "percentage": 14.21, "elapsed_time": "3:43:57", "remaining_time": "22:31:40", "throughput": 1804.56, "total_tokens": 24248320} +{"current_steps": 2970, "total_steps": 20825, "loss": 0.8951, "learning_rate": 4.879166898706347e-05, "epoch": 0.1426170468187275, "percentage": 14.26, "elapsed_time": "3:44:42", "remaining_time": "22:30:52", "throughput": 1804.61, "total_tokens": 24330240} +{"current_steps": 2980, "total_steps": 20825, "loss": 0.9876, "learning_rate": 4.877947158851352e-05, "epoch": 0.14309723889555823, "percentage": 14.31, "elapsed_time": "3:45:27", "remaining_time": "22:30:06", "throughput": 1804.61, "total_tokens": 24412160} +{"current_steps": 2990, "total_steps": 20825, "loss": 0.8405, "learning_rate": 4.876721447606002e-05, "epoch": 0.14357743097238895, "percentage": 14.36, "elapsed_time": "3:46:12", "remaining_time": "22:29:19", "throughput": 1804.66, "total_tokens": 24494080} +{"current_steps": 3000, "total_steps": 20825, "loss": 1.0846, "learning_rate": 4.875489768048247e-05, "epoch": 0.14405762304921968, "percentage": 14.41, "elapsed_time": "3:46:57", "remaining_time": "22:28:32", "throughput": 1804.7, "total_tokens": 24576000} +{"current_steps": 3010, "total_steps": 20825, "loss": 0.9156, "learning_rate": 4.8742521232710234e-05, "epoch": 0.14453781512605043, "percentage": 14.45, "elapsed_time": "3:47:46", "remaining_time": "22:28:03", "throughput": 1804.32, "total_tokens": 24657920} +{"current_steps": 3020, "total_steps": 20825, "loss": 0.9555, "learning_rate": 4.873008516382245e-05, "epoch": 0.14501800720288116, "percentage": 14.5, "elapsed_time": "3:48:31", "remaining_time": "22:27:18", "throughput": 1804.33, "total_tokens": 24739840} +{"current_steps": 3030, "total_steps": 20825, "loss": 0.9566, "learning_rate": 4.871758950504801e-05, "epoch": 0.1454981992797119, "percentage": 14.55, "elapsed_time": "3:49:16", "remaining_time": "22:26:31", "throughput": 1804.36, "total_tokens": 24821760} +{"current_steps": 3040, "total_steps": 20825, "loss": 0.95, "learning_rate": 4.870503428776544e-05, "epoch": 0.14597839135654261, "percentage": 14.6, "elapsed_time": "3:50:01", "remaining_time": "22:25:45", "throughput": 1804.37, "total_tokens": 24903680} +{"current_steps": 3050, "total_steps": 20825, "loss": 1.0182, "learning_rate": 4.869241954350281e-05, "epoch": 0.14645858343337334, "percentage": 14.65, "elapsed_time": "3:50:46", "remaining_time": "22:24:58", "throughput": 1804.41, "total_tokens": 24985600} +{"current_steps": 3060, "total_steps": 20825, "loss": 0.9629, "learning_rate": 4.867974530393767e-05, "epoch": 0.1469387755102041, "percentage": 14.69, "elapsed_time": "3:51:32", "remaining_time": "22:24:10", "throughput": 1804.45, "total_tokens": 25067520} +{"current_steps": 3070, "total_steps": 20825, "loss": 0.8619, "learning_rate": 4.8667011600896994e-05, "epoch": 0.14741896758703482, "percentage": 14.74, "elapsed_time": "3:52:17", "remaining_time": "22:23:23", "throughput": 1804.49, "total_tokens": 25149440} +{"current_steps": 3080, "total_steps": 20825, "loss": 0.8969, "learning_rate": 4.8654218466357064e-05, "epoch": 0.14789915966386555, "percentage": 14.79, "elapsed_time": "3:53:02", "remaining_time": "22:22:36", "throughput": 1804.53, "total_tokens": 25231360} +{"current_steps": 3090, "total_steps": 20825, "loss": 0.9565, "learning_rate": 4.86413659324434e-05, "epoch": 0.14837935174069627, "percentage": 14.84, "elapsed_time": "3:53:47", "remaining_time": "22:21:49", "throughput": 1804.57, "total_tokens": 25313280} +{"current_steps": 3100, "total_steps": 20825, "loss": 0.8552, "learning_rate": 4.8628454031430694e-05, "epoch": 0.148859543817527, "percentage": 14.89, "elapsed_time": "3:54:32", "remaining_time": "22:21:02", "throughput": 1804.61, "total_tokens": 25395200} +{"current_steps": 3110, "total_steps": 20825, "loss": 1.1013, "learning_rate": 4.8615482795742696e-05, "epoch": 0.14933973589435776, "percentage": 14.93, "elapsed_time": "3:55:17", "remaining_time": "22:20:15", "throughput": 1804.64, "total_tokens": 25477120} +{"current_steps": 3120, "total_steps": 20825, "loss": 1.1029, "learning_rate": 4.860245225795219e-05, "epoch": 0.14981992797118848, "percentage": 14.98, "elapsed_time": "3:56:03", "remaining_time": "22:19:32", "throughput": 1804.59, "total_tokens": 25559040} +{"current_steps": 3130, "total_steps": 20825, "loss": 1.162, "learning_rate": 4.858936245078084e-05, "epoch": 0.1503001200480192, "percentage": 15.03, "elapsed_time": "3:56:48", "remaining_time": "22:18:46", "throughput": 1804.59, "total_tokens": 25640960} +{"current_steps": 3140, "total_steps": 20825, "loss": 1.0493, "learning_rate": 4.857621340709917e-05, "epoch": 0.15078031212484994, "percentage": 15.08, "elapsed_time": "3:57:33", "remaining_time": "22:18:00", "throughput": 1804.61, "total_tokens": 25722880} +{"current_steps": 3150, "total_steps": 20825, "loss": 0.8903, "learning_rate": 4.856300515992646e-05, "epoch": 0.15126050420168066, "percentage": 15.13, "elapsed_time": "3:58:19", "remaining_time": "22:17:16", "throughput": 1804.59, "total_tokens": 25804800} +{"current_steps": 3160, "total_steps": 20825, "loss": 0.9819, "learning_rate": 4.854973774243062e-05, "epoch": 0.15174069627851142, "percentage": 15.17, "elapsed_time": "3:59:04", "remaining_time": "22:16:28", "throughput": 1804.63, "total_tokens": 25886720} +{"current_steps": 3170, "total_steps": 20825, "loss": 0.9732, "learning_rate": 4.8536411187928186e-05, "epoch": 0.15222088835534214, "percentage": 15.22, "elapsed_time": "3:59:49", "remaining_time": "22:15:40", "throughput": 1804.69, "total_tokens": 25968640} +{"current_steps": 3180, "total_steps": 20825, "loss": 0.9799, "learning_rate": 4.852302552988418e-05, "epoch": 0.15270108043217287, "percentage": 15.27, "elapsed_time": "4:00:34", "remaining_time": "22:14:55", "throughput": 1804.69, "total_tokens": 26050560} +{"current_steps": 3190, "total_steps": 20825, "loss": 1.0295, "learning_rate": 4.850958080191205e-05, "epoch": 0.1531812725090036, "percentage": 15.32, "elapsed_time": "4:01:20", "remaining_time": "22:14:09", "throughput": 1804.71, "total_tokens": 26132480} +{"current_steps": 3200, "total_steps": 20825, "loss": 0.942, "learning_rate": 4.849607703777356e-05, "epoch": 0.15366146458583432, "percentage": 15.37, "elapsed_time": "4:02:05", "remaining_time": "22:13:23", "throughput": 1804.72, "total_tokens": 26214400} +{"current_steps": 3210, "total_steps": 20825, "loss": 0.7757, "learning_rate": 4.8482514271378745e-05, "epoch": 0.15414165666266508, "percentage": 15.41, "elapsed_time": "4:02:50", "remaining_time": "22:12:36", "throughput": 1804.75, "total_tokens": 26296320} +{"current_steps": 3220, "total_steps": 20825, "loss": 0.8739, "learning_rate": 4.846889253678578e-05, "epoch": 0.1546218487394958, "percentage": 15.46, "elapsed_time": "4:03:35", "remaining_time": "22:11:51", "throughput": 1804.75, "total_tokens": 26378240} +{"current_steps": 3230, "total_steps": 20825, "loss": 0.931, "learning_rate": 4.845521186820096e-05, "epoch": 0.15510204081632653, "percentage": 15.51, "elapsed_time": "4:04:21", "remaining_time": "22:11:04", "throughput": 1804.78, "total_tokens": 26460160} +{"current_steps": 3240, "total_steps": 20825, "loss": 0.955, "learning_rate": 4.8441472299978504e-05, "epoch": 0.15558223289315726, "percentage": 15.56, "elapsed_time": "4:05:06", "remaining_time": "22:10:18", "throughput": 1804.79, "total_tokens": 26542080} +{"current_steps": 3250, "total_steps": 20825, "loss": 0.9456, "learning_rate": 4.8427673866620615e-05, "epoch": 0.15606242496998798, "percentage": 15.61, "elapsed_time": "4:05:51", "remaining_time": "22:09:32", "throughput": 1804.81, "total_tokens": 26624000} +{"current_steps": 3260, "total_steps": 20825, "loss": 0.8613, "learning_rate": 4.841381660277725e-05, "epoch": 0.15654261704681874, "percentage": 15.65, "elapsed_time": "4:06:37", "remaining_time": "22:08:47", "throughput": 1804.8, "total_tokens": 26705920} +{"current_steps": 3270, "total_steps": 20825, "loss": 0.9297, "learning_rate": 4.839990054324614e-05, "epoch": 0.15702280912364946, "percentage": 15.7, "elapsed_time": "4:07:22", "remaining_time": "22:08:00", "throughput": 1804.84, "total_tokens": 26787840} +{"current_steps": 3280, "total_steps": 20825, "loss": 1.0529, "learning_rate": 4.838592572297265e-05, "epoch": 0.1575030012004802, "percentage": 15.75, "elapsed_time": "4:08:07", "remaining_time": "22:07:13", "throughput": 1804.87, "total_tokens": 26869760} +{"current_steps": 3290, "total_steps": 20825, "loss": 0.9072, "learning_rate": 4.837189217704968e-05, "epoch": 0.15798319327731092, "percentage": 15.8, "elapsed_time": "4:08:52", "remaining_time": "22:06:26", "throughput": 1804.91, "total_tokens": 26951680} +{"current_steps": 3300, "total_steps": 20825, "loss": 0.8515, "learning_rate": 4.835779994071764e-05, "epoch": 0.15846338535414164, "percentage": 15.85, "elapsed_time": "4:09:37", "remaining_time": "22:05:41", "throughput": 1804.9, "total_tokens": 27033600} +{"current_steps": 3310, "total_steps": 20825, "loss": 0.9548, "learning_rate": 4.8343649049364284e-05, "epoch": 0.1589435774309724, "percentage": 15.89, "elapsed_time": "4:10:23", "remaining_time": "22:04:56", "throughput": 1804.89, "total_tokens": 27115520} +{"current_steps": 3320, "total_steps": 20825, "loss": 0.9565, "learning_rate": 4.832943953852468e-05, "epoch": 0.15942376950780313, "percentage": 15.94, "elapsed_time": "4:11:08", "remaining_time": "22:04:10", "throughput": 1804.92, "total_tokens": 27197440} +{"current_steps": 3330, "total_steps": 20825, "loss": 0.8896, "learning_rate": 4.831517144388109e-05, "epoch": 0.15990396158463385, "percentage": 15.99, "elapsed_time": "4:11:53", "remaining_time": "22:03:22", "throughput": 1804.96, "total_tokens": 27279360} +{"current_steps": 3340, "total_steps": 20825, "loss": 0.7648, "learning_rate": 4.830084480126288e-05, "epoch": 0.16038415366146458, "percentage": 16.04, "elapsed_time": "4:12:38", "remaining_time": "22:02:36", "throughput": 1804.99, "total_tokens": 27361280} +{"current_steps": 3350, "total_steps": 20825, "loss": 0.9537, "learning_rate": 4.828645964664647e-05, "epoch": 0.1608643457382953, "percentage": 16.09, "elapsed_time": "4:13:23", "remaining_time": "22:01:50", "throughput": 1805.0, "total_tokens": 27443200} +{"current_steps": 3360, "total_steps": 20825, "loss": 1.0036, "learning_rate": 4.8272016016155166e-05, "epoch": 0.16134453781512606, "percentage": 16.13, "elapsed_time": "4:14:09", "remaining_time": "22:01:05", "throughput": 1804.99, "total_tokens": 27525120} +{"current_steps": 3370, "total_steps": 20825, "loss": 1.1458, "learning_rate": 4.825751394605916e-05, "epoch": 0.1618247298919568, "percentage": 16.18, "elapsed_time": "4:14:54", "remaining_time": "22:00:17", "throughput": 1805.05, "total_tokens": 27607040} +{"current_steps": 3380, "total_steps": 20825, "loss": 0.8404, "learning_rate": 4.824295347277537e-05, "epoch": 0.1623049219687875, "percentage": 16.23, "elapsed_time": "4:15:39", "remaining_time": "21:59:31", "throughput": 1805.06, "total_tokens": 27688960} +{"current_steps": 3390, "total_steps": 20825, "loss": 1.1109, "learning_rate": 4.8228334632867375e-05, "epoch": 0.16278511404561824, "percentage": 16.28, "elapsed_time": "4:16:25", "remaining_time": "21:58:47", "throughput": 1805.02, "total_tokens": 27770880} +{"current_steps": 3400, "total_steps": 20825, "loss": 1.0581, "learning_rate": 4.8213657463045344e-05, "epoch": 0.16326530612244897, "percentage": 16.33, "elapsed_time": "4:17:10", "remaining_time": "21:58:00", "throughput": 1805.07, "total_tokens": 27852800} +{"current_steps": 3410, "total_steps": 20825, "loss": 1.0135, "learning_rate": 4.819892200016588e-05, "epoch": 0.16374549819927972, "percentage": 16.37, "elapsed_time": "4:17:55", "remaining_time": "21:57:12", "throughput": 1805.13, "total_tokens": 27934720} +{"current_steps": 3420, "total_steps": 20825, "loss": 0.8944, "learning_rate": 4.818412828123201e-05, "epoch": 0.16422569027611045, "percentage": 16.42, "elapsed_time": "4:18:40", "remaining_time": "21:56:25", "throughput": 1805.16, "total_tokens": 28016640} +{"current_steps": 3430, "total_steps": 20825, "loss": 0.8662, "learning_rate": 4.816927634339302e-05, "epoch": 0.16470588235294117, "percentage": 16.47, "elapsed_time": "4:19:25", "remaining_time": "21:55:39", "throughput": 1805.17, "total_tokens": 28098560} +{"current_steps": 3440, "total_steps": 20825, "loss": 0.7626, "learning_rate": 4.815436622394441e-05, "epoch": 0.1651860744297719, "percentage": 16.52, "elapsed_time": "4:20:10", "remaining_time": "21:54:52", "throughput": 1805.21, "total_tokens": 28180480} +{"current_steps": 3450, "total_steps": 20825, "loss": 1.0245, "learning_rate": 4.813939796032779e-05, "epoch": 0.16566626650660263, "percentage": 16.57, "elapsed_time": "4:20:55", "remaining_time": "21:54:07", "throughput": 1805.22, "total_tokens": 28262400} +{"current_steps": 3460, "total_steps": 20825, "loss": 0.9836, "learning_rate": 4.812437159013076e-05, "epoch": 0.16614645858343338, "percentage": 16.61, "elapsed_time": "4:21:41", "remaining_time": "21:53:21", "throughput": 1805.23, "total_tokens": 28344320} +{"current_steps": 3470, "total_steps": 20825, "loss": 0.8955, "learning_rate": 4.810928715108683e-05, "epoch": 0.1666266506602641, "percentage": 16.66, "elapsed_time": "4:22:26", "remaining_time": "21:52:34", "throughput": 1805.25, "total_tokens": 28426240} +{"current_steps": 3480, "total_steps": 20825, "loss": 0.8607, "learning_rate": 4.809414468107536e-05, "epoch": 0.16710684273709484, "percentage": 16.71, "elapsed_time": "4:23:11", "remaining_time": "21:51:48", "throughput": 1805.28, "total_tokens": 28508160} +{"current_steps": 3490, "total_steps": 20825, "loss": 0.7663, "learning_rate": 4.8078944218121404e-05, "epoch": 0.16758703481392556, "percentage": 16.76, "elapsed_time": "4:23:56", "remaining_time": "21:51:01", "throughput": 1805.31, "total_tokens": 28590080} +{"current_steps": 3500, "total_steps": 20825, "loss": 1.1082, "learning_rate": 4.806368580039566e-05, "epoch": 0.16806722689075632, "percentage": 16.81, "elapsed_time": "4:24:41", "remaining_time": "21:50:15", "throughput": 1805.33, "total_tokens": 28672000} +{"current_steps": 3510, "total_steps": 20825, "loss": 0.7908, "learning_rate": 4.804836946621437e-05, "epoch": 0.16854741896758704, "percentage": 16.85, "elapsed_time": "4:25:27", "remaining_time": "21:49:29", "throughput": 1805.35, "total_tokens": 28753920} +{"current_steps": 3520, "total_steps": 20825, "loss": 0.9984, "learning_rate": 4.803299525403919e-05, "epoch": 0.16902761104441777, "percentage": 16.9, "elapsed_time": "4:26:12", "remaining_time": "21:48:44", "throughput": 1805.33, "total_tokens": 28835840} +{"current_steps": 3530, "total_steps": 20825, "loss": 1.1216, "learning_rate": 4.801756320247713e-05, "epoch": 0.1695078031212485, "percentage": 16.95, "elapsed_time": "4:26:57", "remaining_time": "21:47:57", "throughput": 1805.36, "total_tokens": 28917760} +{"current_steps": 3540, "total_steps": 20825, "loss": 0.9355, "learning_rate": 4.800207335028044e-05, "epoch": 0.16998799519807922, "percentage": 17.0, "elapsed_time": "4:27:43", "remaining_time": "21:47:12", "throughput": 1805.37, "total_tokens": 28999680} +{"current_steps": 3550, "total_steps": 20825, "loss": 0.8603, "learning_rate": 4.798652573634651e-05, "epoch": 0.17046818727490998, "percentage": 17.05, "elapsed_time": "4:28:28", "remaining_time": "21:46:25", "throughput": 1805.4, "total_tokens": 29081600} +{"current_steps": 3560, "total_steps": 20825, "loss": 0.6316, "learning_rate": 4.797092039971779e-05, "epoch": 0.1709483793517407, "percentage": 17.09, "elapsed_time": "4:29:13", "remaining_time": "21:45:38", "throughput": 1805.42, "total_tokens": 29163520} +{"current_steps": 3570, "total_steps": 20825, "loss": 0.8794, "learning_rate": 4.7955257379581675e-05, "epoch": 0.17142857142857143, "percentage": 17.14, "elapsed_time": "4:29:58", "remaining_time": "21:44:51", "throughput": 1805.46, "total_tokens": 29245440} +{"current_steps": 3580, "total_steps": 20825, "loss": 1.2806, "learning_rate": 4.7939536715270415e-05, "epoch": 0.17190876350540216, "percentage": 17.19, "elapsed_time": "4:30:43", "remaining_time": "21:44:07", "throughput": 1805.44, "total_tokens": 29327360} +{"current_steps": 3590, "total_steps": 20825, "loss": 0.7021, "learning_rate": 4.792375844626101e-05, "epoch": 0.17238895558223288, "percentage": 17.24, "elapsed_time": "4:31:29", "remaining_time": "21:43:23", "throughput": 1805.41, "total_tokens": 29409280} +{"current_steps": 3600, "total_steps": 20825, "loss": 0.9755, "learning_rate": 4.790792261217512e-05, "epoch": 0.17286914765906364, "percentage": 17.29, "elapsed_time": "4:32:14", "remaining_time": "21:42:37", "throughput": 1805.42, "total_tokens": 29491200} +{"current_steps": 3610, "total_steps": 20825, "loss": 0.929, "learning_rate": 4.789202925277895e-05, "epoch": 0.17334933973589436, "percentage": 17.33, "elapsed_time": "4:32:59", "remaining_time": "21:41:50", "throughput": 1805.46, "total_tokens": 29573120} +{"current_steps": 3620, "total_steps": 20825, "loss": 0.8966, "learning_rate": 4.787607840798317e-05, "epoch": 0.1738295318127251, "percentage": 17.38, "elapsed_time": "4:33:45", "remaining_time": "21:41:04", "throughput": 1805.48, "total_tokens": 29655040} +{"current_steps": 3630, "total_steps": 20825, "loss": 0.9054, "learning_rate": 4.786007011784279e-05, "epoch": 0.17430972388955582, "percentage": 17.43, "elapsed_time": "4:34:30", "remaining_time": "21:40:18", "throughput": 1805.48, "total_tokens": 29736960} +{"current_steps": 3640, "total_steps": 20825, "loss": 0.881, "learning_rate": 4.78440044225571e-05, "epoch": 0.17478991596638654, "percentage": 17.48, "elapsed_time": "4:35:15", "remaining_time": "21:39:32", "throughput": 1805.5, "total_tokens": 29818880} +{"current_steps": 3650, "total_steps": 20825, "loss": 0.7921, "learning_rate": 4.7827881362469506e-05, "epoch": 0.1752701080432173, "percentage": 17.53, "elapsed_time": "4:36:00", "remaining_time": "21:38:47", "throughput": 1805.5, "total_tokens": 29900800} +{"current_steps": 3660, "total_steps": 20825, "loss": 0.956, "learning_rate": 4.781170097806751e-05, "epoch": 0.17575030012004803, "percentage": 17.58, "elapsed_time": "4:36:45", "remaining_time": "21:38:00", "throughput": 1805.54, "total_tokens": 29982720} +{"current_steps": 3670, "total_steps": 20825, "loss": 0.9339, "learning_rate": 4.779546330998253e-05, "epoch": 0.17623049219687875, "percentage": 17.62, "elapsed_time": "4:37:31", "remaining_time": "21:37:13", "throughput": 1805.56, "total_tokens": 30064640} +{"current_steps": 3680, "total_steps": 20825, "loss": 1.2112, "learning_rate": 4.7779168398989826e-05, "epoch": 0.17671068427370948, "percentage": 17.67, "elapsed_time": "4:38:16", "remaining_time": "21:36:28", "throughput": 1805.56, "total_tokens": 30146560} +{"current_steps": 3690, "total_steps": 20825, "loss": 0.9783, "learning_rate": 4.7762816286008454e-05, "epoch": 0.1771908763505402, "percentage": 17.72, "elapsed_time": "4:39:01", "remaining_time": "21:35:42", "throughput": 1805.58, "total_tokens": 30228480} +{"current_steps": 3700, "total_steps": 20825, "loss": 1.1071, "learning_rate": 4.774640701210106e-05, "epoch": 0.17767106842737096, "percentage": 17.77, "elapsed_time": "4:39:47", "remaining_time": "21:34:57", "throughput": 1805.56, "total_tokens": 30310400} +{"current_steps": 3710, "total_steps": 20825, "loss": 1.0155, "learning_rate": 4.7729940618473854e-05, "epoch": 0.1781512605042017, "percentage": 17.82, "elapsed_time": "4:40:32", "remaining_time": "21:34:11", "throughput": 1805.58, "total_tokens": 30392320} +{"current_steps": 3720, "total_steps": 20825, "loss": 0.9545, "learning_rate": 4.771341714647648e-05, "epoch": 0.1786314525810324, "percentage": 17.86, "elapsed_time": "4:41:17", "remaining_time": "21:33:25", "throughput": 1805.59, "total_tokens": 30474240} +{"current_steps": 3730, "total_steps": 20825, "loss": 0.8737, "learning_rate": 4.76968366376019e-05, "epoch": 0.17911164465786314, "percentage": 17.91, "elapsed_time": "4:42:03", "remaining_time": "21:32:41", "throughput": 1805.55, "total_tokens": 30556160} +{"current_steps": 3740, "total_steps": 20825, "loss": 0.9804, "learning_rate": 4.768019913348634e-05, "epoch": 0.17959183673469387, "percentage": 17.96, "elapsed_time": "4:42:48", "remaining_time": "21:31:56", "throughput": 1805.56, "total_tokens": 30638080} +{"current_steps": 3750, "total_steps": 20825, "loss": 0.8976, "learning_rate": 4.766350467590911e-05, "epoch": 0.18007202881152462, "percentage": 18.01, "elapsed_time": "4:43:33", "remaining_time": "21:31:10", "throughput": 1805.58, "total_tokens": 30720000} +{"current_steps": 3760, "total_steps": 20825, "loss": 0.9886, "learning_rate": 4.764675330679256e-05, "epoch": 0.18055222088835535, "percentage": 18.06, "elapsed_time": "4:44:19", "remaining_time": "21:30:23", "throughput": 1805.6, "total_tokens": 30801920} +{"current_steps": 3770, "total_steps": 20825, "loss": 0.9472, "learning_rate": 4.7629945068201954e-05, "epoch": 0.18103241296518607, "percentage": 18.1, "elapsed_time": "4:45:04", "remaining_time": "21:29:37", "throughput": 1805.62, "total_tokens": 30883840} +{"current_steps": 3780, "total_steps": 20825, "loss": 0.8187, "learning_rate": 4.7613080002345345e-05, "epoch": 0.1815126050420168, "percentage": 18.15, "elapsed_time": "4:45:49", "remaining_time": "21:28:52", "throughput": 1805.63, "total_tokens": 30965760} +{"current_steps": 3790, "total_steps": 20825, "loss": 1.0672, "learning_rate": 4.759615815157352e-05, "epoch": 0.18199279711884753, "percentage": 18.2, "elapsed_time": "4:46:35", "remaining_time": "21:28:09", "throughput": 1805.56, "total_tokens": 31047680} +{"current_steps": 3800, "total_steps": 20825, "loss": 0.854, "learning_rate": 4.7579179558379836e-05, "epoch": 0.18247298919567828, "percentage": 18.25, "elapsed_time": "4:47:20", "remaining_time": "21:27:23", "throughput": 1805.57, "total_tokens": 31129600} +{"current_steps": 3810, "total_steps": 20825, "loss": 0.759, "learning_rate": 4.7562144265400146e-05, "epoch": 0.182953181272509, "percentage": 18.3, "elapsed_time": "4:48:05", "remaining_time": "21:26:36", "throughput": 1805.6, "total_tokens": 31211520} +{"current_steps": 3820, "total_steps": 20825, "loss": 1.0452, "learning_rate": 4.754505231541268e-05, "epoch": 0.18343337334933973, "percentage": 18.34, "elapsed_time": "4:48:51", "remaining_time": "21:25:51", "throughput": 1805.6, "total_tokens": 31293440} +{"current_steps": 3830, "total_steps": 20825, "loss": 0.8398, "learning_rate": 4.752790375133797e-05, "epoch": 0.18391356542617046, "percentage": 18.39, "elapsed_time": "4:49:36", "remaining_time": "21:25:04", "throughput": 1805.63, "total_tokens": 31375360} +{"current_steps": 3840, "total_steps": 20825, "loss": 0.9282, "learning_rate": 4.751069861623867e-05, "epoch": 0.1843937575030012, "percentage": 18.44, "elapsed_time": "4:50:21", "remaining_time": "21:24:20", "throughput": 1805.61, "total_tokens": 31457280} +{"current_steps": 3850, "total_steps": 20825, "loss": 1.0174, "learning_rate": 4.749343695331952e-05, "epoch": 0.18487394957983194, "percentage": 18.49, "elapsed_time": "4:51:07", "remaining_time": "21:23:35", "throughput": 1805.61, "total_tokens": 31539200} +{"current_steps": 3860, "total_steps": 20825, "loss": 0.8329, "learning_rate": 4.747611880592721e-05, "epoch": 0.18535414165666267, "percentage": 18.54, "elapsed_time": "4:51:52", "remaining_time": "21:22:48", "throughput": 1805.64, "total_tokens": 31621120} +{"current_steps": 3870, "total_steps": 20825, "loss": 1.0112, "learning_rate": 4.745874421755027e-05, "epoch": 0.1858343337334934, "percentage": 18.58, "elapsed_time": "4:52:37", "remaining_time": "21:22:01", "throughput": 1805.67, "total_tokens": 31703040} +{"current_steps": 3880, "total_steps": 20825, "loss": 0.8418, "learning_rate": 4.744131323181895e-05, "epoch": 0.18631452581032412, "percentage": 18.63, "elapsed_time": "4:53:22", "remaining_time": "21:21:16", "throughput": 1805.68, "total_tokens": 31784960} +{"current_steps": 3890, "total_steps": 20825, "loss": 0.9913, "learning_rate": 4.742382589250514e-05, "epoch": 0.18679471788715485, "percentage": 18.68, "elapsed_time": "4:54:08", "remaining_time": "21:20:30", "throughput": 1805.68, "total_tokens": 31866880} +{"current_steps": 3900, "total_steps": 20825, "loss": 1.0409, "learning_rate": 4.740628224352222e-05, "epoch": 0.1872749099639856, "percentage": 18.73, "elapsed_time": "4:54:53", "remaining_time": "21:19:44", "throughput": 1805.7, "total_tokens": 31948800} +{"current_steps": 3910, "total_steps": 20825, "loss": 0.9342, "learning_rate": 4.7388682328925e-05, "epoch": 0.18775510204081633, "percentage": 18.78, "elapsed_time": "4:55:38", "remaining_time": "21:19:00", "throughput": 1805.67, "total_tokens": 32030720} +{"current_steps": 3920, "total_steps": 20825, "loss": 0.9206, "learning_rate": 4.737102619290956e-05, "epoch": 0.18823529411764706, "percentage": 18.82, "elapsed_time": "4:56:23", "remaining_time": "21:18:13", "throughput": 1805.71, "total_tokens": 32112640} +{"current_steps": 3930, "total_steps": 20825, "loss": 0.9706, "learning_rate": 4.7353313879813165e-05, "epoch": 0.18871548619447778, "percentage": 18.87, "elapsed_time": "4:57:08", "remaining_time": "21:17:26", "throughput": 1805.75, "total_tokens": 32194560} +{"current_steps": 3940, "total_steps": 20825, "loss": 1.0686, "learning_rate": 4.733554543411417e-05, "epoch": 0.18919567827130854, "percentage": 18.92, "elapsed_time": "4:57:54", "remaining_time": "21:16:41", "throughput": 1805.74, "total_tokens": 32276480} +{"current_steps": 3950, "total_steps": 20825, "loss": 0.9365, "learning_rate": 4.731772090043184e-05, "epoch": 0.18967587034813926, "percentage": 18.97, "elapsed_time": "4:58:39", "remaining_time": "21:15:54", "throughput": 1805.76, "total_tokens": 32358400} +{"current_steps": 3960, "total_steps": 20825, "loss": 0.8931, "learning_rate": 4.729984032352635e-05, "epoch": 0.19015606242497, "percentage": 19.02, "elapsed_time": "4:59:24", "remaining_time": "21:15:09", "throughput": 1805.77, "total_tokens": 32440320} +{"current_steps": 3970, "total_steps": 20825, "loss": 0.9301, "learning_rate": 4.728190374829854e-05, "epoch": 0.19063625450180072, "percentage": 19.06, "elapsed_time": "5:00:09", "remaining_time": "21:14:22", "throughput": 1805.79, "total_tokens": 32522240} +{"current_steps": 3980, "total_steps": 20825, "loss": 0.9234, "learning_rate": 4.726391121978992e-05, "epoch": 0.19111644657863144, "percentage": 19.11, "elapsed_time": "5:00:55", "remaining_time": "21:13:39", "throughput": 1805.74, "total_tokens": 32604160} +{"current_steps": 3990, "total_steps": 20825, "loss": 0.9042, "learning_rate": 4.7245862783182496e-05, "epoch": 0.1915966386554622, "percentage": 19.16, "elapsed_time": "5:01:40", "remaining_time": "21:12:53", "throughput": 1805.76, "total_tokens": 32686080} +{"current_steps": 4000, "total_steps": 20825, "loss": 1.0318, "learning_rate": 4.722775848379866e-05, "epoch": 0.19207683073229292, "percentage": 19.21, "elapsed_time": "5:02:26", "remaining_time": "21:12:06", "throughput": 1805.79, "total_tokens": 32768000} +{"current_steps": 4010, "total_steps": 20825, "loss": 0.8199, "learning_rate": 4.720959836710107e-05, "epoch": 0.19255702280912365, "percentage": 19.26, "elapsed_time": "5:03:14", "remaining_time": "21:11:34", "throughput": 1805.49, "total_tokens": 32849920} +{"current_steps": 4020, "total_steps": 20825, "loss": 0.9483, "learning_rate": 4.7191382478692594e-05, "epoch": 0.19303721488595438, "percentage": 19.3, "elapsed_time": "5:04:00", "remaining_time": "21:10:49", "throughput": 1805.47, "total_tokens": 32931840} +{"current_steps": 4030, "total_steps": 20825, "loss": 0.8141, "learning_rate": 4.7173110864316104e-05, "epoch": 0.1935174069627851, "percentage": 19.35, "elapsed_time": "5:04:45", "remaining_time": "21:10:03", "throughput": 1805.49, "total_tokens": 33013760} +{"current_steps": 4040, "total_steps": 20825, "loss": 0.8107, "learning_rate": 4.7154783569854444e-05, "epoch": 0.19399759903961586, "percentage": 19.4, "elapsed_time": "5:05:31", "remaining_time": "21:09:19", "throughput": 1805.45, "total_tokens": 33095680} +{"current_steps": 4050, "total_steps": 20825, "loss": 0.9762, "learning_rate": 4.713640064133025e-05, "epoch": 0.19447779111644659, "percentage": 19.45, "elapsed_time": "5:06:16", "remaining_time": "21:08:35", "throughput": 1805.41, "total_tokens": 33177600} +{"current_steps": 4060, "total_steps": 20825, "loss": 0.8789, "learning_rate": 4.7117962124905885e-05, "epoch": 0.1949579831932773, "percentage": 19.5, "elapsed_time": "5:07:01", "remaining_time": "21:07:49", "throughput": 1805.43, "total_tokens": 33259520} +{"current_steps": 4070, "total_steps": 20825, "loss": 0.9835, "learning_rate": 4.709946806688329e-05, "epoch": 0.19543817527010804, "percentage": 19.54, "elapsed_time": "5:07:47", "remaining_time": "21:07:03", "throughput": 1805.45, "total_tokens": 33341440} +{"current_steps": 4080, "total_steps": 20825, "loss": 0.8732, "learning_rate": 4.708091851370389e-05, "epoch": 0.19591836734693877, "percentage": 19.59, "elapsed_time": "5:08:32", "remaining_time": "21:06:18", "throughput": 1805.44, "total_tokens": 33423360} +{"current_steps": 4090, "total_steps": 20825, "loss": 0.9604, "learning_rate": 4.706231351194845e-05, "epoch": 0.19639855942376952, "percentage": 19.64, "elapsed_time": "5:09:17", "remaining_time": "21:05:32", "throughput": 1805.46, "total_tokens": 33505280} +{"current_steps": 4100, "total_steps": 20825, "loss": 0.8032, "learning_rate": 4.7043653108336994e-05, "epoch": 0.19687875150060025, "percentage": 19.69, "elapsed_time": "5:10:02", "remaining_time": "21:04:46", "throughput": 1805.48, "total_tokens": 33587200} +{"current_steps": 4110, "total_steps": 20825, "loss": 0.9989, "learning_rate": 4.702493734972866e-05, "epoch": 0.19735894357743097, "percentage": 19.74, "elapsed_time": "5:10:48", "remaining_time": "21:04:01", "throughput": 1805.48, "total_tokens": 33669120} +{"current_steps": 4120, "total_steps": 20825, "loss": 1.0064, "learning_rate": 4.700616628312158e-05, "epoch": 0.1978391356542617, "percentage": 19.78, "elapsed_time": "5:11:33", "remaining_time": "21:03:15", "throughput": 1805.48, "total_tokens": 33751040} +{"current_steps": 4130, "total_steps": 20825, "loss": 0.8425, "learning_rate": 4.69873399556528e-05, "epoch": 0.19831932773109243, "percentage": 19.83, "elapsed_time": "5:12:19", "remaining_time": "21:02:30", "throughput": 1805.48, "total_tokens": 33832960} +{"current_steps": 4140, "total_steps": 20825, "loss": 1.0941, "learning_rate": 4.696845841459811e-05, "epoch": 0.19879951980792318, "percentage": 19.88, "elapsed_time": "5:13:04", "remaining_time": "21:01:44", "throughput": 1805.48, "total_tokens": 33914880} +{"current_steps": 4150, "total_steps": 20825, "loss": 0.8666, "learning_rate": 4.6949521707371965e-05, "epoch": 0.1992797118847539, "percentage": 19.93, "elapsed_time": "5:13:49", "remaining_time": "21:00:58", "throughput": 1805.49, "total_tokens": 33996800} +{"current_steps": 4160, "total_steps": 20825, "loss": 0.8477, "learning_rate": 4.693052988152733e-05, "epoch": 0.19975990396158463, "percentage": 19.98, "elapsed_time": "5:14:34", "remaining_time": "21:00:12", "throughput": 1805.53, "total_tokens": 34078720} +{"current_steps": 4170, "total_steps": 20825, "loss": 1.0889, "learning_rate": 4.691148298475561e-05, "epoch": 0.20024009603841536, "percentage": 20.02, "elapsed_time": "5:15:20", "remaining_time": "20:59:27", "throughput": 1805.51, "total_tokens": 34160640} +{"current_steps": 4180, "total_steps": 20825, "loss": 0.9039, "learning_rate": 4.689238106488647e-05, "epoch": 0.2007202881152461, "percentage": 20.07, "elapsed_time": "5:16:05", "remaining_time": "20:58:41", "throughput": 1805.53, "total_tokens": 34242560} +{"current_steps": 4190, "total_steps": 20825, "loss": 0.8954, "learning_rate": 4.687322416988779e-05, "epoch": 0.20120048019207684, "percentage": 20.12, "elapsed_time": "5:16:50", "remaining_time": "20:57:54", "throughput": 1805.56, "total_tokens": 34324480} +{"current_steps": 4200, "total_steps": 20825, "loss": 0.92, "learning_rate": 4.685401234786544e-05, "epoch": 0.20168067226890757, "percentage": 20.17, "elapsed_time": "5:17:35", "remaining_time": "20:57:07", "throughput": 1805.59, "total_tokens": 34406400} +{"current_steps": 4210, "total_steps": 20825, "loss": 0.9093, "learning_rate": 4.683474564706327e-05, "epoch": 0.2021608643457383, "percentage": 20.22, "elapsed_time": "5:18:20", "remaining_time": "20:56:20", "throughput": 1805.64, "total_tokens": 34488320} +{"current_steps": 4220, "total_steps": 20825, "loss": 0.8968, "learning_rate": 4.681542411586294e-05, "epoch": 0.20264105642256902, "percentage": 20.26, "elapsed_time": "5:19:05", "remaining_time": "20:55:34", "throughput": 1805.64, "total_tokens": 34570240} +{"current_steps": 4230, "total_steps": 20825, "loss": 1.0459, "learning_rate": 4.6796047802783755e-05, "epoch": 0.20312124849939975, "percentage": 20.31, "elapsed_time": "5:19:50", "remaining_time": "20:54:48", "throughput": 1805.66, "total_tokens": 34652160} +{"current_steps": 4240, "total_steps": 20825, "loss": 0.8744, "learning_rate": 4.6776616756482624e-05, "epoch": 0.2036014405762305, "percentage": 20.36, "elapsed_time": "5:20:36", "remaining_time": "20:54:04", "throughput": 1805.65, "total_tokens": 34734080} +{"current_steps": 4250, "total_steps": 20825, "loss": 0.8492, "learning_rate": 4.6757131025753886e-05, "epoch": 0.20408163265306123, "percentage": 20.41, "elapsed_time": "5:21:21", "remaining_time": "20:53:17", "throughput": 1805.67, "total_tokens": 34816000} +{"current_steps": 4260, "total_steps": 20825, "loss": 1.1252, "learning_rate": 4.67375906595292e-05, "epoch": 0.20456182472989196, "percentage": 20.46, "elapsed_time": "5:22:06", "remaining_time": "20:52:31", "throughput": 1805.69, "total_tokens": 34897920} +{"current_steps": 4270, "total_steps": 20825, "loss": 1.1081, "learning_rate": 4.671799570687743e-05, "epoch": 0.20504201680672268, "percentage": 20.5, "elapsed_time": "5:22:51", "remaining_time": "20:51:45", "throughput": 1805.7, "total_tokens": 34979840} +{"current_steps": 4280, "total_steps": 20825, "loss": 0.917, "learning_rate": 4.6698346217004494e-05, "epoch": 0.2055222088835534, "percentage": 20.55, "elapsed_time": "5:23:37", "remaining_time": "20:50:59", "throughput": 1805.72, "total_tokens": 35061760} +{"current_steps": 4290, "total_steps": 20825, "loss": 1.1476, "learning_rate": 4.66786422392533e-05, "epoch": 0.20600240096038416, "percentage": 20.6, "elapsed_time": "5:24:22", "remaining_time": "20:50:13", "throughput": 1805.73, "total_tokens": 35143680} +{"current_steps": 4300, "total_steps": 20825, "loss": 0.9777, "learning_rate": 4.665888382310356e-05, "epoch": 0.2064825930372149, "percentage": 20.65, "elapsed_time": "5:25:07", "remaining_time": "20:49:28", "throughput": 1805.73, "total_tokens": 35225600} +{"current_steps": 4310, "total_steps": 20825, "loss": 0.9304, "learning_rate": 4.663907101817167e-05, "epoch": 0.20696278511404562, "percentage": 20.7, "elapsed_time": "5:25:52", "remaining_time": "20:48:42", "throughput": 1805.74, "total_tokens": 35307520} +{"current_steps": 4320, "total_steps": 20825, "loss": 1.0128, "learning_rate": 4.661920387421064e-05, "epoch": 0.20744297719087634, "percentage": 20.74, "elapsed_time": "5:26:37", "remaining_time": "20:47:56", "throughput": 1805.77, "total_tokens": 35389440} +{"current_steps": 4330, "total_steps": 20825, "loss": 0.904, "learning_rate": 4.65992824411099e-05, "epoch": 0.20792316926770707, "percentage": 20.79, "elapsed_time": "5:27:23", "remaining_time": "20:47:10", "throughput": 1805.78, "total_tokens": 35471360} +{"current_steps": 4340, "total_steps": 20825, "loss": 1.1092, "learning_rate": 4.657930676889526e-05, "epoch": 0.20840336134453782, "percentage": 20.84, "elapsed_time": "5:28:08", "remaining_time": "20:46:24", "throughput": 1805.8, "total_tokens": 35553280} +{"current_steps": 4350, "total_steps": 20825, "loss": 0.7555, "learning_rate": 4.655927690772868e-05, "epoch": 0.20888355342136855, "percentage": 20.89, "elapsed_time": "5:28:53", "remaining_time": "20:45:38", "throughput": 1805.82, "total_tokens": 35635200} +{"current_steps": 4360, "total_steps": 20825, "loss": 0.7976, "learning_rate": 4.6539192907908204e-05, "epoch": 0.20936374549819928, "percentage": 20.94, "elapsed_time": "5:29:38", "remaining_time": "20:44:52", "throughput": 1805.82, "total_tokens": 35717120} +{"current_steps": 4370, "total_steps": 20825, "loss": 1.0636, "learning_rate": 4.6519054819867856e-05, "epoch": 0.20984393757503, "percentage": 20.98, "elapsed_time": "5:30:24", "remaining_time": "20:44:07", "throughput": 1805.82, "total_tokens": 35799040} +{"current_steps": 4380, "total_steps": 20825, "loss": 0.9967, "learning_rate": 4.649886269417746e-05, "epoch": 0.21032412965186073, "percentage": 21.03, "elapsed_time": "5:31:09", "remaining_time": "20:43:20", "throughput": 1805.84, "total_tokens": 35880960} +{"current_steps": 4390, "total_steps": 20825, "loss": 0.8918, "learning_rate": 4.647861658154254e-05, "epoch": 0.21080432172869148, "percentage": 21.08, "elapsed_time": "5:31:54", "remaining_time": "20:42:35", "throughput": 1805.83, "total_tokens": 35962880} +{"current_steps": 4400, "total_steps": 20825, "loss": 1.0406, "learning_rate": 4.6458316532804214e-05, "epoch": 0.2112845138055222, "percentage": 21.13, "elapsed_time": "5:32:40", "remaining_time": "20:41:49", "throughput": 1805.85, "total_tokens": 36044800} +{"current_steps": 4410, "total_steps": 20825, "loss": 0.9447, "learning_rate": 4.643796259893899e-05, "epoch": 0.21176470588235294, "percentage": 21.18, "elapsed_time": "5:33:25", "remaining_time": "20:41:03", "throughput": 1805.87, "total_tokens": 36126720} +{"current_steps": 4420, "total_steps": 20825, "loss": 0.9381, "learning_rate": 4.641755483105874e-05, "epoch": 0.21224489795918366, "percentage": 21.22, "elapsed_time": "5:34:10", "remaining_time": "20:40:18", "throughput": 1805.86, "total_tokens": 36208640} +{"current_steps": 4430, "total_steps": 20825, "loss": 0.8216, "learning_rate": 4.63970932804105e-05, "epoch": 0.21272509003601442, "percentage": 21.27, "elapsed_time": "5:34:56", "remaining_time": "20:39:34", "throughput": 1805.83, "total_tokens": 36290560} +{"current_steps": 4440, "total_steps": 20825, "loss": 0.9, "learning_rate": 4.637657799837635e-05, "epoch": 0.21320528211284515, "percentage": 21.32, "elapsed_time": "5:35:41", "remaining_time": "20:38:48", "throughput": 1805.84, "total_tokens": 36372480} +{"current_steps": 4450, "total_steps": 20825, "loss": 0.8199, "learning_rate": 4.635600903647333e-05, "epoch": 0.21368547418967587, "percentage": 21.37, "elapsed_time": "5:36:27", "remaining_time": "20:38:03", "throughput": 1805.83, "total_tokens": 36454400} +{"current_steps": 4460, "total_steps": 20825, "loss": 0.8799, "learning_rate": 4.633538644635326e-05, "epoch": 0.2141656662665066, "percentage": 21.42, "elapsed_time": "5:37:12", "remaining_time": "20:37:18", "throughput": 1805.83, "total_tokens": 36536320} +{"current_steps": 4470, "total_steps": 20825, "loss": 0.9863, "learning_rate": 4.631471027980262e-05, "epoch": 0.21464585834333733, "percentage": 21.46, "elapsed_time": "5:37:57", "remaining_time": "20:36:32", "throughput": 1805.85, "total_tokens": 36618240} +{"current_steps": 4480, "total_steps": 20825, "loss": 0.8663, "learning_rate": 4.629398058874245e-05, "epoch": 0.21512605042016808, "percentage": 21.51, "elapsed_time": "5:38:42", "remaining_time": "20:35:46", "throughput": 1805.86, "total_tokens": 36700160} +{"current_steps": 4490, "total_steps": 20825, "loss": 0.9576, "learning_rate": 4.6273197425228166e-05, "epoch": 0.2156062424969988, "percentage": 21.56, "elapsed_time": "5:39:28", "remaining_time": "20:35:01", "throughput": 1805.86, "total_tokens": 36782080} +{"current_steps": 4500, "total_steps": 20825, "loss": 0.9573, "learning_rate": 4.62523608414495e-05, "epoch": 0.21608643457382953, "percentage": 21.61, "elapsed_time": "5:40:13", "remaining_time": "20:34:15", "throughput": 1805.88, "total_tokens": 36864000} +{"current_steps": 4510, "total_steps": 20825, "loss": 0.795, "learning_rate": 4.623147088973031e-05, "epoch": 0.21656662665066026, "percentage": 21.66, "elapsed_time": "5:40:58", "remaining_time": "20:33:28", "throughput": 1805.91, "total_tokens": 36945920} +{"current_steps": 4520, "total_steps": 20825, "loss": 1.1473, "learning_rate": 4.6210527622528465e-05, "epoch": 0.217046818727491, "percentage": 21.7, "elapsed_time": "5:41:43", "remaining_time": "20:32:42", "throughput": 1805.92, "total_tokens": 37027840} +{"current_steps": 4530, "total_steps": 20825, "loss": 0.8676, "learning_rate": 4.618953109243573e-05, "epoch": 0.21752701080432174, "percentage": 21.75, "elapsed_time": "5:42:28", "remaining_time": "20:31:56", "throughput": 1805.94, "total_tokens": 37109760} +{"current_steps": 4540, "total_steps": 20825, "loss": 0.9233, "learning_rate": 4.616848135217761e-05, "epoch": 0.21800720288115247, "percentage": 21.8, "elapsed_time": "5:43:14", "remaining_time": "20:31:11", "throughput": 1805.93, "total_tokens": 37191680} +{"current_steps": 4550, "total_steps": 20825, "loss": 0.831, "learning_rate": 4.6147378454613246e-05, "epoch": 0.2184873949579832, "percentage": 21.85, "elapsed_time": "5:43:59", "remaining_time": "20:30:25", "throughput": 1805.94, "total_tokens": 37273600} +{"current_steps": 4560, "total_steps": 20825, "loss": 0.8871, "learning_rate": 4.6126222452735233e-05, "epoch": 0.21896758703481392, "percentage": 21.9, "elapsed_time": "5:44:44", "remaining_time": "20:29:40", "throughput": 1805.93, "total_tokens": 37355520} +{"current_steps": 4570, "total_steps": 20825, "loss": 0.9688, "learning_rate": 4.6105013399669564e-05, "epoch": 0.21944777911164465, "percentage": 21.94, "elapsed_time": "5:45:30", "remaining_time": "20:28:55", "throughput": 1805.93, "total_tokens": 37437440} +{"current_steps": 4580, "total_steps": 20825, "loss": 0.8533, "learning_rate": 4.608375134867541e-05, "epoch": 0.2199279711884754, "percentage": 21.99, "elapsed_time": "5:46:15", "remaining_time": "20:28:09", "throughput": 1805.94, "total_tokens": 37519360} +{"current_steps": 4590, "total_steps": 20825, "loss": 0.8995, "learning_rate": 4.6062436353145044e-05, "epoch": 0.22040816326530613, "percentage": 22.04, "elapsed_time": "5:47:00", "remaining_time": "20:27:23", "throughput": 1805.95, "total_tokens": 37601280} +{"current_steps": 4600, "total_steps": 20825, "loss": 1.2521, "learning_rate": 4.60410684666037e-05, "epoch": 0.22088835534213686, "percentage": 22.09, "elapsed_time": "5:47:45", "remaining_time": "20:26:37", "throughput": 1805.97, "total_tokens": 37683200} +{"current_steps": 4610, "total_steps": 20825, "loss": 0.998, "learning_rate": 4.601964774270941e-05, "epoch": 0.22136854741896758, "percentage": 22.14, "elapsed_time": "5:48:31", "remaining_time": "20:25:51", "throughput": 1805.99, "total_tokens": 37765120} +{"current_steps": 4620, "total_steps": 20825, "loss": 1.036, "learning_rate": 4.599817423525292e-05, "epoch": 0.2218487394957983, "percentage": 22.18, "elapsed_time": "5:49:16", "remaining_time": "20:25:05", "throughput": 1806.0, "total_tokens": 37847040} +{"current_steps": 4630, "total_steps": 20825, "loss": 1.0166, "learning_rate": 4.597664799815749e-05, "epoch": 0.22232893157262906, "percentage": 22.23, "elapsed_time": "5:50:01", "remaining_time": "20:24:19", "throughput": 1806.02, "total_tokens": 37928960} +{"current_steps": 4640, "total_steps": 20825, "loss": 0.9113, "learning_rate": 4.595506908547881e-05, "epoch": 0.2228091236494598, "percentage": 22.28, "elapsed_time": "5:50:46", "remaining_time": "20:23:33", "throughput": 1806.04, "total_tokens": 38010880} +{"current_steps": 4650, "total_steps": 20825, "loss": 0.9429, "learning_rate": 4.593343755140483e-05, "epoch": 0.22328931572629052, "percentage": 22.33, "elapsed_time": "5:51:31", "remaining_time": "20:22:47", "throughput": 1806.05, "total_tokens": 38092800} +{"current_steps": 4660, "total_steps": 20825, "loss": 1.0135, "learning_rate": 4.5911753450255665e-05, "epoch": 0.22376950780312124, "percentage": 22.38, "elapsed_time": "5:52:16", "remaining_time": "20:22:01", "throughput": 1806.07, "total_tokens": 38174720} +{"current_steps": 4670, "total_steps": 20825, "loss": 0.7263, "learning_rate": 4.589001683648343e-05, "epoch": 0.22424969987995197, "percentage": 22.42, "elapsed_time": "5:53:02", "remaining_time": "20:21:16", "throughput": 1806.05, "total_tokens": 38256640} +{"current_steps": 4680, "total_steps": 20825, "loss": 0.9288, "learning_rate": 4.586822776467208e-05, "epoch": 0.22472989195678272, "percentage": 22.47, "elapsed_time": "5:53:47", "remaining_time": "20:20:31", "throughput": 1806.04, "total_tokens": 38338560} +{"current_steps": 4690, "total_steps": 20825, "loss": 0.9058, "learning_rate": 4.584638628953733e-05, "epoch": 0.22521008403361345, "percentage": 22.52, "elapsed_time": "5:54:33", "remaining_time": "20:19:47", "throughput": 1806.03, "total_tokens": 38420480} +{"current_steps": 4700, "total_steps": 20825, "loss": 0.8911, "learning_rate": 4.582449246592647e-05, "epoch": 0.22569027611044418, "percentage": 22.57, "elapsed_time": "5:55:18", "remaining_time": "20:19:00", "throughput": 1806.05, "total_tokens": 38502400} +{"current_steps": 4710, "total_steps": 20825, "loss": 0.8064, "learning_rate": 4.5802546348818264e-05, "epoch": 0.2261704681872749, "percentage": 22.62, "elapsed_time": "5:56:03", "remaining_time": "20:18:14", "throughput": 1806.07, "total_tokens": 38584320} +{"current_steps": 4720, "total_steps": 20825, "loss": 0.9667, "learning_rate": 4.578054799332277e-05, "epoch": 0.22665066026410563, "percentage": 22.67, "elapsed_time": "5:56:48", "remaining_time": "20:17:29", "throughput": 1806.08, "total_tokens": 38666240} +{"current_steps": 4730, "total_steps": 20825, "loss": 1.0298, "learning_rate": 4.575849745468124e-05, "epoch": 0.22713085234093638, "percentage": 22.71, "elapsed_time": "5:57:34", "remaining_time": "20:16:43", "throughput": 1806.09, "total_tokens": 38748160} +{"current_steps": 4740, "total_steps": 20825, "loss": 0.87, "learning_rate": 4.573639478826596e-05, "epoch": 0.2276110444177671, "percentage": 22.76, "elapsed_time": "5:58:19", "remaining_time": "20:15:57", "throughput": 1806.1, "total_tokens": 38830080} +{"current_steps": 4750, "total_steps": 20825, "loss": 1.0355, "learning_rate": 4.571424004958012e-05, "epoch": 0.22809123649459784, "percentage": 22.81, "elapsed_time": "5:59:04", "remaining_time": "20:15:11", "throughput": 1806.12, "total_tokens": 38912000} +{"current_steps": 4760, "total_steps": 20825, "loss": 1.1281, "learning_rate": 4.5692033294257666e-05, "epoch": 0.22857142857142856, "percentage": 22.86, "elapsed_time": "5:59:49", "remaining_time": "20:14:24", "throughput": 1806.14, "total_tokens": 38993920} +{"current_steps": 4770, "total_steps": 20825, "loss": 0.9067, "learning_rate": 4.5669774578063174e-05, "epoch": 0.2290516206482593, "percentage": 22.91, "elapsed_time": "6:00:34", "remaining_time": "20:13:39", "throughput": 1806.16, "total_tokens": 39075840} +{"current_steps": 4780, "total_steps": 20825, "loss": 0.9853, "learning_rate": 4.56474639568917e-05, "epoch": 0.22953181272509005, "percentage": 22.95, "elapsed_time": "6:01:19", "remaining_time": "20:12:52", "throughput": 1806.18, "total_tokens": 39157760} +{"current_steps": 4790, "total_steps": 20825, "loss": 0.9676, "learning_rate": 4.5625101486768626e-05, "epoch": 0.23001200480192077, "percentage": 23.0, "elapsed_time": "6:02:05", "remaining_time": "20:12:06", "throughput": 1806.19, "total_tokens": 39239680} +{"current_steps": 4800, "total_steps": 20825, "loss": 0.9445, "learning_rate": 4.560268722384956e-05, "epoch": 0.2304921968787515, "percentage": 23.05, "elapsed_time": "6:02:50", "remaining_time": "20:11:21", "throughput": 1806.2, "total_tokens": 39321600} +{"current_steps": 4810, "total_steps": 20825, "loss": 0.939, "learning_rate": 4.558022122442016e-05, "epoch": 0.23097238895558223, "percentage": 23.1, "elapsed_time": "6:03:35", "remaining_time": "20:10:35", "throughput": 1806.22, "total_tokens": 39403520} +{"current_steps": 4820, "total_steps": 20825, "loss": 0.9579, "learning_rate": 4.555770354489598e-05, "epoch": 0.23145258103241295, "percentage": 23.15, "elapsed_time": "6:04:20", "remaining_time": "20:09:49", "throughput": 1806.22, "total_tokens": 39485440} +{"current_steps": 4830, "total_steps": 20825, "loss": 0.8217, "learning_rate": 4.5535134241822394e-05, "epoch": 0.2319327731092437, "percentage": 23.19, "elapsed_time": "6:05:06", "remaining_time": "20:09:03", "throughput": 1806.23, "total_tokens": 39567360} +{"current_steps": 4840, "total_steps": 20825, "loss": 0.8828, "learning_rate": 4.551251337187436e-05, "epoch": 0.23241296518607443, "percentage": 23.24, "elapsed_time": "6:05:51", "remaining_time": "20:08:17", "throughput": 1806.26, "total_tokens": 39649280} +{"current_steps": 4850, "total_steps": 20825, "loss": 1.0273, "learning_rate": 4.548984099185638e-05, "epoch": 0.23289315726290516, "percentage": 23.29, "elapsed_time": "6:06:36", "remaining_time": "20:07:31", "throughput": 1806.27, "total_tokens": 39731200} +{"current_steps": 4860, "total_steps": 20825, "loss": 0.8631, "learning_rate": 4.546711715870227e-05, "epoch": 0.23337334933973589, "percentage": 23.34, "elapsed_time": "6:07:22", "remaining_time": "20:06:49", "throughput": 1806.2, "total_tokens": 39813120} +{"current_steps": 4870, "total_steps": 20825, "loss": 0.9249, "learning_rate": 4.5444341929475064e-05, "epoch": 0.23385354141656664, "percentage": 23.39, "elapsed_time": "6:08:07", "remaining_time": "20:06:03", "throughput": 1806.21, "total_tokens": 39895040} +{"current_steps": 4880, "total_steps": 20825, "loss": 1.3656, "learning_rate": 4.5421515361366854e-05, "epoch": 0.23433373349339737, "percentage": 23.43, "elapsed_time": "6:08:53", "remaining_time": "20:05:18", "throughput": 1806.18, "total_tokens": 39976960} +{"current_steps": 4890, "total_steps": 20825, "loss": 0.6605, "learning_rate": 4.5398637511698665e-05, "epoch": 0.2348139255702281, "percentage": 23.48, "elapsed_time": "6:09:39", "remaining_time": "20:04:35", "throughput": 1806.14, "total_tokens": 40058880} +{"current_steps": 4900, "total_steps": 20825, "loss": 0.9551, "learning_rate": 4.5375708437920284e-05, "epoch": 0.23529411764705882, "percentage": 23.53, "elapsed_time": "6:10:24", "remaining_time": "20:03:49", "throughput": 1806.16, "total_tokens": 40140800} +{"current_steps": 4910, "total_steps": 20825, "loss": 1.0701, "learning_rate": 4.535272819761014e-05, "epoch": 0.23577430972388955, "percentage": 23.58, "elapsed_time": "6:11:09", "remaining_time": "20:03:03", "throughput": 1806.18, "total_tokens": 40222720} +{"current_steps": 4920, "total_steps": 20825, "loss": 1.026, "learning_rate": 4.532969684847514e-05, "epoch": 0.2362545018007203, "percentage": 23.63, "elapsed_time": "6:11:54", "remaining_time": "20:02:17", "throughput": 1806.2, "total_tokens": 40304640} +{"current_steps": 4930, "total_steps": 20825, "loss": 0.9408, "learning_rate": 4.530661444835054e-05, "epoch": 0.23673469387755103, "percentage": 23.67, "elapsed_time": "6:12:39", "remaining_time": "20:01:30", "throughput": 1806.22, "total_tokens": 40386560} +{"current_steps": 4940, "total_steps": 20825, "loss": 1.0037, "learning_rate": 4.5283481055199784e-05, "epoch": 0.23721488595438175, "percentage": 23.72, "elapsed_time": "6:13:24", "remaining_time": "20:00:44", "throughput": 1806.25, "total_tokens": 40468480} +{"current_steps": 4950, "total_steps": 20825, "loss": 1.1308, "learning_rate": 4.526029672711437e-05, "epoch": 0.23769507803121248, "percentage": 23.77, "elapsed_time": "6:14:10", "remaining_time": "19:59:59", "throughput": 1806.23, "total_tokens": 40550400} +{"current_steps": 4960, "total_steps": 20825, "loss": 0.9735, "learning_rate": 4.523706152231373e-05, "epoch": 0.2381752701080432, "percentage": 23.82, "elapsed_time": "6:14:56", "remaining_time": "19:59:15", "throughput": 1806.2, "total_tokens": 40632320} +{"current_steps": 4970, "total_steps": 20825, "loss": 1.0495, "learning_rate": 4.5213775499145e-05, "epoch": 0.23865546218487396, "percentage": 23.87, "elapsed_time": "6:15:41", "remaining_time": "19:58:29", "throughput": 1806.21, "total_tokens": 40714240} +{"current_steps": 4980, "total_steps": 20825, "loss": 0.7898, "learning_rate": 4.519043871608297e-05, "epoch": 0.2391356542617047, "percentage": 23.91, "elapsed_time": "6:16:26", "remaining_time": "19:57:44", "throughput": 1806.22, "total_tokens": 40796160} +{"current_steps": 4990, "total_steps": 20825, "loss": 0.8855, "learning_rate": 4.5167051231729894e-05, "epoch": 0.23961584633853542, "percentage": 23.96, "elapsed_time": "6:17:11", "remaining_time": "19:56:57", "throughput": 1806.25, "total_tokens": 40878080} +{"current_steps": 5000, "total_steps": 20825, "loss": 0.9249, "learning_rate": 4.514361310481533e-05, "epoch": 0.24009603841536614, "percentage": 24.01, "elapsed_time": "6:17:56", "remaining_time": "19:56:11", "throughput": 1806.26, "total_tokens": 40960000} +{"current_steps": 5010, "total_steps": 20825, "loss": 0.9561, "learning_rate": 4.512012439419601e-05, "epoch": 0.24057623049219687, "percentage": 24.06, "elapsed_time": "6:18:45", "remaining_time": "19:55:37", "throughput": 1805.98, "total_tokens": 41041920} +{"current_steps": 5020, "total_steps": 20825, "loss": 1.0238, "learning_rate": 4.509658515885568e-05, "epoch": 0.24105642256902762, "percentage": 24.11, "elapsed_time": "6:19:31", "remaining_time": "19:54:53", "throughput": 1805.96, "total_tokens": 41123840} +{"current_steps": 5030, "total_steps": 20825, "loss": 0.8584, "learning_rate": 4.5072995457904995e-05, "epoch": 0.24153661464585835, "percentage": 24.15, "elapsed_time": "6:20:16", "remaining_time": "19:54:07", "throughput": 1805.97, "total_tokens": 41205760} +{"current_steps": 5040, "total_steps": 20825, "loss": 0.9193, "learning_rate": 4.50493553505813e-05, "epoch": 0.24201680672268908, "percentage": 24.2, "elapsed_time": "6:21:01", "remaining_time": "19:53:21", "throughput": 1805.97, "total_tokens": 41287680} +{"current_steps": 5050, "total_steps": 20825, "loss": 1.0409, "learning_rate": 4.502566489624855e-05, "epoch": 0.2424969987995198, "percentage": 24.25, "elapsed_time": "6:21:47", "remaining_time": "19:52:36", "throughput": 1805.97, "total_tokens": 41369600} +{"current_steps": 5060, "total_steps": 20825, "loss": 0.9899, "learning_rate": 4.50019241543971e-05, "epoch": 0.24297719087635053, "percentage": 24.3, "elapsed_time": "6:22:32", "remaining_time": "19:51:49", "throughput": 1806.0, "total_tokens": 41451520} +{"current_steps": 5070, "total_steps": 20825, "loss": 0.9473, "learning_rate": 4.4978133184643586e-05, "epoch": 0.24345738295318128, "percentage": 24.35, "elapsed_time": "6:23:17", "remaining_time": "19:51:04", "throughput": 1806.01, "total_tokens": 41533440} +{"current_steps": 5080, "total_steps": 20825, "loss": 0.937, "learning_rate": 4.495429204673081e-05, "epoch": 0.243937575030012, "percentage": 24.39, "elapsed_time": "6:24:02", "remaining_time": "19:50:17", "throughput": 1806.04, "total_tokens": 41615360} +{"current_steps": 5090, "total_steps": 20825, "loss": 0.8483, "learning_rate": 4.493040080052752e-05, "epoch": 0.24441776710684274, "percentage": 24.44, "elapsed_time": "6:24:47", "remaining_time": "19:49:32", "throughput": 1806.05, "total_tokens": 41697280} +{"current_steps": 5100, "total_steps": 20825, "loss": 1.0361, "learning_rate": 4.49064595060283e-05, "epoch": 0.24489795918367346, "percentage": 24.49, "elapsed_time": "6:25:32", "remaining_time": "19:48:46", "throughput": 1806.06, "total_tokens": 41779200} +{"current_steps": 5110, "total_steps": 20825, "loss": 1.0274, "learning_rate": 4.488246822335341e-05, "epoch": 0.2453781512605042, "percentage": 24.54, "elapsed_time": "6:26:18", "remaining_time": "19:48:00", "throughput": 1806.07, "total_tokens": 41861120} +{"current_steps": 5120, "total_steps": 20825, "loss": 1.4537, "learning_rate": 4.485842701274865e-05, "epoch": 0.24585834333733494, "percentage": 24.59, "elapsed_time": "6:27:03", "remaining_time": "19:47:15", "throughput": 1806.05, "total_tokens": 41943040} +{"current_steps": 5130, "total_steps": 20825, "loss": 0.8386, "learning_rate": 4.4834335934585194e-05, "epoch": 0.24633853541416567, "percentage": 24.63, "elapsed_time": "6:27:49", "remaining_time": "19:46:31", "throughput": 1806.03, "total_tokens": 42024960} +{"current_steps": 5140, "total_steps": 20825, "loss": 0.8449, "learning_rate": 4.4810195049359435e-05, "epoch": 0.2468187274909964, "percentage": 24.68, "elapsed_time": "6:28:34", "remaining_time": "19:45:45", "throughput": 1806.04, "total_tokens": 42106880} +{"current_steps": 5150, "total_steps": 20825, "loss": 0.9216, "learning_rate": 4.4786004417692836e-05, "epoch": 0.24729891956782712, "percentage": 24.73, "elapsed_time": "6:29:19", "remaining_time": "19:44:59", "throughput": 1806.06, "total_tokens": 42188800} +{"current_steps": 5160, "total_steps": 20825, "loss": 1.0769, "learning_rate": 4.4761764100331795e-05, "epoch": 0.24777911164465785, "percentage": 24.78, "elapsed_time": "6:30:04", "remaining_time": "19:44:13", "throughput": 1806.07, "total_tokens": 42270720} +{"current_steps": 5170, "total_steps": 20825, "loss": 0.8806, "learning_rate": 4.473747415814747e-05, "epoch": 0.2482593037214886, "percentage": 24.83, "elapsed_time": "6:30:49", "remaining_time": "19:43:27", "throughput": 1806.09, "total_tokens": 42352640} +{"current_steps": 5180, "total_steps": 20825, "loss": 1.0999, "learning_rate": 4.471313465213562e-05, "epoch": 0.24873949579831933, "percentage": 24.87, "elapsed_time": "6:31:35", "remaining_time": "19:42:42", "throughput": 1806.08, "total_tokens": 42434560} +{"current_steps": 5190, "total_steps": 20825, "loss": 0.8831, "learning_rate": 4.46887456434165e-05, "epoch": 0.24921968787515006, "percentage": 24.92, "elapsed_time": "6:32:20", "remaining_time": "19:41:56", "throughput": 1806.1, "total_tokens": 42516480} +{"current_steps": 5200, "total_steps": 20825, "loss": 0.8431, "learning_rate": 4.466430719323465e-05, "epoch": 0.24969987995198079, "percentage": 24.97, "elapsed_time": "6:33:05", "remaining_time": "19:41:10", "throughput": 1806.11, "total_tokens": 42598400} +{"current_steps": 5210, "total_steps": 20825, "loss": 1.0951, "learning_rate": 4.463981936295876e-05, "epoch": 0.25018007202881154, "percentage": 25.02, "elapsed_time": "6:33:50", "remaining_time": "19:40:24", "throughput": 1806.13, "total_tokens": 42680320} +{"current_steps": 5220, "total_steps": 20825, "loss": 0.8407, "learning_rate": 4.461528221408153e-05, "epoch": 0.25066026410564224, "percentage": 25.07, "elapsed_time": "6:34:35", "remaining_time": "19:39:38", "throughput": 1806.15, "total_tokens": 42762240} +{"current_steps": 5230, "total_steps": 20825, "loss": 0.9482, "learning_rate": 4.459069580821953e-05, "epoch": 0.251140456182473, "percentage": 25.11, "elapsed_time": "6:35:21", "remaining_time": "19:38:52", "throughput": 1806.16, "total_tokens": 42844160} +{"current_steps": 5240, "total_steps": 20825, "loss": 0.7797, "learning_rate": 4.4566060207112983e-05, "epoch": 0.25162064825930375, "percentage": 25.16, "elapsed_time": "6:36:06", "remaining_time": "19:38:07", "throughput": 1806.16, "total_tokens": 42926080} +{"current_steps": 5250, "total_steps": 20825, "loss": 0.9646, "learning_rate": 4.454137547262566e-05, "epoch": 0.25210084033613445, "percentage": 25.21, "elapsed_time": "6:36:51", "remaining_time": "19:37:21", "throughput": 1806.17, "total_tokens": 43008000} +{"current_steps": 5260, "total_steps": 20825, "loss": 0.9503, "learning_rate": 4.451664166674472e-05, "epoch": 0.2525810324129652, "percentage": 25.26, "elapsed_time": "6:37:36", "remaining_time": "19:36:35", "throughput": 1806.18, "total_tokens": 43089920} +{"current_steps": 5270, "total_steps": 20825, "loss": 0.8684, "learning_rate": 4.449185885158056e-05, "epoch": 0.2530612244897959, "percentage": 25.31, "elapsed_time": "6:38:22", "remaining_time": "19:35:49", "throughput": 1806.19, "total_tokens": 43171840} +{"current_steps": 5280, "total_steps": 20825, "loss": 0.9119, "learning_rate": 4.4467027089366625e-05, "epoch": 0.25354141656662665, "percentage": 25.35, "elapsed_time": "6:39:07", "remaining_time": "19:35:04", "throughput": 1806.2, "total_tokens": 43253760} +{"current_steps": 5290, "total_steps": 20825, "loss": 0.9446, "learning_rate": 4.444214644245928e-05, "epoch": 0.2540216086434574, "percentage": 25.4, "elapsed_time": "6:39:52", "remaining_time": "19:34:18", "throughput": 1806.21, "total_tokens": 43335680} +{"current_steps": 5300, "total_steps": 20825, "loss": 0.8618, "learning_rate": 4.441721697333765e-05, "epoch": 0.2545018007202881, "percentage": 25.45, "elapsed_time": "6:40:37", "remaining_time": "19:33:32", "throughput": 1806.23, "total_tokens": 43417600} +{"current_steps": 5310, "total_steps": 20825, "loss": 0.8695, "learning_rate": 4.4392238744603464e-05, "epoch": 0.25498199279711886, "percentage": 25.5, "elapsed_time": "6:41:22", "remaining_time": "19:32:46", "throughput": 1806.24, "total_tokens": 43499520} +{"current_steps": 5320, "total_steps": 20825, "loss": 1.0076, "learning_rate": 4.436721181898088e-05, "epoch": 0.25546218487394956, "percentage": 25.55, "elapsed_time": "6:42:08", "remaining_time": "19:32:01", "throughput": 1806.24, "total_tokens": 43581440} +{"current_steps": 5330, "total_steps": 20825, "loss": 0.9059, "learning_rate": 4.434213625931636e-05, "epoch": 0.2559423769507803, "percentage": 25.59, "elapsed_time": "6:42:53", "remaining_time": "19:31:15", "throughput": 1806.25, "total_tokens": 43663360} +{"current_steps": 5340, "total_steps": 20825, "loss": 0.9168, "learning_rate": 4.431701212857847e-05, "epoch": 0.25642256902761107, "percentage": 25.64, "elapsed_time": "6:43:38", "remaining_time": "19:30:30", "throughput": 1806.25, "total_tokens": 43745280} +{"current_steps": 5350, "total_steps": 20825, "loss": 0.7605, "learning_rate": 4.429183948985777e-05, "epoch": 0.25690276110444177, "percentage": 25.69, "elapsed_time": "6:44:24", "remaining_time": "19:29:46", "throughput": 1806.2, "total_tokens": 43827200} +{"current_steps": 5360, "total_steps": 20825, "loss": 0.8832, "learning_rate": 4.426661840636662e-05, "epoch": 0.2573829531812725, "percentage": 25.74, "elapsed_time": "6:45:10", "remaining_time": "19:29:00", "throughput": 1806.21, "total_tokens": 43909120} +{"current_steps": 5370, "total_steps": 20825, "loss": 1.0383, "learning_rate": 4.424134894143903e-05, "epoch": 0.2578631452581032, "percentage": 25.79, "elapsed_time": "6:45:55", "remaining_time": "19:28:14", "throughput": 1806.23, "total_tokens": 43991040} +{"current_steps": 5380, "total_steps": 20825, "loss": 1.0498, "learning_rate": 4.42160311585305e-05, "epoch": 0.258343337334934, "percentage": 25.83, "elapsed_time": "6:46:40", "remaining_time": "19:27:28", "throughput": 1806.25, "total_tokens": 44072960} +{"current_steps": 5390, "total_steps": 20825, "loss": 0.6946, "learning_rate": 4.419066512121788e-05, "epoch": 0.25882352941176473, "percentage": 25.88, "elapsed_time": "6:47:25", "remaining_time": "19:26:44", "throughput": 1806.23, "total_tokens": 44154880} +{"current_steps": 5400, "total_steps": 20825, "loss": 0.898, "learning_rate": 4.4165250893199176e-05, "epoch": 0.25930372148859543, "percentage": 25.93, "elapsed_time": "6:48:11", "remaining_time": "19:25:59", "throughput": 1806.21, "total_tokens": 44236800} +{"current_steps": 5410, "total_steps": 20825, "loss": 0.8575, "learning_rate": 4.413978853829342e-05, "epoch": 0.2597839135654262, "percentage": 25.98, "elapsed_time": "6:48:56", "remaining_time": "19:25:14", "throughput": 1806.21, "total_tokens": 44318720} +{"current_steps": 5420, "total_steps": 20825, "loss": 0.953, "learning_rate": 4.411427812044049e-05, "epoch": 0.2602641056422569, "percentage": 26.03, "elapsed_time": "6:49:42", "remaining_time": "19:24:28", "throughput": 1806.21, "total_tokens": 44400640} +{"current_steps": 5430, "total_steps": 20825, "loss": 1.0408, "learning_rate": 4.408871970370096e-05, "epoch": 0.26074429771908764, "percentage": 26.07, "elapsed_time": "6:50:27", "remaining_time": "19:23:43", "throughput": 1806.21, "total_tokens": 44482560} +{"current_steps": 5440, "total_steps": 20825, "loss": 0.9933, "learning_rate": 4.406311335225595e-05, "epoch": 0.2612244897959184, "percentage": 26.12, "elapsed_time": "6:51:12", "remaining_time": "19:22:58", "throughput": 1806.21, "total_tokens": 44564480} +{"current_steps": 5450, "total_steps": 20825, "loss": 0.8562, "learning_rate": 4.4037459130406923e-05, "epoch": 0.2617046818727491, "percentage": 26.17, "elapsed_time": "6:51:58", "remaining_time": "19:22:13", "throughput": 1806.19, "total_tokens": 44646400} +{"current_steps": 5460, "total_steps": 20825, "loss": 0.9538, "learning_rate": 4.401175710257558e-05, "epoch": 0.26218487394957984, "percentage": 26.22, "elapsed_time": "6:52:44", "remaining_time": "19:21:28", "throughput": 1806.17, "total_tokens": 44728320} +{"current_steps": 5470, "total_steps": 20825, "loss": 0.8955, "learning_rate": 4.398600733330365e-05, "epoch": 0.26266506602641054, "percentage": 26.27, "elapsed_time": "6:53:29", "remaining_time": "19:20:42", "throughput": 1806.2, "total_tokens": 44810240} +{"current_steps": 5480, "total_steps": 20825, "loss": 1.1404, "learning_rate": 4.3960209887252766e-05, "epoch": 0.2631452581032413, "percentage": 26.31, "elapsed_time": "6:54:15", "remaining_time": "19:19:59", "throughput": 1806.13, "total_tokens": 44892160} +{"current_steps": 5490, "total_steps": 20825, "loss": 1.0361, "learning_rate": 4.3934364829204265e-05, "epoch": 0.26362545018007205, "percentage": 26.36, "elapsed_time": "6:55:00", "remaining_time": "19:19:13", "throughput": 1806.14, "total_tokens": 44974080} +{"current_steps": 5500, "total_steps": 20825, "loss": 0.8763, "learning_rate": 4.3908472224059064e-05, "epoch": 0.26410564225690275, "percentage": 26.41, "elapsed_time": "6:55:45", "remaining_time": "19:18:27", "throughput": 1806.16, "total_tokens": 45056000} +{"current_steps": 5510, "total_steps": 20825, "loss": 0.8841, "learning_rate": 4.388253213683747e-05, "epoch": 0.2645858343337335, "percentage": 26.46, "elapsed_time": "6:56:30", "remaining_time": "19:17:42", "throughput": 1806.17, "total_tokens": 45137920} +{"current_steps": 5520, "total_steps": 20825, "loss": 0.841, "learning_rate": 4.385654463267901e-05, "epoch": 0.2650660264105642, "percentage": 26.51, "elapsed_time": "6:57:16", "remaining_time": "19:16:56", "throughput": 1806.18, "total_tokens": 45219840} +{"current_steps": 5530, "total_steps": 20825, "loss": 1.1014, "learning_rate": 4.383050977684231e-05, "epoch": 0.26554621848739496, "percentage": 26.55, "elapsed_time": "6:58:01", "remaining_time": "19:16:10", "throughput": 1806.18, "total_tokens": 45301760} +{"current_steps": 5540, "total_steps": 20825, "loss": 0.7611, "learning_rate": 4.3804427634704885e-05, "epoch": 0.2660264105642257, "percentage": 26.6, "elapsed_time": "6:58:46", "remaining_time": "19:15:25", "throughput": 1806.2, "total_tokens": 45383680} +{"current_steps": 5550, "total_steps": 20825, "loss": 0.854, "learning_rate": 4.3778298271762995e-05, "epoch": 0.2665066026410564, "percentage": 26.65, "elapsed_time": "6:59:31", "remaining_time": "19:14:38", "throughput": 1806.22, "total_tokens": 45465600} +{"current_steps": 5560, "total_steps": 20825, "loss": 0.9457, "learning_rate": 4.375212175363149e-05, "epoch": 0.26698679471788717, "percentage": 26.7, "elapsed_time": "7:00:17", "remaining_time": "19:13:53", "throughput": 1806.22, "total_tokens": 45547520} +{"current_steps": 5570, "total_steps": 20825, "loss": 0.8236, "learning_rate": 4.372589814604362e-05, "epoch": 0.26746698679471786, "percentage": 26.75, "elapsed_time": "7:01:02", "remaining_time": "19:13:09", "throughput": 1806.19, "total_tokens": 45629440} +{"current_steps": 5580, "total_steps": 20825, "loss": 0.8256, "learning_rate": 4.369962751485089e-05, "epoch": 0.2679471788715486, "percentage": 26.79, "elapsed_time": "7:01:48", "remaining_time": "19:12:23", "throughput": 1806.19, "total_tokens": 45711360} +{"current_steps": 5590, "total_steps": 20825, "loss": 0.7786, "learning_rate": 4.367330992602289e-05, "epoch": 0.2684273709483794, "percentage": 26.84, "elapsed_time": "7:02:33", "remaining_time": "19:11:38", "throughput": 1806.18, "total_tokens": 45793280} +{"current_steps": 5600, "total_steps": 20825, "loss": 0.7805, "learning_rate": 4.3646945445647114e-05, "epoch": 0.2689075630252101, "percentage": 26.89, "elapsed_time": "7:03:19", "remaining_time": "19:10:53", "throughput": 1806.17, "total_tokens": 45875200} +{"current_steps": 5610, "total_steps": 20825, "loss": 1.0227, "learning_rate": 4.362053413992883e-05, "epoch": 0.2693877551020408, "percentage": 26.94, "elapsed_time": "7:04:04", "remaining_time": "19:10:07", "throughput": 1806.19, "total_tokens": 45957120} +{"current_steps": 5620, "total_steps": 20825, "loss": 0.7345, "learning_rate": 4.359407607519088e-05, "epoch": 0.2698679471788715, "percentage": 26.99, "elapsed_time": "7:04:49", "remaining_time": "19:09:22", "throughput": 1806.18, "total_tokens": 46039040} +{"current_steps": 5630, "total_steps": 20825, "loss": 0.9656, "learning_rate": 4.356757131787353e-05, "epoch": 0.2703481392557023, "percentage": 27.03, "elapsed_time": "7:05:35", "remaining_time": "19:08:38", "throughput": 1806.16, "total_tokens": 46120960} +{"current_steps": 5640, "total_steps": 20825, "loss": 0.8838, "learning_rate": 4.354101993453429e-05, "epoch": 0.27082833133253303, "percentage": 27.08, "elapsed_time": "7:06:20", "remaining_time": "19:07:52", "throughput": 1806.17, "total_tokens": 46202880} +{"current_steps": 5650, "total_steps": 20825, "loss": 0.8414, "learning_rate": 4.3514421991847746e-05, "epoch": 0.27130852340936373, "percentage": 27.13, "elapsed_time": "7:07:05", "remaining_time": "19:07:06", "throughput": 1806.18, "total_tokens": 46284800} +{"current_steps": 5660, "total_steps": 20825, "loss": 0.8546, "learning_rate": 4.3487777556605446e-05, "epoch": 0.2717887154861945, "percentage": 27.18, "elapsed_time": "7:07:51", "remaining_time": "19:06:21", "throughput": 1806.18, "total_tokens": 46366720} +{"current_steps": 5670, "total_steps": 20825, "loss": 1.0363, "learning_rate": 4.3461086695715625e-05, "epoch": 0.2722689075630252, "percentage": 27.23, "elapsed_time": "7:08:36", "remaining_time": "19:05:36", "throughput": 1806.16, "total_tokens": 46448640} +{"current_steps": 5680, "total_steps": 20825, "loss": 0.799, "learning_rate": 4.343434947620315e-05, "epoch": 0.27274909963985594, "percentage": 27.27, "elapsed_time": "7:09:21", "remaining_time": "19:04:51", "throughput": 1806.17, "total_tokens": 46530560} +{"current_steps": 5690, "total_steps": 20825, "loss": 0.9422, "learning_rate": 4.340756596520929e-05, "epoch": 0.2732292917166867, "percentage": 27.32, "elapsed_time": "7:10:07", "remaining_time": "19:04:05", "throughput": 1806.18, "total_tokens": 46612480} +{"current_steps": 5700, "total_steps": 20825, "loss": 0.904, "learning_rate": 4.338073622999154e-05, "epoch": 0.2737094837935174, "percentage": 27.37, "elapsed_time": "7:10:52", "remaining_time": "19:03:19", "throughput": 1806.2, "total_tokens": 46694400} +{"current_steps": 5710, "total_steps": 20825, "loss": 1.2078, "learning_rate": 4.335386033792347e-05, "epoch": 0.27418967587034815, "percentage": 27.42, "elapsed_time": "7:11:37", "remaining_time": "19:02:34", "throughput": 1806.18, "total_tokens": 46776320} +{"current_steps": 5720, "total_steps": 20825, "loss": 0.887, "learning_rate": 4.332693835649461e-05, "epoch": 0.27466986794717885, "percentage": 27.47, "elapsed_time": "7:12:23", "remaining_time": "19:01:48", "throughput": 1806.2, "total_tokens": 46858240} +{"current_steps": 5730, "total_steps": 20825, "loss": 0.9954, "learning_rate": 4.329997035331015e-05, "epoch": 0.2751500600240096, "percentage": 27.52, "elapsed_time": "7:13:08", "remaining_time": "19:01:03", "throughput": 1806.2, "total_tokens": 46940160} +{"current_steps": 5740, "total_steps": 20825, "loss": 0.8496, "learning_rate": 4.3272956396090906e-05, "epoch": 0.27563025210084036, "percentage": 27.56, "elapsed_time": "7:13:53", "remaining_time": "19:00:17", "throughput": 1806.22, "total_tokens": 47022080} +{"current_steps": 5750, "total_steps": 20825, "loss": 0.9616, "learning_rate": 4.324589655267306e-05, "epoch": 0.27611044417767105, "percentage": 27.61, "elapsed_time": "7:14:38", "remaining_time": "18:59:31", "throughput": 1806.23, "total_tokens": 47104000} +{"current_steps": 5760, "total_steps": 20825, "loss": 1.0649, "learning_rate": 4.321879089100805e-05, "epoch": 0.2765906362545018, "percentage": 27.66, "elapsed_time": "7:15:23", "remaining_time": "18:58:45", "throughput": 1806.24, "total_tokens": 47185920} +{"current_steps": 5770, "total_steps": 20825, "loss": 0.9002, "learning_rate": 4.319163947916234e-05, "epoch": 0.2770708283313325, "percentage": 27.71, "elapsed_time": "7:16:08", "remaining_time": "18:57:59", "throughput": 1806.26, "total_tokens": 47267840} +{"current_steps": 5780, "total_steps": 20825, "loss": 0.9649, "learning_rate": 4.316444238531729e-05, "epoch": 0.27755102040816326, "percentage": 27.76, "elapsed_time": "7:16:53", "remaining_time": "18:57:13", "throughput": 1806.28, "total_tokens": 47349760} +{"current_steps": 5790, "total_steps": 20825, "loss": 0.9747, "learning_rate": 4.313719967776899e-05, "epoch": 0.278031212484994, "percentage": 27.8, "elapsed_time": "7:17:39", "remaining_time": "18:56:27", "throughput": 1806.29, "total_tokens": 47431680} +{"current_steps": 5800, "total_steps": 20825, "loss": 1.0223, "learning_rate": 4.310991142492805e-05, "epoch": 0.2785114045618247, "percentage": 27.85, "elapsed_time": "7:18:24", "remaining_time": "18:55:43", "throughput": 1806.27, "total_tokens": 47513600} +{"current_steps": 5810, "total_steps": 20825, "loss": 0.9318, "learning_rate": 4.308257769531947e-05, "epoch": 0.27899159663865547, "percentage": 27.9, "elapsed_time": "7:19:09", "remaining_time": "18:54:57", "throughput": 1806.29, "total_tokens": 47595520} +{"current_steps": 5820, "total_steps": 20825, "loss": 1.0057, "learning_rate": 4.3055198557582445e-05, "epoch": 0.27947178871548617, "percentage": 27.95, "elapsed_time": "7:19:55", "remaining_time": "18:54:11", "throughput": 1806.3, "total_tokens": 47677440} +{"current_steps": 5830, "total_steps": 20825, "loss": 1.126, "learning_rate": 4.3027774080470174e-05, "epoch": 0.2799519807923169, "percentage": 28.0, "elapsed_time": "7:20:40", "remaining_time": "18:53:25", "throughput": 1806.3, "total_tokens": 47759360} +{"current_steps": 5840, "total_steps": 20825, "loss": 0.8118, "learning_rate": 4.300030433284974e-05, "epoch": 0.2804321728691477, "percentage": 28.04, "elapsed_time": "7:21:25", "remaining_time": "18:52:40", "throughput": 1806.3, "total_tokens": 47841280} +{"current_steps": 5850, "total_steps": 20825, "loss": 0.7263, "learning_rate": 4.29727893837019e-05, "epoch": 0.2809123649459784, "percentage": 28.09, "elapsed_time": "7:22:11", "remaining_time": "18:51:55", "throughput": 1806.3, "total_tokens": 47923200} +{"current_steps": 5860, "total_steps": 20825, "loss": 0.8095, "learning_rate": 4.294522930212091e-05, "epoch": 0.28139255702280913, "percentage": 28.14, "elapsed_time": "7:22:56", "remaining_time": "18:51:09", "throughput": 1806.32, "total_tokens": 48005120} +{"current_steps": 5870, "total_steps": 20825, "loss": 0.9164, "learning_rate": 4.291762415731437e-05, "epoch": 0.28187274909963983, "percentage": 28.19, "elapsed_time": "7:23:41", "remaining_time": "18:50:23", "throughput": 1806.34, "total_tokens": 48087040} +{"current_steps": 5880, "total_steps": 20825, "loss": 1.0349, "learning_rate": 4.288997401860303e-05, "epoch": 0.2823529411764706, "percentage": 28.24, "elapsed_time": "7:24:27", "remaining_time": "18:49:39", "throughput": 1806.29, "total_tokens": 48168960} +{"current_steps": 5890, "total_steps": 20825, "loss": 1.3606, "learning_rate": 4.286227895542064e-05, "epoch": 0.28283313325330134, "percentage": 28.28, "elapsed_time": "7:25:12", "remaining_time": "18:48:53", "throughput": 1806.3, "total_tokens": 48250880} +{"current_steps": 5900, "total_steps": 20825, "loss": 0.8476, "learning_rate": 4.283453903731375e-05, "epoch": 0.28331332533013204, "percentage": 28.33, "elapsed_time": "7:25:58", "remaining_time": "18:48:08", "throughput": 1806.29, "total_tokens": 48332800} +{"current_steps": 5910, "total_steps": 20825, "loss": 1.1286, "learning_rate": 4.2806754333941546e-05, "epoch": 0.2837935174069628, "percentage": 28.38, "elapsed_time": "7:26:43", "remaining_time": "18:47:23", "throughput": 1806.3, "total_tokens": 48414720} +{"current_steps": 5920, "total_steps": 20825, "loss": 0.9471, "learning_rate": 4.2778924915075704e-05, "epoch": 0.2842737094837935, "percentage": 28.43, "elapsed_time": "7:27:28", "remaining_time": "18:46:37", "throughput": 1806.31, "total_tokens": 48496640} +{"current_steps": 5930, "total_steps": 20825, "loss": 0.9296, "learning_rate": 4.275105085060014e-05, "epoch": 0.28475390156062425, "percentage": 28.48, "elapsed_time": "7:28:13", "remaining_time": "18:45:51", "throughput": 1806.33, "total_tokens": 48578560} +{"current_steps": 5940, "total_steps": 20825, "loss": 1.0404, "learning_rate": 4.272313221051094e-05, "epoch": 0.285234093637455, "percentage": 28.52, "elapsed_time": "7:28:58", "remaining_time": "18:45:05", "throughput": 1806.34, "total_tokens": 48660480} +{"current_steps": 5950, "total_steps": 20825, "loss": 0.9517, "learning_rate": 4.269516906491607e-05, "epoch": 0.2857142857142857, "percentage": 28.57, "elapsed_time": "7:29:43", "remaining_time": "18:44:19", "throughput": 1806.35, "total_tokens": 48742400} +{"current_steps": 5960, "total_steps": 20825, "loss": 0.7284, "learning_rate": 4.266716148403529e-05, "epoch": 0.28619447779111645, "percentage": 28.62, "elapsed_time": "7:30:29", "remaining_time": "18:43:33", "throughput": 1806.37, "total_tokens": 48824320} +{"current_steps": 5970, "total_steps": 20825, "loss": 0.98, "learning_rate": 4.263910953819993e-05, "epoch": 0.28667466986794715, "percentage": 28.67, "elapsed_time": "7:31:13", "remaining_time": "18:42:47", "throughput": 1806.39, "total_tokens": 48906240} +{"current_steps": 5980, "total_steps": 20825, "loss": 0.9762, "learning_rate": 4.2611013297852744e-05, "epoch": 0.2871548619447779, "percentage": 28.72, "elapsed_time": "7:31:59", "remaining_time": "18:42:01", "throughput": 1806.4, "total_tokens": 48988160} +{"current_steps": 5990, "total_steps": 20825, "loss": 0.9233, "learning_rate": 4.2582872833547693e-05, "epoch": 0.28763505402160866, "percentage": 28.76, "elapsed_time": "7:32:45", "remaining_time": "18:41:17", "throughput": 1806.37, "total_tokens": 49070080} +{"current_steps": 6000, "total_steps": 20825, "loss": 1.0877, "learning_rate": 4.255468821594981e-05, "epoch": 0.28811524609843936, "percentage": 28.81, "elapsed_time": "7:33:30", "remaining_time": "18:40:32", "throughput": 1806.37, "total_tokens": 49152000} +{"current_steps": 6010, "total_steps": 20825, "loss": 0.9164, "learning_rate": 4.2526459515834996e-05, "epoch": 0.2885954381752701, "percentage": 28.86, "elapsed_time": "7:34:18", "remaining_time": "18:39:54", "throughput": 1806.17, "total_tokens": 49233920} +{"current_steps": 6020, "total_steps": 20825, "loss": 1.01, "learning_rate": 4.249818680408984e-05, "epoch": 0.28907563025210087, "percentage": 28.91, "elapsed_time": "7:35:04", "remaining_time": "18:39:09", "throughput": 1806.17, "total_tokens": 49315840} +{"current_steps": 6030, "total_steps": 20825, "loss": 1.057, "learning_rate": 4.246987015171148e-05, "epoch": 0.28955582232893157, "percentage": 28.96, "elapsed_time": "7:35:49", "remaining_time": "18:38:23", "throughput": 1806.17, "total_tokens": 49397760} +{"current_steps": 6040, "total_steps": 20825, "loss": 1.1284, "learning_rate": 4.244150962980735e-05, "epoch": 0.2900360144057623, "percentage": 29.0, "elapsed_time": "7:36:34", "remaining_time": "18:37:38", "throughput": 1806.17, "total_tokens": 49479680} +{"current_steps": 6050, "total_steps": 20825, "loss": 0.9011, "learning_rate": 4.2413105309595105e-05, "epoch": 0.290516206482593, "percentage": 29.05, "elapsed_time": "7:37:20", "remaining_time": "18:36:52", "throughput": 1806.18, "total_tokens": 49561600} +{"current_steps": 6060, "total_steps": 20825, "loss": 0.8397, "learning_rate": 4.238465726240233e-05, "epoch": 0.2909963985594238, "percentage": 29.1, "elapsed_time": "7:38:05", "remaining_time": "18:36:07", "throughput": 1806.16, "total_tokens": 49643520} +{"current_steps": 6070, "total_steps": 20825, "loss": 0.8792, "learning_rate": 4.235616555966645e-05, "epoch": 0.29147659063625453, "percentage": 29.15, "elapsed_time": "7:38:50", "remaining_time": "18:35:21", "throughput": 1806.18, "total_tokens": 49725440} +{"current_steps": 6080, "total_steps": 20825, "loss": 0.7543, "learning_rate": 4.232763027293451e-05, "epoch": 0.29195678271308523, "percentage": 29.2, "elapsed_time": "7:39:36", "remaining_time": "18:34:36", "throughput": 1806.17, "total_tokens": 49807360} +{"current_steps": 6090, "total_steps": 20825, "loss": 1.0364, "learning_rate": 4.2299051473862976e-05, "epoch": 0.292436974789916, "percentage": 29.24, "elapsed_time": "7:40:21", "remaining_time": "18:33:51", "throughput": 1806.18, "total_tokens": 49889280} +{"current_steps": 6100, "total_steps": 20825, "loss": 0.9792, "learning_rate": 4.227042923421762e-05, "epoch": 0.2929171668667467, "percentage": 29.29, "elapsed_time": "7:41:06", "remaining_time": "18:33:05", "throughput": 1806.2, "total_tokens": 49971200} +{"current_steps": 6110, "total_steps": 20825, "loss": 0.9951, "learning_rate": 4.224176362587326e-05, "epoch": 0.29339735894357744, "percentage": 29.34, "elapsed_time": "7:41:51", "remaining_time": "18:32:19", "throughput": 1806.2, "total_tokens": 50053120} +{"current_steps": 6120, "total_steps": 20825, "loss": 0.8709, "learning_rate": 4.221305472081365e-05, "epoch": 0.2938775510204082, "percentage": 29.39, "elapsed_time": "7:42:37", "remaining_time": "18:31:34", "throughput": 1806.2, "total_tokens": 50135040} +{"current_steps": 6130, "total_steps": 20825, "loss": 0.9572, "learning_rate": 4.2184302591131264e-05, "epoch": 0.2943577430972389, "percentage": 29.44, "elapsed_time": "7:43:22", "remaining_time": "18:30:48", "throughput": 1806.22, "total_tokens": 50216960} +{"current_steps": 6140, "total_steps": 20825, "loss": 1.0038, "learning_rate": 4.21555073090271e-05, "epoch": 0.29483793517406964, "percentage": 29.48, "elapsed_time": "7:44:07", "remaining_time": "18:30:02", "throughput": 1806.23, "total_tokens": 50298880} +{"current_steps": 6150, "total_steps": 20825, "loss": 1.1052, "learning_rate": 4.2126668946810545e-05, "epoch": 0.29531812725090034, "percentage": 29.53, "elapsed_time": "7:44:52", "remaining_time": "18:29:16", "throughput": 1806.25, "total_tokens": 50380800} +{"current_steps": 6160, "total_steps": 20825, "loss": 0.788, "learning_rate": 4.2097787576899144e-05, "epoch": 0.2957983193277311, "percentage": 29.58, "elapsed_time": "7:45:37", "remaining_time": "18:28:30", "throughput": 1806.26, "total_tokens": 50462720} +{"current_steps": 6170, "total_steps": 20825, "loss": 0.8364, "learning_rate": 4.2068863271818455e-05, "epoch": 0.29627851140456185, "percentage": 29.63, "elapsed_time": "7:46:22", "remaining_time": "18:27:44", "throughput": 1806.27, "total_tokens": 50544640} +{"current_steps": 6180, "total_steps": 20825, "loss": 0.7908, "learning_rate": 4.2039896104201844e-05, "epoch": 0.29675870348139255, "percentage": 29.68, "elapsed_time": "7:47:08", "remaining_time": "18:27:00", "throughput": 1806.26, "total_tokens": 50626560} +{"current_steps": 6190, "total_steps": 20825, "loss": 0.8223, "learning_rate": 4.201088614679032e-05, "epoch": 0.2972388955582233, "percentage": 29.72, "elapsed_time": "7:47:53", "remaining_time": "18:26:14", "throughput": 1806.26, "total_tokens": 50708480} +{"current_steps": 6200, "total_steps": 20825, "loss": 0.9225, "learning_rate": 4.198183347243233e-05, "epoch": 0.297719087635054, "percentage": 29.77, "elapsed_time": "7:48:38", "remaining_time": "18:25:29", "throughput": 1806.27, "total_tokens": 50790400} +{"current_steps": 6210, "total_steps": 20825, "loss": 0.8484, "learning_rate": 4.1952738154083614e-05, "epoch": 0.29819927971188476, "percentage": 29.82, "elapsed_time": "7:49:24", "remaining_time": "18:24:43", "throughput": 1806.28, "total_tokens": 50872320} +{"current_steps": 6220, "total_steps": 20825, "loss": 0.9279, "learning_rate": 4.1923600264806975e-05, "epoch": 0.2986794717887155, "percentage": 29.87, "elapsed_time": "7:50:09", "remaining_time": "18:23:57", "throughput": 1806.29, "total_tokens": 50954240} +{"current_steps": 6230, "total_steps": 20825, "loss": 0.8793, "learning_rate": 4.189441987777212e-05, "epoch": 0.2991596638655462, "percentage": 29.92, "elapsed_time": "7:50:54", "remaining_time": "18:23:12", "throughput": 1806.29, "total_tokens": 51036160} +{"current_steps": 6240, "total_steps": 20825, "loss": 0.809, "learning_rate": 4.186519706625549e-05, "epoch": 0.29963985594237696, "percentage": 29.96, "elapsed_time": "7:51:40", "remaining_time": "18:22:27", "throughput": 1806.26, "total_tokens": 51118080} +{"current_steps": 6250, "total_steps": 20825, "loss": 1.015, "learning_rate": 4.1835931903640046e-05, "epoch": 0.30012004801920766, "percentage": 30.01, "elapsed_time": "7:52:25", "remaining_time": "18:21:41", "throughput": 1806.28, "total_tokens": 51200000} +{"current_steps": 6260, "total_steps": 20825, "loss": 0.971, "learning_rate": 4.180662446341511e-05, "epoch": 0.3006002400960384, "percentage": 30.06, "elapsed_time": "7:53:10", "remaining_time": "18:20:55", "throughput": 1806.3, "total_tokens": 51281920} +{"current_steps": 6270, "total_steps": 20825, "loss": 0.9027, "learning_rate": 4.1777274819176154e-05, "epoch": 0.3010804321728692, "percentage": 30.11, "elapsed_time": "7:53:55", "remaining_time": "18:20:09", "throughput": 1806.33, "total_tokens": 51363840} +{"current_steps": 6280, "total_steps": 20825, "loss": 0.9546, "learning_rate": 4.1747883044624644e-05, "epoch": 0.30156062424969987, "percentage": 30.16, "elapsed_time": "7:54:40", "remaining_time": "18:19:24", "throughput": 1806.32, "total_tokens": 51445760} +{"current_steps": 6290, "total_steps": 20825, "loss": 1.041, "learning_rate": 4.171844921356784e-05, "epoch": 0.3020408163265306, "percentage": 30.2, "elapsed_time": "7:55:26", "remaining_time": "18:18:38", "throughput": 1806.33, "total_tokens": 51527680} +{"current_steps": 6300, "total_steps": 20825, "loss": 1.0105, "learning_rate": 4.168897339991861e-05, "epoch": 0.3025210084033613, "percentage": 30.25, "elapsed_time": "7:56:11", "remaining_time": "18:17:52", "throughput": 1806.35, "total_tokens": 51609600} +{"current_steps": 6310, "total_steps": 20825, "loss": 1.0367, "learning_rate": 4.1659455677695245e-05, "epoch": 0.3030012004801921, "percentage": 30.3, "elapsed_time": "7:56:56", "remaining_time": "18:17:07", "throughput": 1806.35, "total_tokens": 51691520} +{"current_steps": 6320, "total_steps": 20825, "loss": 0.6583, "learning_rate": 4.162989612102128e-05, "epoch": 0.30348139255702283, "percentage": 30.35, "elapsed_time": "7:57:41", "remaining_time": "18:16:21", "throughput": 1806.34, "total_tokens": 51773440} +{"current_steps": 6330, "total_steps": 20825, "loss": 0.9942, "learning_rate": 4.160029480412529e-05, "epoch": 0.30396158463385353, "percentage": 30.4, "elapsed_time": "7:58:27", "remaining_time": "18:15:36", "throughput": 1806.35, "total_tokens": 51855360} +{"current_steps": 6340, "total_steps": 20825, "loss": 0.8157, "learning_rate": 4.1570651801340735e-05, "epoch": 0.3044417767106843, "percentage": 30.44, "elapsed_time": "7:59:12", "remaining_time": "18:14:50", "throughput": 1806.37, "total_tokens": 51937280} +{"current_steps": 6350, "total_steps": 20825, "loss": 1.0806, "learning_rate": 4.1540967187105753e-05, "epoch": 0.304921968787515, "percentage": 30.49, "elapsed_time": "7:59:57", "remaining_time": "18:14:04", "throughput": 1806.39, "total_tokens": 52019200} +{"current_steps": 6360, "total_steps": 20825, "loss": 0.815, "learning_rate": 4.151124103596295e-05, "epoch": 0.30540216086434574, "percentage": 30.54, "elapsed_time": "8:00:42", "remaining_time": "18:13:18", "throughput": 1806.4, "total_tokens": 52101120} +{"current_steps": 6370, "total_steps": 20825, "loss": 0.9705, "learning_rate": 4.148147342255926e-05, "epoch": 0.3058823529411765, "percentage": 30.59, "elapsed_time": "8:01:27", "remaining_time": "18:12:32", "throughput": 1806.42, "total_tokens": 52183040} +{"current_steps": 6380, "total_steps": 20825, "loss": 0.8492, "learning_rate": 4.145166442164573e-05, "epoch": 0.3063625450180072, "percentage": 30.64, "elapsed_time": "8:02:13", "remaining_time": "18:11:47", "throughput": 1806.41, "total_tokens": 52264960} +{"current_steps": 6390, "total_steps": 20825, "loss": 0.9553, "learning_rate": 4.142181410807735e-05, "epoch": 0.30684273709483795, "percentage": 30.68, "elapsed_time": "8:02:58", "remaining_time": "18:11:02", "throughput": 1806.41, "total_tokens": 52346880} +{"current_steps": 6400, "total_steps": 20825, "loss": 0.9121, "learning_rate": 4.1391922556812815e-05, "epoch": 0.30732292917166865, "percentage": 30.73, "elapsed_time": "8:03:43", "remaining_time": "18:10:16", "throughput": 1806.42, "total_tokens": 52428800} +{"current_steps": 6410, "total_steps": 20825, "loss": 0.8654, "learning_rate": 4.136198984291442e-05, "epoch": 0.3078031212484994, "percentage": 30.78, "elapsed_time": "8:04:28", "remaining_time": "18:09:31", "throughput": 1806.42, "total_tokens": 52510720} +{"current_steps": 6420, "total_steps": 20825, "loss": 0.9387, "learning_rate": 4.133201604154779e-05, "epoch": 0.30828331332533015, "percentage": 30.83, "elapsed_time": "8:05:14", "remaining_time": "18:08:46", "throughput": 1806.41, "total_tokens": 52592640} +{"current_steps": 6430, "total_steps": 20825, "loss": 1.084, "learning_rate": 4.1302001227981765e-05, "epoch": 0.30876350540216085, "percentage": 30.88, "elapsed_time": "8:06:00", "remaining_time": "18:08:01", "throughput": 1806.4, "total_tokens": 52674560} +{"current_steps": 6440, "total_steps": 20825, "loss": 0.7468, "learning_rate": 4.1271945477588126e-05, "epoch": 0.3092436974789916, "percentage": 30.92, "elapsed_time": "8:06:45", "remaining_time": "18:07:15", "throughput": 1806.39, "total_tokens": 52756480} +{"current_steps": 6450, "total_steps": 20825, "loss": 0.9378, "learning_rate": 4.124184886584148e-05, "epoch": 0.3097238895558223, "percentage": 30.97, "elapsed_time": "8:07:30", "remaining_time": "18:06:31", "throughput": 1806.38, "total_tokens": 52838400} +{"current_steps": 6460, "total_steps": 20825, "loss": 1.0187, "learning_rate": 4.121171146831905e-05, "epoch": 0.31020408163265306, "percentage": 31.02, "elapsed_time": "8:08:16", "remaining_time": "18:05:45", "throughput": 1806.4, "total_tokens": 52920320} +{"current_steps": 6470, "total_steps": 20825, "loss": 1.1429, "learning_rate": 4.118153336070045e-05, "epoch": 0.3106842737094838, "percentage": 31.07, "elapsed_time": "8:09:01", "remaining_time": "18:05:00", "throughput": 1806.38, "total_tokens": 53002240} +{"current_steps": 6480, "total_steps": 20825, "loss": 1.0201, "learning_rate": 4.115131461876756e-05, "epoch": 0.3111644657863145, "percentage": 31.12, "elapsed_time": "8:09:47", "remaining_time": "18:04:15", "throughput": 1806.37, "total_tokens": 53084160} +{"current_steps": 6490, "total_steps": 20825, "loss": 0.9806, "learning_rate": 4.1121055318404264e-05, "epoch": 0.31164465786314527, "percentage": 31.16, "elapsed_time": "8:10:32", "remaining_time": "18:03:29", "throughput": 1806.39, "total_tokens": 53166080} +{"current_steps": 6500, "total_steps": 20825, "loss": 1.1109, "learning_rate": 4.109075553559633e-05, "epoch": 0.31212484993997597, "percentage": 31.21, "elapsed_time": "8:11:17", "remaining_time": "18:02:43", "throughput": 1806.39, "total_tokens": 53248000} +{"current_steps": 6510, "total_steps": 20825, "loss": 0.9303, "learning_rate": 4.1060415346431134e-05, "epoch": 0.3126050420168067, "percentage": 31.26, "elapsed_time": "8:12:02", "remaining_time": "18:01:58", "throughput": 1806.4, "total_tokens": 53329920} +{"current_steps": 6520, "total_steps": 20825, "loss": 0.9677, "learning_rate": 4.103003482709758e-05, "epoch": 0.3130852340936375, "percentage": 31.31, "elapsed_time": "8:12:48", "remaining_time": "18:01:12", "throughput": 1806.4, "total_tokens": 53411840} +{"current_steps": 6530, "total_steps": 20825, "loss": 0.7746, "learning_rate": 4.0999614053885795e-05, "epoch": 0.3135654261704682, "percentage": 31.36, "elapsed_time": "8:13:33", "remaining_time": "18:00:28", "throughput": 1806.38, "total_tokens": 53493760} +{"current_steps": 6540, "total_steps": 20825, "loss": 0.8491, "learning_rate": 4.096915310318702e-05, "epoch": 0.31404561824729893, "percentage": 31.4, "elapsed_time": "8:14:18", "remaining_time": "17:59:42", "throughput": 1806.4, "total_tokens": 53575680} +{"current_steps": 6550, "total_steps": 20825, "loss": 0.9473, "learning_rate": 4.093865205149337e-05, "epoch": 0.31452581032412963, "percentage": 31.45, "elapsed_time": "8:15:04", "remaining_time": "17:58:56", "throughput": 1806.4, "total_tokens": 53657600} +{"current_steps": 6560, "total_steps": 20825, "loss": 0.7859, "learning_rate": 4.090811097539768e-05, "epoch": 0.3150060024009604, "percentage": 31.5, "elapsed_time": "8:15:49", "remaining_time": "17:58:11", "throughput": 1806.39, "total_tokens": 53739520} +{"current_steps": 6570, "total_steps": 20825, "loss": 0.7647, "learning_rate": 4.087752995159327e-05, "epoch": 0.31548619447779114, "percentage": 31.55, "elapsed_time": "8:16:34", "remaining_time": "17:57:26", "throughput": 1806.39, "total_tokens": 53821440} +{"current_steps": 6580, "total_steps": 20825, "loss": 0.988, "learning_rate": 4.084690905687379e-05, "epoch": 0.31596638655462184, "percentage": 31.6, "elapsed_time": "8:17:20", "remaining_time": "17:56:40", "throughput": 1806.4, "total_tokens": 53903360} +{"current_steps": 6590, "total_steps": 20825, "loss": 1.148, "learning_rate": 4.0816248368133016e-05, "epoch": 0.3164465786314526, "percentage": 31.64, "elapsed_time": "8:18:05", "remaining_time": "17:55:56", "throughput": 1806.38, "total_tokens": 53985280} +{"current_steps": 6600, "total_steps": 20825, "loss": 0.7685, "learning_rate": 4.078554796236462e-05, "epoch": 0.3169267707082833, "percentage": 31.69, "elapsed_time": "8:18:51", "remaining_time": "17:55:10", "throughput": 1806.39, "total_tokens": 54067200} +{"current_steps": 6610, "total_steps": 20825, "loss": 1.0151, "learning_rate": 4.0754807916662055e-05, "epoch": 0.31740696278511404, "percentage": 31.74, "elapsed_time": "8:19:36", "remaining_time": "17:54:25", "throughput": 1806.39, "total_tokens": 54149120} +{"current_steps": 6620, "total_steps": 20825, "loss": 0.9232, "learning_rate": 4.072402830821829e-05, "epoch": 0.3178871548619448, "percentage": 31.79, "elapsed_time": "8:20:21", "remaining_time": "17:53:39", "throughput": 1806.4, "total_tokens": 54231040} +{"current_steps": 6630, "total_steps": 20825, "loss": 0.907, "learning_rate": 4.069320921432564e-05, "epoch": 0.3183673469387755, "percentage": 31.84, "elapsed_time": "8:21:06", "remaining_time": "17:52:53", "throughput": 1806.41, "total_tokens": 54312960} +{"current_steps": 6640, "total_steps": 20825, "loss": 0.837, "learning_rate": 4.066235071237559e-05, "epoch": 0.31884753901560625, "percentage": 31.88, "elapsed_time": "8:21:51", "remaining_time": "17:52:07", "throughput": 1806.43, "total_tokens": 54394880} +{"current_steps": 6650, "total_steps": 20825, "loss": 0.9814, "learning_rate": 4.0631452879858565e-05, "epoch": 0.31932773109243695, "percentage": 31.93, "elapsed_time": "8:22:36", "remaining_time": "17:51:21", "throughput": 1806.44, "total_tokens": 54476800} +{"current_steps": 6660, "total_steps": 20825, "loss": 0.9107, "learning_rate": 4.0600515794363774e-05, "epoch": 0.3198079231692677, "percentage": 31.98, "elapsed_time": "8:23:21", "remaining_time": "17:50:35", "throughput": 1806.46, "total_tokens": 54558720} +{"current_steps": 6670, "total_steps": 20825, "loss": 0.9817, "learning_rate": 4.0569539533578985e-05, "epoch": 0.32028811524609846, "percentage": 32.03, "elapsed_time": "8:24:07", "remaining_time": "17:49:50", "throughput": 1806.48, "total_tokens": 54640640} +{"current_steps": 6680, "total_steps": 20825, "loss": 0.7322, "learning_rate": 4.053852417529035e-05, "epoch": 0.32076830732292916, "percentage": 32.08, "elapsed_time": "8:24:52", "remaining_time": "17:49:04", "throughput": 1806.47, "total_tokens": 54722560} +{"current_steps": 6690, "total_steps": 20825, "loss": 0.9097, "learning_rate": 4.050746979738218e-05, "epoch": 0.3212484993997599, "percentage": 32.12, "elapsed_time": "8:25:37", "remaining_time": "17:48:19", "throughput": 1806.48, "total_tokens": 54804480} +{"current_steps": 6700, "total_steps": 20825, "loss": 1.0164, "learning_rate": 4.047637647783681e-05, "epoch": 0.3217286914765906, "percentage": 32.17, "elapsed_time": "8:26:23", "remaining_time": "17:47:33", "throughput": 1806.48, "total_tokens": 54886400} +{"current_steps": 6710, "total_steps": 20825, "loss": 0.888, "learning_rate": 4.044524429473431e-05, "epoch": 0.32220888355342137, "percentage": 32.22, "elapsed_time": "8:27:08", "remaining_time": "17:46:48", "throughput": 1806.49, "total_tokens": 54968320} +{"current_steps": 6720, "total_steps": 20825, "loss": 0.8352, "learning_rate": 4.041407332625238e-05, "epoch": 0.3226890756302521, "percentage": 32.27, "elapsed_time": "8:27:53", "remaining_time": "17:46:02", "throughput": 1806.5, "total_tokens": 55050240} +{"current_steps": 6730, "total_steps": 20825, "loss": 0.843, "learning_rate": 4.038286365066613e-05, "epoch": 0.3231692677070828, "percentage": 32.32, "elapsed_time": "8:28:38", "remaining_time": "17:45:16", "throughput": 1806.52, "total_tokens": 55132160} +{"current_steps": 6740, "total_steps": 20825, "loss": 0.9569, "learning_rate": 4.0351615346347804e-05, "epoch": 0.3236494597839136, "percentage": 32.36, "elapsed_time": "8:29:23", "remaining_time": "17:44:30", "throughput": 1806.52, "total_tokens": 55214080} +{"current_steps": 6750, "total_steps": 20825, "loss": 0.912, "learning_rate": 4.032032849176673e-05, "epoch": 0.3241296518607443, "percentage": 32.41, "elapsed_time": "8:30:09", "remaining_time": "17:43:45", "throughput": 1806.52, "total_tokens": 55296000} +{"current_steps": 6760, "total_steps": 20825, "loss": 0.8669, "learning_rate": 4.0289003165488976e-05, "epoch": 0.324609843937575, "percentage": 32.46, "elapsed_time": "8:30:54", "remaining_time": "17:43:00", "throughput": 1806.52, "total_tokens": 55377920} +{"current_steps": 6770, "total_steps": 20825, "loss": 0.9358, "learning_rate": 4.025763944617727e-05, "epoch": 0.3250900360144058, "percentage": 32.51, "elapsed_time": "8:31:39", "remaining_time": "17:42:14", "throughput": 1806.53, "total_tokens": 55459840} +{"current_steps": 6780, "total_steps": 20825, "loss": 0.9055, "learning_rate": 4.0226237412590696e-05, "epoch": 0.3255702280912365, "percentage": 32.56, "elapsed_time": "8:32:24", "remaining_time": "17:41:28", "throughput": 1806.54, "total_tokens": 55541760} +{"current_steps": 6790, "total_steps": 20825, "loss": 0.8201, "learning_rate": 4.019479714358461e-05, "epoch": 0.32605042016806723, "percentage": 32.61, "elapsed_time": "8:33:09", "remaining_time": "17:40:43", "throughput": 1806.56, "total_tokens": 55623680} +{"current_steps": 6800, "total_steps": 20825, "loss": 0.7518, "learning_rate": 4.016331871811033e-05, "epoch": 0.32653061224489793, "percentage": 32.65, "elapsed_time": "8:33:55", "remaining_time": "17:39:58", "throughput": 1806.54, "total_tokens": 55705600} +{"current_steps": 6810, "total_steps": 20825, "loss": 1.0517, "learning_rate": 4.0131802215215025e-05, "epoch": 0.3270108043217287, "percentage": 32.7, "elapsed_time": "8:34:40", "remaining_time": "17:39:12", "throughput": 1806.55, "total_tokens": 55787520} +{"current_steps": 6820, "total_steps": 20825, "loss": 0.9678, "learning_rate": 4.010024771404147e-05, "epoch": 0.32749099639855944, "percentage": 32.75, "elapsed_time": "8:35:25", "remaining_time": "17:38:26", "throughput": 1806.56, "total_tokens": 55869440} +{"current_steps": 6830, "total_steps": 20825, "loss": 0.8882, "learning_rate": 4.006865529382787e-05, "epoch": 0.32797118847539014, "percentage": 32.8, "elapsed_time": "8:36:11", "remaining_time": "17:37:41", "throughput": 1806.55, "total_tokens": 55951360} +{"current_steps": 6840, "total_steps": 20825, "loss": 0.9419, "learning_rate": 4.0037025033907635e-05, "epoch": 0.3284513805522209, "percentage": 32.85, "elapsed_time": "8:36:56", "remaining_time": "17:36:56", "throughput": 1806.56, "total_tokens": 56033280} +{"current_steps": 6850, "total_steps": 20825, "loss": 0.9656, "learning_rate": 4.000535701370921e-05, "epoch": 0.3289315726290516, "percentage": 32.89, "elapsed_time": "8:37:41", "remaining_time": "17:36:10", "throughput": 1806.56, "total_tokens": 56115200} +{"current_steps": 6860, "total_steps": 20825, "loss": 0.9448, "learning_rate": 3.997365131275584e-05, "epoch": 0.32941176470588235, "percentage": 32.94, "elapsed_time": "8:38:27", "remaining_time": "17:35:25", "throughput": 1806.57, "total_tokens": 56197120} +{"current_steps": 6870, "total_steps": 20825, "loss": 1.1117, "learning_rate": 3.994190801066542e-05, "epoch": 0.3298919567827131, "percentage": 32.99, "elapsed_time": "8:39:12", "remaining_time": "17:34:39", "throughput": 1806.58, "total_tokens": 56279040} +{"current_steps": 6880, "total_steps": 20825, "loss": 0.9973, "learning_rate": 3.9910127187150246e-05, "epoch": 0.3303721488595438, "percentage": 33.04, "elapsed_time": "8:39:57", "remaining_time": "17:33:54", "throughput": 1806.58, "total_tokens": 56360960} +{"current_steps": 6890, "total_steps": 20825, "loss": 0.8873, "learning_rate": 3.9878308922016846e-05, "epoch": 0.33085234093637456, "percentage": 33.09, "elapsed_time": "8:40:42", "remaining_time": "17:33:08", "throughput": 1806.58, "total_tokens": 56442880} +{"current_steps": 6900, "total_steps": 20825, "loss": 0.8034, "learning_rate": 3.984645329516578e-05, "epoch": 0.33133253301320525, "percentage": 33.13, "elapsed_time": "8:41:28", "remaining_time": "17:32:22", "throughput": 1806.6, "total_tokens": 56524800} +{"current_steps": 6910, "total_steps": 20825, "loss": 0.9337, "learning_rate": 3.98145603865914e-05, "epoch": 0.331812725090036, "percentage": 33.18, "elapsed_time": "8:42:13", "remaining_time": "17:31:37", "throughput": 1806.61, "total_tokens": 56606720} +{"current_steps": 6920, "total_steps": 20825, "loss": 1.0943, "learning_rate": 3.978263027638171e-05, "epoch": 0.33229291716686676, "percentage": 33.23, "elapsed_time": "8:42:58", "remaining_time": "17:30:51", "throughput": 1806.61, "total_tokens": 56688640} +{"current_steps": 6930, "total_steps": 20825, "loss": 0.9727, "learning_rate": 3.975066304471811e-05, "epoch": 0.33277310924369746, "percentage": 33.28, "elapsed_time": "8:43:43", "remaining_time": "17:30:05", "throughput": 1806.63, "total_tokens": 56770560} +{"current_steps": 6940, "total_steps": 20825, "loss": 0.8136, "learning_rate": 3.971865877187523e-05, "epoch": 0.3332533013205282, "percentage": 33.33, "elapsed_time": "8:44:28", "remaining_time": "17:29:20", "throughput": 1806.64, "total_tokens": 56852480} +{"current_steps": 6950, "total_steps": 20825, "loss": 0.8136, "learning_rate": 3.968661753822071e-05, "epoch": 0.33373349339735897, "percentage": 33.37, "elapsed_time": "8:45:13", "remaining_time": "17:28:34", "throughput": 1806.65, "total_tokens": 56934400} +{"current_steps": 6960, "total_steps": 20825, "loss": 0.9095, "learning_rate": 3.9654539424214996e-05, "epoch": 0.33421368547418967, "percentage": 33.42, "elapsed_time": "8:45:58", "remaining_time": "17:27:48", "throughput": 1806.67, "total_tokens": 57016320} +{"current_steps": 6970, "total_steps": 20825, "loss": 0.8184, "learning_rate": 3.962242451041118e-05, "epoch": 0.3346938775510204, "percentage": 33.47, "elapsed_time": "8:46:44", "remaining_time": "17:27:02", "throughput": 1806.67, "total_tokens": 57098240} +{"current_steps": 6980, "total_steps": 20825, "loss": 0.9821, "learning_rate": 3.9590272877454714e-05, "epoch": 0.3351740696278511, "percentage": 33.52, "elapsed_time": "8:47:29", "remaining_time": "17:26:16", "throughput": 1806.69, "total_tokens": 57180160} +{"current_steps": 6990, "total_steps": 20825, "loss": 1.0956, "learning_rate": 3.955808460608331e-05, "epoch": 0.3356542617046819, "percentage": 33.57, "elapsed_time": "8:48:14", "remaining_time": "17:25:31", "throughput": 1806.69, "total_tokens": 57262080} +{"current_steps": 7000, "total_steps": 20825, "loss": 1.0477, "learning_rate": 3.952585977712664e-05, "epoch": 0.33613445378151263, "percentage": 33.61, "elapsed_time": "8:49:00", "remaining_time": "17:24:46", "throughput": 1806.67, "total_tokens": 57344000} +{"current_steps": 7010, "total_steps": 20825, "loss": 0.9404, "learning_rate": 3.94935984715062e-05, "epoch": 0.33661464585834333, "percentage": 33.66, "elapsed_time": "8:49:48", "remaining_time": "17:24:06", "throughput": 1806.53, "total_tokens": 57425920} +{"current_steps": 7020, "total_steps": 20825, "loss": 0.6775, "learning_rate": 3.9461300770235093e-05, "epoch": 0.3370948379351741, "percentage": 33.71, "elapsed_time": "8:50:33", "remaining_time": "17:23:21", "throughput": 1806.52, "total_tokens": 57507840} +{"current_steps": 7030, "total_steps": 20825, "loss": 0.9909, "learning_rate": 3.942896675441779e-05, "epoch": 0.3375750300120048, "percentage": 33.76, "elapsed_time": "8:51:18", "remaining_time": "17:22:36", "throughput": 1806.52, "total_tokens": 57589760} +{"current_steps": 7040, "total_steps": 20825, "loss": 0.9797, "learning_rate": 3.939659650524997e-05, "epoch": 0.33805522208883554, "percentage": 33.81, "elapsed_time": "8:52:04", "remaining_time": "17:21:50", "throughput": 1806.53, "total_tokens": 57671680} +{"current_steps": 7050, "total_steps": 20825, "loss": 0.8085, "learning_rate": 3.9364190104018307e-05, "epoch": 0.3385354141656663, "percentage": 33.85, "elapsed_time": "8:52:49", "remaining_time": "17:21:04", "throughput": 1806.53, "total_tokens": 57753600} +{"current_steps": 7060, "total_steps": 20825, "loss": 0.9574, "learning_rate": 3.933174763210024e-05, "epoch": 0.339015606242497, "percentage": 33.9, "elapsed_time": "8:53:34", "remaining_time": "17:20:19", "throughput": 1806.54, "total_tokens": 57835520} +{"current_steps": 7070, "total_steps": 20825, "loss": 0.8655, "learning_rate": 3.9299269170963795e-05, "epoch": 0.33949579831932775, "percentage": 33.95, "elapsed_time": "8:54:19", "remaining_time": "17:19:33", "throughput": 1806.54, "total_tokens": 57917440} +{"current_steps": 7080, "total_steps": 20825, "loss": 0.9769, "learning_rate": 3.926675480216738e-05, "epoch": 0.33997599039615845, "percentage": 34.0, "elapsed_time": "8:55:05", "remaining_time": "17:18:48", "throughput": 1806.54, "total_tokens": 57999360} +{"current_steps": 7090, "total_steps": 20825, "loss": 0.9666, "learning_rate": 3.923420460735957e-05, "epoch": 0.3404561824729892, "percentage": 34.05, "elapsed_time": "8:55:50", "remaining_time": "17:18:02", "throughput": 1806.55, "total_tokens": 58081280} +{"current_steps": 7100, "total_steps": 20825, "loss": 0.7937, "learning_rate": 3.920161866827889e-05, "epoch": 0.34093637454981995, "percentage": 34.09, "elapsed_time": "8:56:35", "remaining_time": "17:17:16", "throughput": 1806.57, "total_tokens": 58163200} +{"current_steps": 7110, "total_steps": 20825, "loss": 1.1521, "learning_rate": 3.916899706675365e-05, "epoch": 0.34141656662665065, "percentage": 34.14, "elapsed_time": "8:57:20", "remaining_time": "17:16:31", "throughput": 1806.57, "total_tokens": 58245120} +{"current_steps": 7120, "total_steps": 20825, "loss": 1.0604, "learning_rate": 3.913633988470169e-05, "epoch": 0.3418967587034814, "percentage": 34.19, "elapsed_time": "8:58:05", "remaining_time": "17:15:45", "throughput": 1806.58, "total_tokens": 58327040} +{"current_steps": 7130, "total_steps": 20825, "loss": 1.0293, "learning_rate": 3.91036472041302e-05, "epoch": 0.3423769507803121, "percentage": 34.24, "elapsed_time": "8:58:51", "remaining_time": "17:15:01", "throughput": 1806.55, "total_tokens": 58408960} +{"current_steps": 7140, "total_steps": 20825, "loss": 0.9386, "learning_rate": 3.907091910713553e-05, "epoch": 0.34285714285714286, "percentage": 34.29, "elapsed_time": "8:59:36", "remaining_time": "17:14:15", "throughput": 1806.56, "total_tokens": 58490880} +{"current_steps": 7150, "total_steps": 20825, "loss": 0.9874, "learning_rate": 3.9038155675902956e-05, "epoch": 0.3433373349339736, "percentage": 34.33, "elapsed_time": "9:00:22", "remaining_time": "17:13:30", "throughput": 1806.55, "total_tokens": 58572800} +{"current_steps": 7160, "total_steps": 20825, "loss": 0.9545, "learning_rate": 3.900535699270647e-05, "epoch": 0.3438175270108043, "percentage": 34.38, "elapsed_time": "9:01:07", "remaining_time": "17:12:45", "throughput": 1806.56, "total_tokens": 58654720} +{"current_steps": 7170, "total_steps": 20825, "loss": 0.9244, "learning_rate": 3.8972523139908616e-05, "epoch": 0.34429771908763507, "percentage": 34.43, "elapsed_time": "9:01:52", "remaining_time": "17:11:59", "throughput": 1806.57, "total_tokens": 58736640} +{"current_steps": 7180, "total_steps": 20825, "loss": 0.9025, "learning_rate": 3.8939654199960244e-05, "epoch": 0.34477791116446577, "percentage": 34.48, "elapsed_time": "9:02:37", "remaining_time": "17:11:13", "throughput": 1806.58, "total_tokens": 58818560} +{"current_steps": 7190, "total_steps": 20825, "loss": 0.8459, "learning_rate": 3.890675025540028e-05, "epoch": 0.3452581032412965, "percentage": 34.53, "elapsed_time": "9:03:23", "remaining_time": "17:10:27", "throughput": 1806.59, "total_tokens": 58900480} +{"current_steps": 7200, "total_steps": 20825, "loss": 0.9075, "learning_rate": 3.8873811388855605e-05, "epoch": 0.3457382953181273, "percentage": 34.57, "elapsed_time": "9:04:08", "remaining_time": "17:09:42", "throughput": 1806.59, "total_tokens": 58982400} +{"current_steps": 7210, "total_steps": 20825, "loss": 1.0231, "learning_rate": 3.8840837683040766e-05, "epoch": 0.346218487394958, "percentage": 34.62, "elapsed_time": "9:04:53", "remaining_time": "17:08:56", "throughput": 1806.6, "total_tokens": 59064320} +{"current_steps": 7220, "total_steps": 20825, "loss": 0.8264, "learning_rate": 3.880782922075778e-05, "epoch": 0.34669867947178873, "percentage": 34.67, "elapsed_time": "9:05:38", "remaining_time": "17:08:11", "throughput": 1806.61, "total_tokens": 59146240} +{"current_steps": 7230, "total_steps": 20825, "loss": 0.9188, "learning_rate": 3.8774786084896e-05, "epoch": 0.3471788715486194, "percentage": 34.72, "elapsed_time": "9:06:23", "remaining_time": "17:07:25", "throughput": 1806.62, "total_tokens": 59228160} +{"current_steps": 7240, "total_steps": 20825, "loss": 0.841, "learning_rate": 3.8741708358431774e-05, "epoch": 0.3476590636254502, "percentage": 34.77, "elapsed_time": "9:07:09", "remaining_time": "17:06:40", "throughput": 1806.63, "total_tokens": 59310080} +{"current_steps": 7250, "total_steps": 20825, "loss": 1.1382, "learning_rate": 3.870859612442837e-05, "epoch": 0.34813925570228094, "percentage": 34.81, "elapsed_time": "9:07:54", "remaining_time": "17:05:54", "throughput": 1806.63, "total_tokens": 59392000} +{"current_steps": 7260, "total_steps": 20825, "loss": 0.8716, "learning_rate": 3.86754494660357e-05, "epoch": 0.34861944777911164, "percentage": 34.86, "elapsed_time": "9:08:40", "remaining_time": "17:05:09", "throughput": 1806.62, "total_tokens": 59473920} +{"current_steps": 7270, "total_steps": 20825, "loss": 0.8413, "learning_rate": 3.864226846649008e-05, "epoch": 0.3490996398559424, "percentage": 34.91, "elapsed_time": "9:09:25", "remaining_time": "17:04:24", "throughput": 1806.62, "total_tokens": 59555840} +{"current_steps": 7280, "total_steps": 20825, "loss": 0.9106, "learning_rate": 3.860905320911413e-05, "epoch": 0.3495798319327731, "percentage": 34.96, "elapsed_time": "9:10:10", "remaining_time": "17:03:38", "throughput": 1806.63, "total_tokens": 59637760} +{"current_steps": 7290, "total_steps": 20825, "loss": 0.7808, "learning_rate": 3.857580377731644e-05, "epoch": 0.35006002400960384, "percentage": 35.01, "elapsed_time": "9:10:55", "remaining_time": "17:02:52", "throughput": 1806.64, "total_tokens": 59719680} +{"current_steps": 7300, "total_steps": 20825, "loss": 0.8681, "learning_rate": 3.854252025459144e-05, "epoch": 0.3505402160864346, "percentage": 35.05, "elapsed_time": "9:11:40", "remaining_time": "17:02:06", "throughput": 1806.66, "total_tokens": 59801600} +{"current_steps": 7310, "total_steps": 20825, "loss": 0.9087, "learning_rate": 3.8509202724519165e-05, "epoch": 0.3510204081632653, "percentage": 35.1, "elapsed_time": "9:12:25", "remaining_time": "17:01:21", "throughput": 1806.67, "total_tokens": 59883520} +{"current_steps": 7320, "total_steps": 20825, "loss": 0.8279, "learning_rate": 3.8475851270765054e-05, "epoch": 0.35150060024009605, "percentage": 35.15, "elapsed_time": "9:13:11", "remaining_time": "17:00:35", "throughput": 1806.68, "total_tokens": 59965440} +{"current_steps": 7330, "total_steps": 20825, "loss": 0.9013, "learning_rate": 3.844246597707972e-05, "epoch": 0.35198079231692675, "percentage": 35.2, "elapsed_time": "9:13:56", "remaining_time": "16:59:50", "throughput": 1806.66, "total_tokens": 60047360} +{"current_steps": 7340, "total_steps": 20825, "loss": 0.879, "learning_rate": 3.8409046927298755e-05, "epoch": 0.3524609843937575, "percentage": 35.25, "elapsed_time": "9:14:41", "remaining_time": "16:59:05", "throughput": 1806.67, "total_tokens": 60129280} +{"current_steps": 7350, "total_steps": 20825, "loss": 1.1444, "learning_rate": 3.8375594205342534e-05, "epoch": 0.35294117647058826, "percentage": 35.29, "elapsed_time": "9:15:26", "remaining_time": "16:58:19", "throughput": 1806.68, "total_tokens": 60211200} +{"current_steps": 7360, "total_steps": 20825, "loss": 1.0091, "learning_rate": 3.834210789521598e-05, "epoch": 0.35342136854741896, "percentage": 35.34, "elapsed_time": "9:16:12", "remaining_time": "16:57:34", "throughput": 1806.68, "total_tokens": 60293120} +{"current_steps": 7370, "total_steps": 20825, "loss": 1.0194, "learning_rate": 3.830858808100834e-05, "epoch": 0.3539015606242497, "percentage": 35.39, "elapsed_time": "9:16:57", "remaining_time": "16:56:48", "throughput": 1806.7, "total_tokens": 60375040} +{"current_steps": 7380, "total_steps": 20825, "loss": 0.8125, "learning_rate": 3.8275034846893046e-05, "epoch": 0.3543817527010804, "percentage": 35.44, "elapsed_time": "9:17:42", "remaining_time": "16:56:02", "throughput": 1806.72, "total_tokens": 60456960} +{"current_steps": 7390, "total_steps": 20825, "loss": 1.3012, "learning_rate": 3.824144827712738e-05, "epoch": 0.35486194477791116, "percentage": 35.49, "elapsed_time": "9:18:28", "remaining_time": "16:55:17", "throughput": 1806.69, "total_tokens": 60538880} +{"current_steps": 7400, "total_steps": 20825, "loss": 1.0136, "learning_rate": 3.82078284560524e-05, "epoch": 0.3553421368547419, "percentage": 35.53, "elapsed_time": "9:19:13", "remaining_time": "16:54:32", "throughput": 1806.7, "total_tokens": 60620800} +{"current_steps": 7410, "total_steps": 20825, "loss": 0.9035, "learning_rate": 3.817417546809263e-05, "epoch": 0.3558223289315726, "percentage": 35.58, "elapsed_time": "9:19:58", "remaining_time": "16:53:46", "throughput": 1806.71, "total_tokens": 60702720} +{"current_steps": 7420, "total_steps": 20825, "loss": 1.0054, "learning_rate": 3.8140489397755886e-05, "epoch": 0.3563025210084034, "percentage": 35.63, "elapsed_time": "9:20:43", "remaining_time": "16:53:00", "throughput": 1806.72, "total_tokens": 60784640} +{"current_steps": 7430, "total_steps": 20825, "loss": 0.9705, "learning_rate": 3.810677032963307e-05, "epoch": 0.35678271308523407, "percentage": 35.68, "elapsed_time": "9:21:29", "remaining_time": "16:52:15", "throughput": 1806.71, "total_tokens": 60866560} +{"current_steps": 7440, "total_steps": 20825, "loss": 0.8928, "learning_rate": 3.807301834839793e-05, "epoch": 0.3572629051620648, "percentage": 35.73, "elapsed_time": "9:22:14", "remaining_time": "16:51:29", "throughput": 1806.73, "total_tokens": 60948480} +{"current_steps": 7450, "total_steps": 20825, "loss": 0.7673, "learning_rate": 3.803923353880687e-05, "epoch": 0.3577430972388956, "percentage": 35.77, "elapsed_time": "9:22:59", "remaining_time": "16:50:44", "throughput": 1806.74, "total_tokens": 61030400} +{"current_steps": 7460, "total_steps": 20825, "loss": 0.9807, "learning_rate": 3.8005415985698754e-05, "epoch": 0.3582232893157263, "percentage": 35.82, "elapsed_time": "9:23:44", "remaining_time": "16:49:58", "throughput": 1806.75, "total_tokens": 61112320} +{"current_steps": 7470, "total_steps": 20825, "loss": 0.9943, "learning_rate": 3.797156577399462e-05, "epoch": 0.35870348139255703, "percentage": 35.87, "elapsed_time": "9:24:29", "remaining_time": "16:49:12", "throughput": 1806.75, "total_tokens": 61194240} +{"current_steps": 7480, "total_steps": 20825, "loss": 0.8648, "learning_rate": 3.7937682988697566e-05, "epoch": 0.35918367346938773, "percentage": 35.92, "elapsed_time": "9:25:15", "remaining_time": "16:48:27", "throughput": 1806.75, "total_tokens": 61276160} +{"current_steps": 7490, "total_steps": 20825, "loss": 1.0123, "learning_rate": 3.790376771489247e-05, "epoch": 0.3596638655462185, "percentage": 35.97, "elapsed_time": "9:26:00", "remaining_time": "16:47:41", "throughput": 1806.76, "total_tokens": 61358080} +{"current_steps": 7500, "total_steps": 20825, "loss": 0.8446, "learning_rate": 3.7869820037745776e-05, "epoch": 0.36014405762304924, "percentage": 36.01, "elapsed_time": "9:26:45", "remaining_time": "16:46:56", "throughput": 1806.76, "total_tokens": 61440000} +{"current_steps": 7510, "total_steps": 20825, "loss": 0.7602, "learning_rate": 3.783584004250531e-05, "epoch": 0.36062424969987994, "percentage": 36.06, "elapsed_time": "9:27:30", "remaining_time": "16:46:11", "throughput": 1806.76, "total_tokens": 61521920} +{"current_steps": 7520, "total_steps": 20825, "loss": 0.8187, "learning_rate": 3.7801827814500074e-05, "epoch": 0.3611044417767107, "percentage": 36.11, "elapsed_time": "9:28:16", "remaining_time": "16:45:25", "throughput": 1806.77, "total_tokens": 61603840} +{"current_steps": 7530, "total_steps": 20825, "loss": 0.8516, "learning_rate": 3.7767783439139984e-05, "epoch": 0.3615846338535414, "percentage": 36.16, "elapsed_time": "9:29:01", "remaining_time": "16:44:40", "throughput": 1806.77, "total_tokens": 61685760} +{"current_steps": 7540, "total_steps": 20825, "loss": 0.8289, "learning_rate": 3.77337070019157e-05, "epoch": 0.36206482593037215, "percentage": 36.21, "elapsed_time": "9:29:46", "remaining_time": "16:43:54", "throughput": 1806.78, "total_tokens": 61767680} +{"current_steps": 7550, "total_steps": 20825, "loss": 0.9404, "learning_rate": 3.7699598588398364e-05, "epoch": 0.3625450180072029, "percentage": 36.25, "elapsed_time": "9:30:31", "remaining_time": "16:43:08", "throughput": 1806.79, "total_tokens": 61849600} +{"current_steps": 7560, "total_steps": 20825, "loss": 0.9699, "learning_rate": 3.766545828423946e-05, "epoch": 0.3630252100840336, "percentage": 36.3, "elapsed_time": "9:31:16", "remaining_time": "16:42:23", "throughput": 1806.81, "total_tokens": 61931520} +{"current_steps": 7570, "total_steps": 20825, "loss": 0.8596, "learning_rate": 3.7631286175170535e-05, "epoch": 0.36350540216086435, "percentage": 36.35, "elapsed_time": "9:32:02", "remaining_time": "16:41:37", "throughput": 1806.81, "total_tokens": 62013440} +{"current_steps": 7580, "total_steps": 20825, "loss": 1.0988, "learning_rate": 3.7597082347003e-05, "epoch": 0.36398559423769505, "percentage": 36.4, "elapsed_time": "9:32:47", "remaining_time": "16:40:52", "throughput": 1806.81, "total_tokens": 62095360} +{"current_steps": 7590, "total_steps": 20825, "loss": 0.8688, "learning_rate": 3.75628468856279e-05, "epoch": 0.3644657863145258, "percentage": 36.45, "elapsed_time": "9:33:32", "remaining_time": "16:40:07", "throughput": 1806.81, "total_tokens": 62177280} +{"current_steps": 7600, "total_steps": 20825, "loss": 0.8713, "learning_rate": 3.7528579877015746e-05, "epoch": 0.36494597839135656, "percentage": 36.49, "elapsed_time": "9:34:18", "remaining_time": "16:39:22", "throughput": 1806.78, "total_tokens": 62259200} +{"current_steps": 7610, "total_steps": 20825, "loss": 1.0696, "learning_rate": 3.749428140721626e-05, "epoch": 0.36542617046818726, "percentage": 36.54, "elapsed_time": "9:35:03", "remaining_time": "16:38:36", "throughput": 1806.79, "total_tokens": 62341120} +{"current_steps": 7620, "total_steps": 20825, "loss": 0.8351, "learning_rate": 3.745995156235815e-05, "epoch": 0.365906362545018, "percentage": 36.59, "elapsed_time": "9:35:48", "remaining_time": "16:37:51", "throughput": 1806.8, "total_tokens": 62423040} +{"current_steps": 7630, "total_steps": 20825, "loss": 0.9453, "learning_rate": 3.742559042864895e-05, "epoch": 0.3663865546218487, "percentage": 36.64, "elapsed_time": "9:36:34", "remaining_time": "16:37:06", "throughput": 1806.79, "total_tokens": 62504960} +{"current_steps": 7640, "total_steps": 20825, "loss": 1.0241, "learning_rate": 3.7391198092374726e-05, "epoch": 0.36686674669867947, "percentage": 36.69, "elapsed_time": "9:37:19", "remaining_time": "16:36:20", "throughput": 1806.8, "total_tokens": 62586880} +{"current_steps": 7650, "total_steps": 20825, "loss": 0.8502, "learning_rate": 3.7356774639899914e-05, "epoch": 0.3673469387755102, "percentage": 36.73, "elapsed_time": "9:38:04", "remaining_time": "16:35:34", "throughput": 1806.81, "total_tokens": 62668800} +{"current_steps": 7660, "total_steps": 20825, "loss": 0.8658, "learning_rate": 3.7322320157667094e-05, "epoch": 0.3678271308523409, "percentage": 36.78, "elapsed_time": "9:38:50", "remaining_time": "16:34:49", "throughput": 1806.81, "total_tokens": 62750720} +{"current_steps": 7670, "total_steps": 20825, "loss": 0.7977, "learning_rate": 3.728783473219676e-05, "epoch": 0.3683073229291717, "percentage": 36.83, "elapsed_time": "9:39:34", "remaining_time": "16:34:03", "throughput": 1806.83, "total_tokens": 62832640} +{"current_steps": 7680, "total_steps": 20825, "loss": 0.7638, "learning_rate": 3.72533184500871e-05, "epoch": 0.3687875150060024, "percentage": 36.88, "elapsed_time": "9:40:20", "remaining_time": "16:33:17", "throughput": 1806.84, "total_tokens": 62914560} +{"current_steps": 7690, "total_steps": 20825, "loss": 0.9013, "learning_rate": 3.7218771398013807e-05, "epoch": 0.36926770708283313, "percentage": 36.93, "elapsed_time": "9:41:05", "remaining_time": "16:32:32", "throughput": 1806.83, "total_tokens": 62996480} +{"current_steps": 7700, "total_steps": 20825, "loss": 0.8292, "learning_rate": 3.718419366272982e-05, "epoch": 0.3697478991596639, "percentage": 36.97, "elapsed_time": "9:41:50", "remaining_time": "16:31:46", "throughput": 1806.85, "total_tokens": 63078400} +{"current_steps": 7710, "total_steps": 20825, "loss": 0.7722, "learning_rate": 3.714958533106515e-05, "epoch": 0.3702280912364946, "percentage": 37.02, "elapsed_time": "9:42:36", "remaining_time": "16:31:01", "throughput": 1806.85, "total_tokens": 63160320} +{"current_steps": 7720, "total_steps": 20825, "loss": 0.9032, "learning_rate": 3.7114946489926633e-05, "epoch": 0.37070828331332534, "percentage": 37.07, "elapsed_time": "9:43:21", "remaining_time": "16:30:16", "throughput": 1806.85, "total_tokens": 63242240} +{"current_steps": 7730, "total_steps": 20825, "loss": 1.0929, "learning_rate": 3.708027722629772e-05, "epoch": 0.37118847539015604, "percentage": 37.12, "elapsed_time": "9:44:06", "remaining_time": "16:29:30", "throughput": 1806.86, "total_tokens": 63324160} +{"current_steps": 7740, "total_steps": 20825, "loss": 0.8444, "learning_rate": 3.704557762723823e-05, "epoch": 0.3716686674669868, "percentage": 37.17, "elapsed_time": "9:44:51", "remaining_time": "16:28:44", "throughput": 1806.87, "total_tokens": 63406080} +{"current_steps": 7750, "total_steps": 20825, "loss": 0.8989, "learning_rate": 3.7010847779884204e-05, "epoch": 0.37214885954381755, "percentage": 37.21, "elapsed_time": "9:45:36", "remaining_time": "16:27:59", "throughput": 1806.88, "total_tokens": 63488000} +{"current_steps": 7760, "total_steps": 20825, "loss": 0.9214, "learning_rate": 3.697608777144762e-05, "epoch": 0.37262905162064824, "percentage": 37.26, "elapsed_time": "9:46:21", "remaining_time": "16:27:13", "throughput": 1806.89, "total_tokens": 63569920} +{"current_steps": 7770, "total_steps": 20825, "loss": 0.9651, "learning_rate": 3.694129768921619e-05, "epoch": 0.373109243697479, "percentage": 37.31, "elapsed_time": "9:47:07", "remaining_time": "16:26:28", "throughput": 1806.89, "total_tokens": 63651840} +{"current_steps": 7780, "total_steps": 20825, "loss": 0.946, "learning_rate": 3.6906477620553156e-05, "epoch": 0.3735894357743097, "percentage": 37.36, "elapsed_time": "9:47:52", "remaining_time": "16:25:42", "throughput": 1806.9, "total_tokens": 63733760} +{"current_steps": 7790, "total_steps": 20825, "loss": 0.9149, "learning_rate": 3.687162765289704e-05, "epoch": 0.37406962785114045, "percentage": 37.41, "elapsed_time": "9:48:37", "remaining_time": "16:24:56", "throughput": 1806.91, "total_tokens": 63815680} +{"current_steps": 7800, "total_steps": 20825, "loss": 0.8513, "learning_rate": 3.683674787376148e-05, "epoch": 0.3745498199279712, "percentage": 37.45, "elapsed_time": "9:49:22", "remaining_time": "16:24:10", "throughput": 1806.93, "total_tokens": 63897600} +{"current_steps": 7810, "total_steps": 20825, "loss": 0.7109, "learning_rate": 3.6801838370734945e-05, "epoch": 0.3750300120048019, "percentage": 37.5, "elapsed_time": "9:50:08", "remaining_time": "16:23:25", "throughput": 1806.92, "total_tokens": 63979520} +{"current_steps": 7820, "total_steps": 20825, "loss": 0.8537, "learning_rate": 3.676689923148056e-05, "epoch": 0.37551020408163266, "percentage": 37.55, "elapsed_time": "9:50:53", "remaining_time": "16:22:40", "throughput": 1806.92, "total_tokens": 64061440} +{"current_steps": 7830, "total_steps": 20825, "loss": 0.9253, "learning_rate": 3.673193054373587e-05, "epoch": 0.37599039615846336, "percentage": 37.6, "elapsed_time": "9:51:38", "remaining_time": "16:21:55", "throughput": 1806.92, "total_tokens": 64143360} +{"current_steps": 7840, "total_steps": 20825, "loss": 0.9448, "learning_rate": 3.6696932395312606e-05, "epoch": 0.3764705882352941, "percentage": 37.65, "elapsed_time": "9:52:24", "remaining_time": "16:21:10", "throughput": 1806.91, "total_tokens": 64225280} +{"current_steps": 7850, "total_steps": 20825, "loss": 0.8673, "learning_rate": 3.6661904874096503e-05, "epoch": 0.37695078031212487, "percentage": 37.7, "elapsed_time": "9:53:09", "remaining_time": "16:20:24", "throughput": 1806.93, "total_tokens": 64307200} +{"current_steps": 7860, "total_steps": 20825, "loss": 0.8175, "learning_rate": 3.662684806804704e-05, "epoch": 0.37743097238895557, "percentage": 37.74, "elapsed_time": "9:53:54", "remaining_time": "16:19:38", "throughput": 1806.94, "total_tokens": 64389120} +{"current_steps": 7870, "total_steps": 20825, "loss": 0.9513, "learning_rate": 3.659176206519724e-05, "epoch": 0.3779111644657863, "percentage": 37.79, "elapsed_time": "9:54:39", "remaining_time": "16:18:53", "throughput": 1806.95, "total_tokens": 64471040} +{"current_steps": 7880, "total_steps": 20825, "loss": 0.8763, "learning_rate": 3.655664695365344e-05, "epoch": 0.3783913565426171, "percentage": 37.84, "elapsed_time": "9:55:24", "remaining_time": "16:18:07", "throughput": 1806.94, "total_tokens": 64552960} +{"current_steps": 7890, "total_steps": 20825, "loss": 0.8944, "learning_rate": 3.652150282159507e-05, "epoch": 0.3788715486194478, "percentage": 37.89, "elapsed_time": "9:56:18", "remaining_time": "16:17:35", "throughput": 1806.53, "total_tokens": 64634880} +{"current_steps": 7900, "total_steps": 20825, "loss": 0.8366, "learning_rate": 3.6486329757274454e-05, "epoch": 0.3793517406962785, "percentage": 37.94, "elapsed_time": "9:57:18", "remaining_time": "16:17:13", "throughput": 1805.81, "total_tokens": 64716800} +{"current_steps": 7910, "total_steps": 20825, "loss": 0.9178, "learning_rate": 3.645112784901655e-05, "epoch": 0.3798319327731092, "percentage": 37.98, "elapsed_time": "9:58:17", "remaining_time": "16:16:51", "throughput": 1805.12, "total_tokens": 64798720} +{"current_steps": 7920, "total_steps": 20825, "loss": 0.8597, "learning_rate": 3.641589718521875e-05, "epoch": 0.38031212484994, "percentage": 38.03, "elapsed_time": "9:59:13", "remaining_time": "16:16:22", "throughput": 1804.59, "total_tokens": 64880640} +{"current_steps": 7930, "total_steps": 20825, "loss": 0.9038, "learning_rate": 3.6380637854350665e-05, "epoch": 0.38079231692677074, "percentage": 38.08, "elapsed_time": "10:00:09", "remaining_time": "16:15:54", "throughput": 1804.05, "total_tokens": 64962560} +{"current_steps": 7940, "total_steps": 20825, "loss": 0.8226, "learning_rate": 3.634534994495387e-05, "epoch": 0.38127250900360143, "percentage": 38.13, "elapsed_time": "10:01:05", "remaining_time": "16:15:26", "throughput": 1803.52, "total_tokens": 65044480} +{"current_steps": 7950, "total_steps": 20825, "loss": 0.8539, "learning_rate": 3.631003354564175e-05, "epoch": 0.3817527010804322, "percentage": 38.18, "elapsed_time": "10:02:00", "remaining_time": "16:14:57", "throughput": 1803.02, "total_tokens": 65126400} +{"current_steps": 7960, "total_steps": 20825, "loss": 1.0, "learning_rate": 3.6274688745099194e-05, "epoch": 0.3822328931572629, "percentage": 38.22, "elapsed_time": "10:02:56", "remaining_time": "16:14:29", "throughput": 1802.49, "total_tokens": 65208320} +{"current_steps": 7970, "total_steps": 20825, "loss": 0.9514, "learning_rate": 3.623931563208241e-05, "epoch": 0.38271308523409364, "percentage": 38.27, "elapsed_time": "10:03:52", "remaining_time": "16:14:00", "throughput": 1801.98, "total_tokens": 65290240} +{"current_steps": 7980, "total_steps": 20825, "loss": 0.8269, "learning_rate": 3.620391429541873e-05, "epoch": 0.3831932773109244, "percentage": 38.32, "elapsed_time": "10:04:47", "remaining_time": "16:13:30", "throughput": 1801.51, "total_tokens": 65372160} +{"current_steps": 7990, "total_steps": 20825, "loss": 0.9784, "learning_rate": 3.616848482400634e-05, "epoch": 0.3836734693877551, "percentage": 38.37, "elapsed_time": "10:05:42", "remaining_time": "16:13:00", "throughput": 1801.02, "total_tokens": 65454080} +{"current_steps": 8000, "total_steps": 20825, "loss": 0.994, "learning_rate": 3.6133027306814085e-05, "epoch": 0.38415366146458585, "percentage": 38.42, "elapsed_time": "10:06:38", "remaining_time": "16:12:30", "throughput": 1800.53, "total_tokens": 65536000} +{"current_steps": 8010, "total_steps": 20825, "loss": 1.046, "learning_rate": 3.609754183288122e-05, "epoch": 0.38463385354141655, "percentage": 38.46, "elapsed_time": "10:07:37", "remaining_time": "16:12:06", "throughput": 1799.86, "total_tokens": 65617920} +{"current_steps": 8020, "total_steps": 20825, "loss": 0.9983, "learning_rate": 3.606202849131723e-05, "epoch": 0.3851140456182473, "percentage": 38.51, "elapsed_time": "10:08:32", "remaining_time": "16:11:37", "throughput": 1799.38, "total_tokens": 65699840} +{"current_steps": 8030, "total_steps": 20825, "loss": 0.9211, "learning_rate": 3.6026487371301564e-05, "epoch": 0.38559423769507806, "percentage": 38.56, "elapsed_time": "10:09:27", "remaining_time": "16:11:07", "throughput": 1798.89, "total_tokens": 65781760} +{"current_steps": 8040, "total_steps": 20825, "loss": 0.8849, "learning_rate": 3.599091856208343e-05, "epoch": 0.38607442977190876, "percentage": 38.61, "elapsed_time": "10:10:23", "remaining_time": "16:10:37", "throughput": 1798.4, "total_tokens": 65863680} +{"current_steps": 8050, "total_steps": 20825, "loss": 0.9194, "learning_rate": 3.5955322152981575e-05, "epoch": 0.3865546218487395, "percentage": 38.66, "elapsed_time": "10:11:19", "remaining_time": "16:10:08", "throughput": 1797.91, "total_tokens": 65945600} +{"current_steps": 8060, "total_steps": 20825, "loss": 1.0414, "learning_rate": 3.5919698233384034e-05, "epoch": 0.3870348139255702, "percentage": 38.7, "elapsed_time": "10:12:15", "remaining_time": "16:09:39", "throughput": 1797.4, "total_tokens": 66027520} +{"current_steps": 8070, "total_steps": 20825, "loss": 0.8462, "learning_rate": 3.588404689274795e-05, "epoch": 0.38751500600240096, "percentage": 38.75, "elapsed_time": "10:13:13", "remaining_time": "16:09:13", "throughput": 1796.77, "total_tokens": 66109440} +{"current_steps": 8080, "total_steps": 20825, "loss": 0.7765, "learning_rate": 3.58483682205993e-05, "epoch": 0.3879951980792317, "percentage": 38.8, "elapsed_time": "10:14:08", "remaining_time": "16:08:42", "throughput": 1796.33, "total_tokens": 66191360} +{"current_steps": 8090, "total_steps": 20825, "loss": 0.8597, "learning_rate": 3.581266230653271e-05, "epoch": 0.3884753901560624, "percentage": 38.85, "elapsed_time": "10:15:01", "remaining_time": "16:08:08", "throughput": 1795.96, "total_tokens": 66273280} +{"current_steps": 8100, "total_steps": 20825, "loss": 0.8295, "learning_rate": 3.5776929240211224e-05, "epoch": 0.38895558223289317, "percentage": 38.9, "elapsed_time": "10:15:54", "remaining_time": "16:07:34", "throughput": 1795.6, "total_tokens": 66355200} +{"current_steps": 8110, "total_steps": 20825, "loss": 1.0028, "learning_rate": 3.5741169111366047e-05, "epoch": 0.38943577430972387, "percentage": 38.94, "elapsed_time": "10:16:47", "remaining_time": "16:07:01", "throughput": 1795.23, "total_tokens": 66437120} +{"current_steps": 8120, "total_steps": 20825, "loss": 1.0164, "learning_rate": 3.570538200979635e-05, "epoch": 0.3899159663865546, "percentage": 38.99, "elapsed_time": "10:17:41", "remaining_time": "16:06:28", "throughput": 1794.83, "total_tokens": 66519040} +{"current_steps": 8130, "total_steps": 20825, "loss": 0.9047, "learning_rate": 3.566956802536904e-05, "epoch": 0.3903961584633854, "percentage": 39.04, "elapsed_time": "10:18:34", "remaining_time": "16:05:54", "throughput": 1794.45, "total_tokens": 66600960} +{"current_steps": 8140, "total_steps": 20825, "loss": 0.9341, "learning_rate": 3.5633727248018536e-05, "epoch": 0.3908763505402161, "percentage": 39.09, "elapsed_time": "10:19:28", "remaining_time": "16:05:21", "throughput": 1794.09, "total_tokens": 66682880} +{"current_steps": 8150, "total_steps": 20825, "loss": 0.8941, "learning_rate": 3.5597859767746524e-05, "epoch": 0.39135654261704683, "percentage": 39.14, "elapsed_time": "10:20:22", "remaining_time": "16:04:48", "throughput": 1793.69, "total_tokens": 66764800} +{"current_steps": 8160, "total_steps": 20825, "loss": 0.8836, "learning_rate": 3.556196567462175e-05, "epoch": 0.39183673469387753, "percentage": 39.18, "elapsed_time": "10:21:15", "remaining_time": "16:04:15", "throughput": 1793.3, "total_tokens": 66846720} +{"current_steps": 8170, "total_steps": 20825, "loss": 0.9574, "learning_rate": 3.5526045058779805e-05, "epoch": 0.3923169267707083, "percentage": 39.23, "elapsed_time": "10:22:10", "remaining_time": "16:03:42", "throughput": 1792.88, "total_tokens": 66928640} +{"current_steps": 8180, "total_steps": 20825, "loss": 0.8612, "learning_rate": 3.549009801042286e-05, "epoch": 0.39279711884753904, "percentage": 39.28, "elapsed_time": "10:23:05", "remaining_time": "16:03:11", "throughput": 1792.44, "total_tokens": 67010560} +{"current_steps": 8190, "total_steps": 20825, "loss": 0.9242, "learning_rate": 3.545412461981947e-05, "epoch": 0.39327731092436974, "percentage": 39.33, "elapsed_time": "10:23:54", "remaining_time": "16:02:31", "throughput": 1792.28, "total_tokens": 67092480} +{"current_steps": 8200, "total_steps": 20825, "loss": 0.9924, "learning_rate": 3.541812497730435e-05, "epoch": 0.3937575030012005, "percentage": 39.38, "elapsed_time": "10:24:43", "remaining_time": "16:01:50", "throughput": 1792.12, "total_tokens": 67174400} +{"current_steps": 8210, "total_steps": 20825, "loss": 0.9064, "learning_rate": 3.5382099173278125e-05, "epoch": 0.3942376950780312, "percentage": 39.42, "elapsed_time": "10:25:32", "remaining_time": "16:01:10", "throughput": 1791.95, "total_tokens": 67256320} +{"current_steps": 8220, "total_steps": 20825, "loss": 0.8907, "learning_rate": 3.5346047298207116e-05, "epoch": 0.39471788715486195, "percentage": 39.47, "elapsed_time": "10:26:21", "remaining_time": "16:00:29", "throughput": 1791.78, "total_tokens": 67338240} +{"current_steps": 8230, "total_steps": 20825, "loss": 0.7992, "learning_rate": 3.530996944262312e-05, "epoch": 0.3951980792316927, "percentage": 39.52, "elapsed_time": "10:27:11", "remaining_time": "15:59:49", "throughput": 1791.6, "total_tokens": 67420160} +{"current_steps": 8240, "total_steps": 20825, "loss": 0.8946, "learning_rate": 3.5273865697123164e-05, "epoch": 0.3956782713085234, "percentage": 39.57, "elapsed_time": "10:28:00", "remaining_time": "15:59:09", "throughput": 1791.43, "total_tokens": 67502080} +{"current_steps": 8250, "total_steps": 20825, "loss": 1.0861, "learning_rate": 3.52377361523693e-05, "epoch": 0.39615846338535415, "percentage": 39.62, "elapsed_time": "10:28:52", "remaining_time": "15:58:32", "throughput": 1791.16, "total_tokens": 67584000} +{"current_steps": 8260, "total_steps": 20825, "loss": 1.0155, "learning_rate": 3.520158089908836e-05, "epoch": 0.39663865546218485, "percentage": 39.66, "elapsed_time": "10:29:43", "remaining_time": "15:57:55", "throughput": 1790.88, "total_tokens": 67665920} +{"current_steps": 8270, "total_steps": 20825, "loss": 0.7652, "learning_rate": 3.516540002807174e-05, "epoch": 0.3971188475390156, "percentage": 39.71, "elapsed_time": "10:30:33", "remaining_time": "15:57:16", "throughput": 1790.68, "total_tokens": 67747840} +{"current_steps": 8280, "total_steps": 20825, "loss": 0.8809, "learning_rate": 3.512919363017516e-05, "epoch": 0.39759903961584636, "percentage": 39.76, "elapsed_time": "10:31:24", "remaining_time": "15:56:38", "throughput": 1790.44, "total_tokens": 67829760} +{"current_steps": 8290, "total_steps": 20825, "loss": 0.8293, "learning_rate": 3.509296179631843e-05, "epoch": 0.39807923169267706, "percentage": 39.81, "elapsed_time": "10:32:15", "remaining_time": "15:56:01", "throughput": 1790.17, "total_tokens": 67911680} +{"current_steps": 8300, "total_steps": 20825, "loss": 0.8956, "learning_rate": 3.505670461748527e-05, "epoch": 0.3985594237695078, "percentage": 39.86, "elapsed_time": "10:33:06", "remaining_time": "15:55:23", "throughput": 1789.93, "total_tokens": 67993600} +{"current_steps": 8310, "total_steps": 20825, "loss": 1.1892, "learning_rate": 3.5020422184723e-05, "epoch": 0.3990396158463385, "percentage": 39.9, "elapsed_time": "10:33:56", "remaining_time": "15:54:43", "throughput": 1789.74, "total_tokens": 68075520} +{"current_steps": 8320, "total_steps": 20825, "loss": 0.8476, "learning_rate": 3.498411458914238e-05, "epoch": 0.39951980792316927, "percentage": 39.95, "elapsed_time": "10:34:47", "remaining_time": "15:54:05", "throughput": 1789.49, "total_tokens": 68157440} +{"current_steps": 8330, "total_steps": 20825, "loss": 0.859, "learning_rate": 3.494778192191739e-05, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "10:35:40", "remaining_time": "15:53:30", "throughput": 1789.17, "total_tokens": 68239360} +{"current_steps": 8340, "total_steps": 20825, "loss": 0.771, "learning_rate": 3.4911424274284886e-05, "epoch": 0.4004801920768307, "percentage": 40.05, "elapsed_time": "10:36:31", "remaining_time": "15:52:52", "throughput": 1788.93, "total_tokens": 68321280} +{"current_steps": 8350, "total_steps": 20825, "loss": 0.9161, "learning_rate": 3.4875041737544526e-05, "epoch": 0.4009603841536615, "percentage": 40.1, "elapsed_time": "10:37:19", "remaining_time": "15:52:10", "throughput": 1788.79, "total_tokens": 68403200} +{"current_steps": 8360, "total_steps": 20825, "loss": 0.8845, "learning_rate": 3.483863440305845e-05, "epoch": 0.4014405762304922, "percentage": 40.14, "elapsed_time": "10:38:08", "remaining_time": "15:51:29", "throughput": 1788.67, "total_tokens": 68485120} +{"current_steps": 8370, "total_steps": 20825, "loss": 0.9752, "learning_rate": 3.480220236225106e-05, "epoch": 0.40192076830732293, "percentage": 40.19, "elapsed_time": "10:40:15", "remaining_time": "15:52:44", "throughput": 1784.86, "total_tokens": 68567040} +{"current_steps": 8380, "total_steps": 20825, "loss": 0.8717, "learning_rate": 3.476574570660879e-05, "epoch": 0.4024009603841537, "percentage": 40.24, "elapsed_time": "10:41:19", "remaining_time": "15:52:24", "throughput": 1784.06, "total_tokens": 68648960} +{"current_steps": 8390, "total_steps": 20825, "loss": 0.7304, "learning_rate": 3.472926452767992e-05, "epoch": 0.4028811524609844, "percentage": 40.29, "elapsed_time": "10:42:12", "remaining_time": "15:51:50", "throughput": 1783.7, "total_tokens": 68730880} +{"current_steps": 8400, "total_steps": 20825, "loss": 0.8629, "learning_rate": 3.469275891707428e-05, "epoch": 0.40336134453781514, "percentage": 40.34, "elapsed_time": "10:43:04", "remaining_time": "15:51:13", "throughput": 1783.42, "total_tokens": 68812800} +{"current_steps": 8410, "total_steps": 20825, "loss": 0.8738, "learning_rate": 3.465622896646305e-05, "epoch": 0.40384153661464584, "percentage": 40.38, "elapsed_time": "10:43:56", "remaining_time": "15:50:36", "throughput": 1783.14, "total_tokens": 68894720} +{"current_steps": 8420, "total_steps": 20825, "loss": 0.8472, "learning_rate": 3.461967476757857e-05, "epoch": 0.4043217286914766, "percentage": 40.43, "elapsed_time": "10:44:48", "remaining_time": "15:49:58", "throughput": 1782.87, "total_tokens": 68976640} +{"current_steps": 8430, "total_steps": 20825, "loss": 1.0451, "learning_rate": 3.4583096412214025e-05, "epoch": 0.40480192076830734, "percentage": 40.48, "elapsed_time": "10:45:40", "remaining_time": "15:49:21", "throughput": 1782.6, "total_tokens": 69058560} +{"current_steps": 8440, "total_steps": 20825, "loss": 0.8458, "learning_rate": 3.454649399222328e-05, "epoch": 0.40528211284513804, "percentage": 40.53, "elapsed_time": "10:46:32", "remaining_time": "15:48:44", "throughput": 1782.33, "total_tokens": 69140480} +{"current_steps": 8450, "total_steps": 20825, "loss": 0.8503, "learning_rate": 3.450986759952064e-05, "epoch": 0.4057623049219688, "percentage": 40.58, "elapsed_time": "10:47:23", "remaining_time": "15:48:06", "throughput": 1782.07, "total_tokens": 69222400} +{"current_steps": 8460, "total_steps": 20825, "loss": 0.8767, "learning_rate": 3.44732173260806e-05, "epoch": 0.4062424969987995, "percentage": 40.62, "elapsed_time": "10:48:15", "remaining_time": "15:47:29", "throughput": 1781.79, "total_tokens": 69304320} +{"current_steps": 8470, "total_steps": 20825, "loss": 0.9149, "learning_rate": 3.4436543263937613e-05, "epoch": 0.40672268907563025, "percentage": 40.67, "elapsed_time": "10:49:07", "remaining_time": "15:46:52", "throughput": 1781.53, "total_tokens": 69386240} +{"current_steps": 8480, "total_steps": 20825, "loss": 0.8728, "learning_rate": 3.439984550518589e-05, "epoch": 0.407202881152461, "percentage": 40.72, "elapsed_time": "10:49:59", "remaining_time": "15:46:14", "throughput": 1781.26, "total_tokens": 69468160} +{"current_steps": 8490, "total_steps": 20825, "loss": 0.9235, "learning_rate": 3.436312414197913e-05, "epoch": 0.4076830732292917, "percentage": 40.77, "elapsed_time": "10:50:51", "remaining_time": "15:45:37", "throughput": 1780.99, "total_tokens": 69550080} +{"current_steps": 8500, "total_steps": 20825, "loss": 1.0674, "learning_rate": 3.4326379266530314e-05, "epoch": 0.40816326530612246, "percentage": 40.82, "elapsed_time": "10:51:43", "remaining_time": "15:45:00", "throughput": 1780.7, "total_tokens": 69632000} +{"current_steps": 8510, "total_steps": 20825, "loss": 0.8399, "learning_rate": 3.428961097111146e-05, "epoch": 0.40864345738295316, "percentage": 40.86, "elapsed_time": "10:52:35", "remaining_time": "15:44:22", "throughput": 1780.44, "total_tokens": 69713920} +{"current_steps": 8520, "total_steps": 20825, "loss": 0.9089, "learning_rate": 3.4252819348053424e-05, "epoch": 0.4091236494597839, "percentage": 40.91, "elapsed_time": "10:53:27", "remaining_time": "15:43:45", "throughput": 1780.17, "total_tokens": 69795840} +{"current_steps": 8530, "total_steps": 20825, "loss": 0.9305, "learning_rate": 3.421600448974559e-05, "epoch": 0.40960384153661467, "percentage": 40.96, "elapsed_time": "10:54:19", "remaining_time": "15:43:07", "throughput": 1779.9, "total_tokens": 69877760} +{"current_steps": 8540, "total_steps": 20825, "loss": 0.9921, "learning_rate": 3.4179166488635736e-05, "epoch": 0.41008403361344536, "percentage": 41.01, "elapsed_time": "10:55:11", "remaining_time": "15:42:30", "throughput": 1779.63, "total_tokens": 69959680} +{"current_steps": 8550, "total_steps": 20825, "loss": 0.9862, "learning_rate": 3.414230543722973e-05, "epoch": 0.4105642256902761, "percentage": 41.06, "elapsed_time": "10:56:04", "remaining_time": "15:41:54", "throughput": 1779.32, "total_tokens": 70041600} +{"current_steps": 8560, "total_steps": 20825, "loss": 0.8721, "learning_rate": 3.410542142809134e-05, "epoch": 0.4110444177671068, "percentage": 41.1, "elapsed_time": "10:56:57", "remaining_time": "15:41:18", "throughput": 1779.01, "total_tokens": 70123520} +{"current_steps": 8570, "total_steps": 20825, "loss": 1.0909, "learning_rate": 3.4068514553841965e-05, "epoch": 0.41152460984393757, "percentage": 41.15, "elapsed_time": "10:57:49", "remaining_time": "15:40:40", "throughput": 1778.73, "total_tokens": 70205440} +{"current_steps": 8580, "total_steps": 20825, "loss": 0.8935, "learning_rate": 3.403158490716043e-05, "epoch": 0.4120048019207683, "percentage": 41.2, "elapsed_time": "10:58:42", "remaining_time": "15:40:04", "throughput": 1778.42, "total_tokens": 70287360} +{"current_steps": 8590, "total_steps": 20825, "loss": 0.8689, "learning_rate": 3.3994632580782766e-05, "epoch": 0.412484993997599, "percentage": 41.25, "elapsed_time": "10:59:34", "remaining_time": "15:39:26", "throughput": 1778.16, "total_tokens": 70369280} +{"current_steps": 8600, "total_steps": 20825, "loss": 0.8591, "learning_rate": 3.395765766750192e-05, "epoch": 0.4129651860744298, "percentage": 41.3, "elapsed_time": "11:00:24", "remaining_time": "15:38:47", "throughput": 1777.95, "total_tokens": 70451200} +{"current_steps": 8610, "total_steps": 20825, "loss": 0.8133, "learning_rate": 3.392066026016757e-05, "epoch": 0.4134453781512605, "percentage": 41.34, "elapsed_time": "11:01:14", "remaining_time": "15:38:06", "throughput": 1777.78, "total_tokens": 70533120} +{"current_steps": 8620, "total_steps": 20825, "loss": 0.8302, "learning_rate": 3.388364045168591e-05, "epoch": 0.41392557022809123, "percentage": 41.39, "elapsed_time": "11:02:06", "remaining_time": "15:37:28", "throughput": 1777.53, "total_tokens": 70615040} +{"current_steps": 8630, "total_steps": 20825, "loss": 0.8433, "learning_rate": 3.3846598335019335e-05, "epoch": 0.414405762304922, "percentage": 41.44, "elapsed_time": "11:02:58", "remaining_time": "15:36:51", "throughput": 1777.25, "total_tokens": 70696960} +{"current_steps": 8640, "total_steps": 20825, "loss": 0.959, "learning_rate": 3.38095340031863e-05, "epoch": 0.4148859543817527, "percentage": 41.49, "elapsed_time": "11:03:49", "remaining_time": "15:36:11", "throughput": 1777.05, "total_tokens": 70778880} +{"current_steps": 8650, "total_steps": 20825, "loss": 1.0122, "learning_rate": 3.377244754926104e-05, "epoch": 0.41536614645858344, "percentage": 41.54, "elapsed_time": "11:04:40", "remaining_time": "15:35:31", "throughput": 1776.84, "total_tokens": 70860800} +{"current_steps": 8660, "total_steps": 20825, "loss": 0.8981, "learning_rate": 3.3735339066373314e-05, "epoch": 0.41584633853541414, "percentage": 41.58, "elapsed_time": "11:05:30", "remaining_time": "15:34:51", "throughput": 1776.68, "total_tokens": 70942720} +{"current_steps": 8670, "total_steps": 20825, "loss": 0.8525, "learning_rate": 3.369820864770822e-05, "epoch": 0.4163265306122449, "percentage": 41.63, "elapsed_time": "11:06:19", "remaining_time": "15:34:09", "throughput": 1776.53, "total_tokens": 71024640} +{"current_steps": 8680, "total_steps": 20825, "loss": 0.8923, "learning_rate": 3.366105638650596e-05, "epoch": 0.41680672268907565, "percentage": 41.68, "elapsed_time": "11:07:08", "remaining_time": "15:33:27", "throughput": 1776.39, "total_tokens": 71106560} +{"current_steps": 8690, "total_steps": 20825, "loss": 0.8246, "learning_rate": 3.3623882376061554e-05, "epoch": 0.41728691476590635, "percentage": 41.73, "elapsed_time": "11:07:57", "remaining_time": "15:32:46", "throughput": 1776.25, "total_tokens": 71188480} +{"current_steps": 8700, "total_steps": 20825, "loss": 0.8436, "learning_rate": 3.358668670972465e-05, "epoch": 0.4177671068427371, "percentage": 41.78, "elapsed_time": "11:08:47", "remaining_time": "15:32:05", "throughput": 1776.08, "total_tokens": 71270400} +{"current_steps": 8710, "total_steps": 20825, "loss": 0.9426, "learning_rate": 3.354946948089927e-05, "epoch": 0.4182472989195678, "percentage": 41.82, "elapsed_time": "11:09:37", "remaining_time": "15:31:23", "throughput": 1775.94, "total_tokens": 71352320} +{"current_steps": 8720, "total_steps": 20825, "loss": 0.8829, "learning_rate": 3.351223078304359e-05, "epoch": 0.41872749099639855, "percentage": 41.87, "elapsed_time": "11:10:26", "remaining_time": "15:30:41", "throughput": 1775.81, "total_tokens": 71434240} +{"current_steps": 8730, "total_steps": 20825, "loss": 0.9692, "learning_rate": 3.34749707096697e-05, "epoch": 0.4192076830732293, "percentage": 41.92, "elapsed_time": "11:11:15", "remaining_time": "15:30:00", "throughput": 1775.67, "total_tokens": 71516160} +{"current_steps": 8740, "total_steps": 20825, "loss": 0.8491, "learning_rate": 3.343768935434337e-05, "epoch": 0.41968787515006, "percentage": 41.97, "elapsed_time": "11:12:05", "remaining_time": "15:29:18", "throughput": 1775.52, "total_tokens": 71598080} +{"current_steps": 8750, "total_steps": 20825, "loss": 0.905, "learning_rate": 3.34003868106838e-05, "epoch": 0.42016806722689076, "percentage": 42.02, "elapsed_time": "11:12:54", "remaining_time": "15:28:36", "throughput": 1775.38, "total_tokens": 71680000} +{"current_steps": 8760, "total_steps": 20825, "loss": 0.9733, "learning_rate": 3.3363063172363396e-05, "epoch": 0.42064825930372146, "percentage": 42.06, "elapsed_time": "11:13:44", "remaining_time": "15:27:55", "throughput": 1775.23, "total_tokens": 71761920} +{"current_steps": 8770, "total_steps": 20825, "loss": 1.1804, "learning_rate": 3.3325718533107556e-05, "epoch": 0.4211284513805522, "percentage": 42.11, "elapsed_time": "11:14:33", "remaining_time": "15:27:13", "throughput": 1775.08, "total_tokens": 71843840} +{"current_steps": 8780, "total_steps": 20825, "loss": 0.9318, "learning_rate": 3.3288352986694396e-05, "epoch": 0.42160864345738297, "percentage": 42.16, "elapsed_time": "11:15:22", "remaining_time": "15:26:32", "throughput": 1774.94, "total_tokens": 71925760} +{"current_steps": 8790, "total_steps": 20825, "loss": 1.0563, "learning_rate": 3.325096662695454e-05, "epoch": 0.42208883553421367, "percentage": 42.21, "elapsed_time": "11:16:12", "remaining_time": "15:25:50", "throughput": 1774.8, "total_tokens": 72007680} +{"current_steps": 8800, "total_steps": 20825, "loss": 0.83, "learning_rate": 3.321355954777087e-05, "epoch": 0.4225690276110444, "percentage": 42.26, "elapsed_time": "11:17:01", "remaining_time": "15:25:08", "throughput": 1774.65, "total_tokens": 72089600} +{"current_steps": 8810, "total_steps": 20825, "loss": 0.906, "learning_rate": 3.317613184307832e-05, "epoch": 0.4230492196878752, "percentage": 42.3, "elapsed_time": "11:17:51", "remaining_time": "15:24:27", "throughput": 1774.49, "total_tokens": 72171520} +{"current_steps": 8820, "total_steps": 20825, "loss": 0.938, "learning_rate": 3.313868360686359e-05, "epoch": 0.4235294117647059, "percentage": 42.35, "elapsed_time": "11:18:41", "remaining_time": "15:23:46", "throughput": 1774.34, "total_tokens": 72253440} +{"current_steps": 8830, "total_steps": 20825, "loss": 0.8989, "learning_rate": 3.310121493316495e-05, "epoch": 0.42400960384153663, "percentage": 42.4, "elapsed_time": "11:19:30", "remaining_time": "15:23:04", "throughput": 1774.21, "total_tokens": 72335360} +{"current_steps": 8840, "total_steps": 20825, "loss": 0.876, "learning_rate": 3.306372591607199e-05, "epoch": 0.42448979591836733, "percentage": 42.45, "elapsed_time": "11:20:19", "remaining_time": "15:22:22", "throughput": 1774.06, "total_tokens": 72417280} +{"current_steps": 8850, "total_steps": 20825, "loss": 0.8632, "learning_rate": 3.30262166497254e-05, "epoch": 0.4249699879951981, "percentage": 42.5, "elapsed_time": "11:21:09", "remaining_time": "15:21:41", "throughput": 1773.9, "total_tokens": 72499200} +{"current_steps": 8860, "total_steps": 20825, "loss": 1.1161, "learning_rate": 3.29886872283167e-05, "epoch": 0.42545018007202884, "percentage": 42.55, "elapsed_time": "11:21:59", "remaining_time": "15:21:00", "throughput": 1773.75, "total_tokens": 72581120} +{"current_steps": 8870, "total_steps": 20825, "loss": 0.94, "learning_rate": 3.2951137746088004e-05, "epoch": 0.42593037214885954, "percentage": 42.59, "elapsed_time": "11:22:53", "remaining_time": "15:20:23", "throughput": 1773.43, "total_tokens": 72663040} +{"current_steps": 8880, "total_steps": 20825, "loss": 0.8393, "learning_rate": 3.291356829733186e-05, "epoch": 0.4264105642256903, "percentage": 42.64, "elapsed_time": "11:23:47", "remaining_time": "15:19:48", "throughput": 1773.07, "total_tokens": 72744960} +{"current_steps": 8890, "total_steps": 20825, "loss": 1.0528, "learning_rate": 3.287597897639092e-05, "epoch": 0.426890756302521, "percentage": 42.69, "elapsed_time": "11:24:38", "remaining_time": "15:19:08", "throughput": 1772.87, "total_tokens": 72826880} +{"current_steps": 8900, "total_steps": 20825, "loss": 0.8697, "learning_rate": 3.283836987765771e-05, "epoch": 0.42737094837935174, "percentage": 42.74, "elapsed_time": "11:25:29", "remaining_time": "15:18:29", "throughput": 1772.66, "total_tokens": 72908800} +{"current_steps": 8910, "total_steps": 20825, "loss": 0.8158, "learning_rate": 3.280074109557447e-05, "epoch": 0.4278511404561825, "percentage": 42.79, "elapsed_time": "11:26:44", "remaining_time": "15:18:20", "throughput": 1771.44, "total_tokens": 72990720} +{"current_steps": 8920, "total_steps": 20825, "loss": 0.8016, "learning_rate": 3.2763092724632854e-05, "epoch": 0.4283313325330132, "percentage": 42.83, "elapsed_time": "11:27:56", "remaining_time": "15:18:09", "throughput": 1770.31, "total_tokens": 73072640} +{"current_steps": 8930, "total_steps": 20825, "loss": 0.9782, "learning_rate": 3.272542485937369e-05, "epoch": 0.42881152460984395, "percentage": 42.88, "elapsed_time": "11:28:50", "remaining_time": "15:17:33", "throughput": 1769.99, "total_tokens": 73154560} +{"current_steps": 8940, "total_steps": 20825, "loss": 0.7977, "learning_rate": 3.2687737594386766e-05, "epoch": 0.42929171668667465, "percentage": 42.93, "elapsed_time": "11:29:42", "remaining_time": "15:16:54", "throughput": 1769.76, "total_tokens": 73236480} +{"current_steps": 8950, "total_steps": 20825, "loss": 1.0063, "learning_rate": 3.2650031024310603e-05, "epoch": 0.4297719087635054, "percentage": 42.98, "elapsed_time": "11:30:33", "remaining_time": "15:16:14", "throughput": 1769.56, "total_tokens": 73318400} +{"current_steps": 8960, "total_steps": 20825, "loss": 1.0871, "learning_rate": 3.2612305243832176e-05, "epoch": 0.43025210084033616, "percentage": 43.03, "elapsed_time": "11:31:24", "remaining_time": "15:15:34", "throughput": 1769.34, "total_tokens": 73400320} +{"current_steps": 8970, "total_steps": 20825, "loss": 0.9702, "learning_rate": 3.2574560347686725e-05, "epoch": 0.43073229291716686, "percentage": 43.07, "elapsed_time": "11:32:19", "remaining_time": "15:14:59", "throughput": 1768.97, "total_tokens": 73482240} +{"current_steps": 8980, "total_steps": 20825, "loss": 0.9451, "learning_rate": 3.253679643065747e-05, "epoch": 0.4312124849939976, "percentage": 43.12, "elapsed_time": "11:33:11", "remaining_time": "15:14:20", "throughput": 1768.73, "total_tokens": 73564160} +{"current_steps": 8990, "total_steps": 20825, "loss": 0.9423, "learning_rate": 3.249901358757538e-05, "epoch": 0.4316926770708283, "percentage": 43.17, "elapsed_time": "11:34:09", "remaining_time": "15:13:50", "throughput": 1768.23, "total_tokens": 73646080} +{"current_steps": 9000, "total_steps": 20825, "loss": 0.9845, "learning_rate": 3.246121191331902e-05, "epoch": 0.43217286914765907, "percentage": 43.22, "elapsed_time": "11:35:05", "remaining_time": "15:13:16", "throughput": 1767.83, "total_tokens": 73728000} +{"current_steps": 9010, "total_steps": 20825, "loss": 0.8655, "learning_rate": 3.242339150281417e-05, "epoch": 0.4326530612244898, "percentage": 43.27, "elapsed_time": "11:36:09", "remaining_time": "15:12:53", "throughput": 1767.08, "total_tokens": 73809920} +{"current_steps": 9020, "total_steps": 20825, "loss": 0.869, "learning_rate": 3.238555245103368e-05, "epoch": 0.4331332533013205, "percentage": 43.31, "elapsed_time": "11:37:07", "remaining_time": "15:12:22", "throughput": 1766.58, "total_tokens": 73891840} +{"current_steps": 9030, "total_steps": 20825, "loss": 0.8508, "learning_rate": 3.234769485299724e-05, "epoch": 0.4336134453781513, "percentage": 43.36, "elapsed_time": "11:38:06", "remaining_time": "15:11:52", "throughput": 1766.03, "total_tokens": 73973760} +{"current_steps": 9040, "total_steps": 20825, "loss": 1.035, "learning_rate": 3.230981880377107e-05, "epoch": 0.434093637454982, "percentage": 43.41, "elapsed_time": "11:39:01", "remaining_time": "15:11:17", "throughput": 1765.67, "total_tokens": 74055680} +{"current_steps": 9050, "total_steps": 20825, "loss": 0.9306, "learning_rate": 3.227192439846775e-05, "epoch": 0.4345738295318127, "percentage": 43.46, "elapsed_time": "11:39:57", "remaining_time": "15:10:43", "throughput": 1765.29, "total_tokens": 74137600} +{"current_steps": 9060, "total_steps": 20825, "loss": 0.9369, "learning_rate": 3.223401173224595e-05, "epoch": 0.4350540216086435, "percentage": 43.51, "elapsed_time": "11:40:53", "remaining_time": "15:10:09", "throughput": 1764.89, "total_tokens": 74219520} +{"current_steps": 9070, "total_steps": 20825, "loss": 0.8561, "learning_rate": 3.219608090031021e-05, "epoch": 0.4355342136854742, "percentage": 43.55, "elapsed_time": "11:41:52", "remaining_time": "15:09:38", "throughput": 1764.37, "total_tokens": 74301440} +{"current_steps": 9080, "total_steps": 20825, "loss": 1.0078, "learning_rate": 3.215813199791065e-05, "epoch": 0.43601440576230494, "percentage": 43.6, "elapsed_time": "11:42:49", "remaining_time": "15:09:06", "throughput": 1763.91, "total_tokens": 74383360} +{"current_steps": 9090, "total_steps": 20825, "loss": 0.8402, "learning_rate": 3.212016512034279e-05, "epoch": 0.43649459783913563, "percentage": 43.65, "elapsed_time": "11:43:48", "remaining_time": "15:08:35", "throughput": 1763.41, "total_tokens": 74465280} +{"current_steps": 9100, "total_steps": 20825, "loss": 0.9409, "learning_rate": 3.2082180362947304e-05, "epoch": 0.4369747899159664, "percentage": 43.7, "elapsed_time": "11:44:46", "remaining_time": "15:08:04", "throughput": 1762.9, "total_tokens": 74547200} +{"current_steps": 9110, "total_steps": 20825, "loss": 1.0121, "learning_rate": 3.204417782110974e-05, "epoch": 0.43745498199279714, "percentage": 43.75, "elapsed_time": "11:46:00", "remaining_time": "15:07:53", "throughput": 1761.76, "total_tokens": 74629120} +{"current_steps": 9120, "total_steps": 20825, "loss": 1.0525, "learning_rate": 3.200615759026031e-05, "epoch": 0.43793517406962784, "percentage": 43.79, "elapsed_time": "11:47:12", "remaining_time": "15:07:39", "throughput": 1760.72, "total_tokens": 74711040} +{"current_steps": 9130, "total_steps": 20825, "loss": 0.8456, "learning_rate": 3.1968119765873654e-05, "epoch": 0.4384153661464586, "percentage": 43.84, "elapsed_time": "11:48:20", "remaining_time": "15:07:20", "throughput": 1759.82, "total_tokens": 74792960} +{"current_steps": 9140, "total_steps": 20825, "loss": 0.8187, "learning_rate": 3.193006444346859e-05, "epoch": 0.4388955582232893, "percentage": 43.89, "elapsed_time": "11:49:29", "remaining_time": "15:07:02", "throughput": 1758.89, "total_tokens": 74874880} +{"current_steps": 9150, "total_steps": 20825, "loss": 1.1672, "learning_rate": 3.189199171860787e-05, "epoch": 0.43937575030012005, "percentage": 43.94, "elapsed_time": "11:50:39", "remaining_time": "15:06:46", "throughput": 1757.91, "total_tokens": 74956800} +{"current_steps": 9160, "total_steps": 20825, "loss": 0.7784, "learning_rate": 3.185390168689796e-05, "epoch": 0.4398559423769508, "percentage": 43.99, "elapsed_time": "11:51:46", "remaining_time": "15:06:25", "throughput": 1757.09, "total_tokens": 75038720} +{"current_steps": 9170, "total_steps": 20825, "loss": 0.7409, "learning_rate": 3.1815794443988763e-05, "epoch": 0.4403361344537815, "percentage": 44.03, "elapsed_time": "11:53:51", "remaining_time": "15:07:18", "throughput": 1753.86, "total_tokens": 75120640} +{"current_steps": 9180, "total_steps": 20825, "loss": 0.9283, "learning_rate": 3.177767008557343e-05, "epoch": 0.44081632653061226, "percentage": 44.08, "elapsed_time": "11:59:39", "remaining_time": "15:12:54", "throughput": 1741.61, "total_tokens": 75202560} +{"current_steps": 9190, "total_steps": 20825, "loss": 0.8384, "learning_rate": 3.1739528707388066e-05, "epoch": 0.44129651860744296, "percentage": 44.13, "elapsed_time": "12:04:21", "remaining_time": "15:17:04", "throughput": 1732.2, "total_tokens": 75284480} +{"current_steps": 9200, "total_steps": 20825, "loss": 0.8281, "learning_rate": 3.1701370405211535e-05, "epoch": 0.4417767106842737, "percentage": 44.18, "elapsed_time": "12:06:18", "remaining_time": "15:17:44", "throughput": 1729.45, "total_tokens": 75366400} +{"current_steps": 9210, "total_steps": 20825, "loss": 0.9655, "learning_rate": 3.166319527486519e-05, "epoch": 0.44225690276110446, "percentage": 44.23, "elapsed_time": "12:07:32", "remaining_time": "15:17:31", "throughput": 1728.37, "total_tokens": 75448320} +{"current_steps": 9220, "total_steps": 20825, "loss": 0.9852, "learning_rate": 3.162500341221264e-05, "epoch": 0.44273709483793516, "percentage": 44.27, "elapsed_time": "12:08:31", "remaining_time": "15:16:58", "throughput": 1727.93, "total_tokens": 75530240} +{"current_steps": 9230, "total_steps": 20825, "loss": 0.9623, "learning_rate": 3.158679491315951e-05, "epoch": 0.4432172869147659, "percentage": 44.32, "elapsed_time": "12:09:29", "remaining_time": "15:16:24", "throughput": 1727.51, "total_tokens": 75612160} +{"current_steps": 9240, "total_steps": 20825, "loss": 0.9564, "learning_rate": 3.154856987365322e-05, "epoch": 0.4436974789915966, "percentage": 44.37, "elapsed_time": "12:10:29", "remaining_time": "15:15:53", "throughput": 1727.0, "total_tokens": 75694080} +{"current_steps": 9250, "total_steps": 20825, "loss": 0.7948, "learning_rate": 3.151032838968271e-05, "epoch": 0.44417767106842737, "percentage": 44.42, "elapsed_time": "12:11:28", "remaining_time": "15:15:20", "throughput": 1726.54, "total_tokens": 75776000} +{"current_steps": 9260, "total_steps": 20825, "loss": 1.0294, "learning_rate": 3.14720705572782e-05, "epoch": 0.4446578631452581, "percentage": 44.47, "elapsed_time": "12:12:27", "remaining_time": "15:14:46", "throughput": 1726.11, "total_tokens": 75857920} +{"current_steps": 9270, "total_steps": 20825, "loss": 0.8652, "learning_rate": 3.1433796472511e-05, "epoch": 0.4451380552220888, "percentage": 44.51, "elapsed_time": "12:13:24", "remaining_time": "15:14:11", "throughput": 1725.72, "total_tokens": 75939840} +{"current_steps": 9280, "total_steps": 20825, "loss": 1.0851, "learning_rate": 3.13955062314932e-05, "epoch": 0.4456182472989196, "percentage": 44.56, "elapsed_time": "12:14:23", "remaining_time": "15:13:37", "throughput": 1725.29, "total_tokens": 76021760} +{"current_steps": 9290, "total_steps": 20825, "loss": 0.9558, "learning_rate": 3.135719993037748e-05, "epoch": 0.4460984393757503, "percentage": 44.61, "elapsed_time": "12:15:24", "remaining_time": "15:13:07", "throughput": 1724.74, "total_tokens": 76103680} +{"current_steps": 9300, "total_steps": 20825, "loss": 0.9276, "learning_rate": 3.131887766535684e-05, "epoch": 0.44657863145258103, "percentage": 44.66, "elapsed_time": "12:16:27", "remaining_time": "15:12:39", "throughput": 1724.13, "total_tokens": 76185600} +{"current_steps": 9310, "total_steps": 20825, "loss": 0.824, "learning_rate": 3.1280539532664366e-05, "epoch": 0.4470588235294118, "percentage": 44.71, "elapsed_time": "12:17:29", "remaining_time": "15:12:09", "throughput": 1723.58, "total_tokens": 76267520} +{"current_steps": 9320, "total_steps": 20825, "loss": 0.876, "learning_rate": 3.1242185628573e-05, "epoch": 0.4475390156062425, "percentage": 44.75, "elapsed_time": "12:18:28", "remaining_time": "15:11:36", "throughput": 1723.12, "total_tokens": 76349440} +{"current_steps": 9330, "total_steps": 20825, "loss": 0.8179, "learning_rate": 3.120381604939529e-05, "epoch": 0.44801920768307324, "percentage": 44.8, "elapsed_time": "12:19:21", "remaining_time": "15:10:55", "throughput": 1722.92, "total_tokens": 76431360} +{"current_steps": 9340, "total_steps": 20825, "loss": 0.9818, "learning_rate": 3.116543089148312e-05, "epoch": 0.44849939975990394, "percentage": 44.85, "elapsed_time": "12:20:13", "remaining_time": "15:10:13", "throughput": 1722.74, "total_tokens": 76513280} +{"current_steps": 9350, "total_steps": 20825, "loss": 0.767, "learning_rate": 3.112703025122754e-05, "epoch": 0.4489795918367347, "percentage": 44.9, "elapsed_time": "12:21:06", "remaining_time": "15:09:32", "throughput": 1722.55, "total_tokens": 76595200} +{"current_steps": 9360, "total_steps": 20825, "loss": 0.7457, "learning_rate": 3.108861422505842e-05, "epoch": 0.44945978391356545, "percentage": 44.95, "elapsed_time": "12:21:58", "remaining_time": "15:08:50", "throughput": 1722.37, "total_tokens": 76677120} +{"current_steps": 9370, "total_steps": 20825, "loss": 0.9048, "learning_rate": 3.105018290944432e-05, "epoch": 0.44993997599039615, "percentage": 44.99, "elapsed_time": "12:22:52", "remaining_time": "15:08:11", "throughput": 1722.1, "total_tokens": 76759040} +{"current_steps": 9380, "total_steps": 20825, "loss": 0.86, "learning_rate": 3.1011736400892175e-05, "epoch": 0.4504201680672269, "percentage": 45.04, "elapsed_time": "12:23:47", "remaining_time": "15:07:32", "throughput": 1721.81, "total_tokens": 76840960} +{"current_steps": 9390, "total_steps": 20825, "loss": 0.793, "learning_rate": 3.097327479594707e-05, "epoch": 0.4509003601440576, "percentage": 45.09, "elapsed_time": "12:24:43", "remaining_time": "15:06:55", "throughput": 1721.49, "total_tokens": 76922880} +{"current_steps": 9400, "total_steps": 20825, "loss": 0.9349, "learning_rate": 3.093479819119198e-05, "epoch": 0.45138055222088835, "percentage": 45.14, "elapsed_time": "12:25:39", "remaining_time": "15:06:17", "throughput": 1721.2, "total_tokens": 77004800} +{"current_steps": 9410, "total_steps": 20825, "loss": 0.9205, "learning_rate": 3.089630668324759e-05, "epoch": 0.4518607442977191, "percentage": 45.19, "elapsed_time": "12:26:33", "remaining_time": "15:05:38", "throughput": 1720.92, "total_tokens": 77086720} +{"current_steps": 9420, "total_steps": 20825, "loss": 0.8324, "learning_rate": 3.085780036877197e-05, "epoch": 0.4523409363745498, "percentage": 45.23, "elapsed_time": "12:27:27", "remaining_time": "15:04:58", "throughput": 1720.68, "total_tokens": 77168640} +{"current_steps": 9430, "total_steps": 20825, "loss": 0.8051, "learning_rate": 3.0819279344460396e-05, "epoch": 0.45282112845138056, "percentage": 45.28, "elapsed_time": "12:28:23", "remaining_time": "15:04:19", "throughput": 1720.39, "total_tokens": 77250560} +{"current_steps": 9440, "total_steps": 20825, "loss": 0.9294, "learning_rate": 3.078074370704507e-05, "epoch": 0.45330132052821126, "percentage": 45.33, "elapsed_time": "12:29:16", "remaining_time": "15:03:39", "throughput": 1720.15, "total_tokens": 77332480} +{"current_steps": 9450, "total_steps": 20825, "loss": 0.8818, "learning_rate": 3.07421935532949e-05, "epoch": 0.453781512605042, "percentage": 45.38, "elapsed_time": "12:30:17", "remaining_time": "15:03:07", "throughput": 1719.65, "total_tokens": 77414400} +{"current_steps": 9460, "total_steps": 20825, "loss": 0.9213, "learning_rate": 3.0703628980015214e-05, "epoch": 0.45426170468187277, "percentage": 45.43, "elapsed_time": "12:31:17", "remaining_time": "15:02:35", "throughput": 1719.18, "total_tokens": 77496320} +{"current_steps": 9470, "total_steps": 20825, "loss": 0.8218, "learning_rate": 3.0665050084047605e-05, "epoch": 0.45474189675870347, "percentage": 45.47, "elapsed_time": "12:32:19", "remaining_time": "15:02:04", "throughput": 1718.62, "total_tokens": 77578240} +{"current_steps": 9480, "total_steps": 20825, "loss": 0.7467, "learning_rate": 3.062645696226959e-05, "epoch": 0.4552220888355342, "percentage": 45.52, "elapsed_time": "12:33:28", "remaining_time": "15:01:41", "throughput": 1717.83, "total_tokens": 77660160} +{"current_steps": 9490, "total_steps": 20825, "loss": 0.9819, "learning_rate": 3.0587849711594425e-05, "epoch": 0.4557022809123649, "percentage": 45.57, "elapsed_time": "12:34:27", "remaining_time": "15:01:08", "throughput": 1717.38, "total_tokens": 77742080} +{"current_steps": 9500, "total_steps": 20825, "loss": 0.8633, "learning_rate": 3.054922842897084e-05, "epoch": 0.4561824729891957, "percentage": 45.62, "elapsed_time": "12:35:29", "remaining_time": "15:00:37", "throughput": 1716.85, "total_tokens": 77824000} +{"current_steps": 9510, "total_steps": 20825, "loss": 1.0312, "learning_rate": 3.051059321138281e-05, "epoch": 0.45666266506602643, "percentage": 45.67, "elapsed_time": "12:36:26", "remaining_time": "15:00:00", "throughput": 1716.5, "total_tokens": 77905920} +{"current_steps": 9520, "total_steps": 20825, "loss": 0.9672, "learning_rate": 3.047194415584929e-05, "epoch": 0.45714285714285713, "percentage": 45.71, "elapsed_time": "12:37:26", "remaining_time": "14:59:27", "throughput": 1716.05, "total_tokens": 77987840} +{"current_steps": 9530, "total_steps": 20825, "loss": 0.9048, "learning_rate": 3.0433281359424008e-05, "epoch": 0.4576230492196879, "percentage": 45.76, "elapsed_time": "12:38:23", "remaining_time": "14:58:51", "throughput": 1715.67, "total_tokens": 78069760} +{"current_steps": 9540, "total_steps": 20825, "loss": 0.7858, "learning_rate": 3.0394604919195156e-05, "epoch": 0.4581032412965186, "percentage": 45.81, "elapsed_time": "12:39:23", "remaining_time": "14:58:17", "throughput": 1715.23, "total_tokens": 78151680} +{"current_steps": 9550, "total_steps": 20825, "loss": 0.9508, "learning_rate": 3.0355914932285228e-05, "epoch": 0.45858343337334934, "percentage": 45.86, "elapsed_time": "12:40:28", "remaining_time": "14:57:50", "throughput": 1714.57, "total_tokens": 78233600} +{"current_steps": 9560, "total_steps": 20825, "loss": 0.8558, "learning_rate": 3.0317211495850717e-05, "epoch": 0.4590636254501801, "percentage": 45.91, "elapsed_time": "12:41:33", "remaining_time": "14:57:22", "throughput": 1713.93, "total_tokens": 78315520} +{"current_steps": 9570, "total_steps": 20825, "loss": 0.7818, "learning_rate": 3.02784947070819e-05, "epoch": 0.4595438175270108, "percentage": 45.95, "elapsed_time": "12:42:37", "remaining_time": "14:56:54", "throughput": 1713.32, "total_tokens": 78397440} +{"current_steps": 9580, "total_steps": 20825, "loss": 0.9045, "learning_rate": 3.0239764663202562e-05, "epoch": 0.46002400960384154, "percentage": 46.0, "elapsed_time": "12:43:35", "remaining_time": "14:56:18", "throughput": 1712.94, "total_tokens": 78479360} +{"current_steps": 9590, "total_steps": 20825, "loss": 0.9581, "learning_rate": 3.0201021461469803e-05, "epoch": 0.46050420168067224, "percentage": 46.05, "elapsed_time": "12:44:30", "remaining_time": "14:55:39", "throughput": 1712.66, "total_tokens": 78561280} +{"current_steps": 9600, "total_steps": 20825, "loss": 0.8943, "learning_rate": 3.0162265199173738e-05, "epoch": 0.460984393757503, "percentage": 46.1, "elapsed_time": "12:45:28", "remaining_time": "14:55:03", "throughput": 1712.28, "total_tokens": 78643200} +{"current_steps": 9610, "total_steps": 20825, "loss": 0.9728, "learning_rate": 3.0123495973637305e-05, "epoch": 0.46146458583433375, "percentage": 46.15, "elapsed_time": "12:46:26", "remaining_time": "14:54:27", "throughput": 1711.9, "total_tokens": 78725120} +{"current_steps": 9620, "total_steps": 20825, "loss": 0.8959, "learning_rate": 3.008471388221597e-05, "epoch": 0.46194477791116445, "percentage": 46.19, "elapsed_time": "12:47:26", "remaining_time": "14:53:53", "throughput": 1711.47, "total_tokens": 78807040} +{"current_steps": 9630, "total_steps": 20825, "loss": 0.7175, "learning_rate": 3.0045919022297524e-05, "epoch": 0.4624249699879952, "percentage": 46.24, "elapsed_time": "12:48:21", "remaining_time": "14:53:13", "throughput": 1711.2, "total_tokens": 78888960} +{"current_steps": 9640, "total_steps": 20825, "loss": 0.8525, "learning_rate": 3.0007111491301816e-05, "epoch": 0.4629051620648259, "percentage": 46.29, "elapsed_time": "12:49:23", "remaining_time": "14:52:41", "throughput": 1710.69, "total_tokens": 78970880} +{"current_steps": 9650, "total_steps": 20825, "loss": 0.941, "learning_rate": 2.9968291386680503e-05, "epoch": 0.46338535414165666, "percentage": 46.34, "elapsed_time": "12:50:23", "remaining_time": "14:52:08", "throughput": 1710.23, "total_tokens": 79052800} +{"current_steps": 9660, "total_steps": 20825, "loss": 1.066, "learning_rate": 2.9929458805916837e-05, "epoch": 0.4638655462184874, "percentage": 46.39, "elapsed_time": "12:51:24", "remaining_time": "14:51:35", "throughput": 1709.76, "total_tokens": 79134720} +{"current_steps": 9670, "total_steps": 20825, "loss": 0.7304, "learning_rate": 2.9890613846525395e-05, "epoch": 0.4643457382953181, "percentage": 46.43, "elapsed_time": "12:52:22", "remaining_time": "14:50:58", "throughput": 1709.39, "total_tokens": 79216640} +{"current_steps": 9680, "total_steps": 20825, "loss": 0.8932, "learning_rate": 2.9851756606051817e-05, "epoch": 0.46482593037214887, "percentage": 46.48, "elapsed_time": "12:53:32", "remaining_time": "14:50:36", "throughput": 1708.57, "total_tokens": 79298560} +{"current_steps": 9690, "total_steps": 20825, "loss": 0.9239, "learning_rate": 2.9812887182072607e-05, "epoch": 0.46530612244897956, "percentage": 46.53, "elapsed_time": "12:54:43", "remaining_time": "14:50:15", "throughput": 1707.72, "total_tokens": 79380480} +{"current_steps": 9700, "total_steps": 20825, "loss": 0.8346, "learning_rate": 2.9774005672194854e-05, "epoch": 0.4657863145258103, "percentage": 46.58, "elapsed_time": "12:55:54", "remaining_time": "14:49:53", "throughput": 1706.86, "total_tokens": 79462400} +{"current_steps": 9710, "total_steps": 20825, "loss": 0.886, "learning_rate": 2.9735112174056006e-05, "epoch": 0.4662665066026411, "percentage": 46.63, "elapsed_time": "12:57:06", "remaining_time": "14:49:32", "throughput": 1706.0, "total_tokens": 79544320} +{"current_steps": 9720, "total_steps": 20825, "loss": 0.8596, "learning_rate": 2.96962067853236e-05, "epoch": 0.46674669867947177, "percentage": 46.67, "elapsed_time": "12:58:13", "remaining_time": "14:49:06", "throughput": 1705.29, "total_tokens": 79626240} +{"current_steps": 9730, "total_steps": 20825, "loss": 0.8394, "learning_rate": 2.9657289603695037e-05, "epoch": 0.4672268907563025, "percentage": 46.72, "elapsed_time": "12:59:12", "remaining_time": "14:48:31", "throughput": 1704.9, "total_tokens": 79708160} +{"current_steps": 9740, "total_steps": 20825, "loss": 1.2984, "learning_rate": 2.9618360726897344e-05, "epoch": 0.4677070828331333, "percentage": 46.77, "elapsed_time": "13:00:11", "remaining_time": "14:47:56", "throughput": 1704.48, "total_tokens": 79790080} +{"current_steps": 9750, "total_steps": 20825, "loss": 0.9511, "learning_rate": 2.957942025268689e-05, "epoch": 0.468187274909964, "percentage": 46.82, "elapsed_time": "13:01:20", "remaining_time": "14:47:31", "throughput": 1703.74, "total_tokens": 79872000} +{"current_steps": 9760, "total_steps": 20825, "loss": 0.8727, "learning_rate": 2.9540468278849208e-05, "epoch": 0.46866746698679473, "percentage": 46.87, "elapsed_time": "13:02:17", "remaining_time": "14:46:53", "throughput": 1703.43, "total_tokens": 79953920} +{"current_steps": 9770, "total_steps": 20825, "loss": 0.8799, "learning_rate": 2.950150490319866e-05, "epoch": 0.46914765906362543, "percentage": 46.91, "elapsed_time": "13:03:12", "remaining_time": "14:46:13", "throughput": 1703.15, "total_tokens": 80035840} +{"current_steps": 9780, "total_steps": 20825, "loss": 0.9699, "learning_rate": 2.9462530223578273e-05, "epoch": 0.4696278511404562, "percentage": 46.96, "elapsed_time": "13:04:11", "remaining_time": "14:45:37", "throughput": 1702.76, "total_tokens": 80117760} +{"current_steps": 9790, "total_steps": 20825, "loss": 0.8275, "learning_rate": 2.9423544337859454e-05, "epoch": 0.47010804321728694, "percentage": 47.01, "elapsed_time": "13:05:09", "remaining_time": "14:44:59", "throughput": 1702.43, "total_tokens": 80199680} +{"current_steps": 9800, "total_steps": 20825, "loss": 0.8525, "learning_rate": 2.938454734394174e-05, "epoch": 0.47058823529411764, "percentage": 47.06, "elapsed_time": "13:06:07", "remaining_time": "14:44:23", "throughput": 1702.07, "total_tokens": 80281600} +{"current_steps": 9810, "total_steps": 20825, "loss": 0.9778, "learning_rate": 2.9345539339752575e-05, "epoch": 0.4710684273709484, "percentage": 47.11, "elapsed_time": "13:07:04", "remaining_time": "14:43:44", "throughput": 1701.75, "total_tokens": 80363520} +{"current_steps": 9820, "total_steps": 20825, "loss": 0.829, "learning_rate": 2.9306520423247045e-05, "epoch": 0.4715486194477791, "percentage": 47.15, "elapsed_time": "13:08:09", "remaining_time": "14:43:16", "throughput": 1701.11, "total_tokens": 80445440} +{"current_steps": 9830, "total_steps": 20825, "loss": 0.9411, "learning_rate": 2.9267490692407635e-05, "epoch": 0.47202881152460985, "percentage": 47.2, "elapsed_time": "13:10:20", "remaining_time": "14:44:00", "throughput": 1698.14, "total_tokens": 80527360} +{"current_steps": 9840, "total_steps": 20825, "loss": 0.9641, "learning_rate": 2.9228450245243993e-05, "epoch": 0.4725090036014406, "percentage": 47.25, "elapsed_time": "13:12:30", "remaining_time": "14:44:44", "throughput": 1695.22, "total_tokens": 80609280} +{"current_steps": 9850, "total_steps": 20825, "loss": 1.1205, "learning_rate": 2.9189399179792676e-05, "epoch": 0.4729891956782713, "percentage": 47.3, "elapsed_time": "13:14:33", "remaining_time": "14:45:18", "throughput": 1692.57, "total_tokens": 80691200} +{"current_steps": 9860, "total_steps": 20825, "loss": 0.9089, "learning_rate": 2.9150337594116904e-05, "epoch": 0.47346938775510206, "percentage": 47.35, "elapsed_time": "13:15:25", "remaining_time": "14:44:33", "throughput": 1692.47, "total_tokens": 80773120} +{"current_steps": 9870, "total_steps": 20825, "loss": 0.8489, "learning_rate": 2.9111265586306314e-05, "epoch": 0.47394957983193275, "percentage": 47.39, "elapsed_time": "13:16:16", "remaining_time": "14:43:48", "throughput": 1692.35, "total_tokens": 80855040} +{"current_steps": 9880, "total_steps": 20825, "loss": 0.8287, "learning_rate": 2.9072183254476713e-05, "epoch": 0.4744297719087635, "percentage": 47.44, "elapsed_time": "13:17:08", "remaining_time": "14:43:03", "throughput": 1692.24, "total_tokens": 80936960} +{"current_steps": 9890, "total_steps": 20825, "loss": 0.9506, "learning_rate": 2.903309069676984e-05, "epoch": 0.47490996398559426, "percentage": 47.49, "elapsed_time": "13:18:01", "remaining_time": "14:42:20", "throughput": 1692.08, "total_tokens": 81018880} +{"current_steps": 9900, "total_steps": 20825, "loss": 0.8601, "learning_rate": 2.8993988011353112e-05, "epoch": 0.47539015606242496, "percentage": 47.54, "elapsed_time": "13:18:54", "remaining_time": "14:41:37", "throughput": 1691.89, "total_tokens": 81100800} +{"current_steps": 9910, "total_steps": 20825, "loss": 0.9003, "learning_rate": 2.8954875296419364e-05, "epoch": 0.4758703481392557, "percentage": 47.59, "elapsed_time": "13:19:47", "remaining_time": "14:40:53", "throughput": 1691.76, "total_tokens": 81182720} +{"current_steps": 9920, "total_steps": 20825, "loss": 0.9797, "learning_rate": 2.8915752650186635e-05, "epoch": 0.4763505402160864, "percentage": 47.64, "elapsed_time": "13:20:39", "remaining_time": "14:40:09", "throughput": 1691.61, "total_tokens": 81264640} +{"current_steps": 9930, "total_steps": 20825, "loss": 0.7935, "learning_rate": 2.8876620170897895e-05, "epoch": 0.47683073229291717, "percentage": 47.68, "elapsed_time": "13:21:31", "remaining_time": "14:39:25", "throughput": 1691.49, "total_tokens": 81346560} +{"current_steps": 9940, "total_steps": 20825, "loss": 0.8632, "learning_rate": 2.88374779568208e-05, "epoch": 0.4773109243697479, "percentage": 47.73, "elapsed_time": "13:22:24", "remaining_time": "14:38:41", "throughput": 1691.35, "total_tokens": 81428480} +{"current_steps": 9950, "total_steps": 20825, "loss": 0.8712, "learning_rate": 2.879832610624747e-05, "epoch": 0.4777911164465786, "percentage": 47.78, "elapsed_time": "13:23:16", "remaining_time": "14:37:57", "throughput": 1691.21, "total_tokens": 81510400} +{"current_steps": 9960, "total_steps": 20825, "loss": 0.8157, "learning_rate": 2.8759164717494202e-05, "epoch": 0.4782713085234094, "percentage": 47.83, "elapsed_time": "13:24:08", "remaining_time": "14:37:12", "throughput": 1691.08, "total_tokens": 81592320} +{"current_steps": 9970, "total_steps": 20825, "loss": 1.05, "learning_rate": 2.8719993888901258e-05, "epoch": 0.4787515006002401, "percentage": 47.88, "elapsed_time": "13:24:59", "remaining_time": "14:36:27", "throughput": 1690.98, "total_tokens": 81674240} +{"current_steps": 9980, "total_steps": 20825, "loss": 0.8731, "learning_rate": 2.86808137188326e-05, "epoch": 0.47923169267707083, "percentage": 47.92, "elapsed_time": "13:25:51", "remaining_time": "14:35:42", "throughput": 1690.88, "total_tokens": 81756160} +{"current_steps": 9990, "total_steps": 20825, "loss": 0.9884, "learning_rate": 2.8641624305675657e-05, "epoch": 0.4797118847539016, "percentage": 47.97, "elapsed_time": "13:26:42", "remaining_time": "14:34:56", "throughput": 1690.79, "total_tokens": 81838080} +{"current_steps": 10000, "total_steps": 20825, "loss": 0.7331, "learning_rate": 2.8602425747841057e-05, "epoch": 0.4801920768307323, "percentage": 48.02, "elapsed_time": "13:27:34", "remaining_time": "14:34:12", "throughput": 1690.64, "total_tokens": 81920000} +{"current_steps": 10010, "total_steps": 20825, "loss": 0.8353, "learning_rate": 2.8563218143762383e-05, "epoch": 0.48067226890756304, "percentage": 48.07, "elapsed_time": "13:28:31", "remaining_time": "14:33:32", "throughput": 1690.38, "total_tokens": 82001920} +{"current_steps": 10020, "total_steps": 20825, "loss": 0.8458, "learning_rate": 2.852400159189597e-05, "epoch": 0.48115246098439374, "percentage": 48.12, "elapsed_time": "13:29:22", "remaining_time": "14:32:47", "throughput": 1690.26, "total_tokens": 82083840} +{"current_steps": 10030, "total_steps": 20825, "loss": 0.9951, "learning_rate": 2.848477619072059e-05, "epoch": 0.4816326530612245, "percentage": 48.16, "elapsed_time": "13:30:14", "remaining_time": "14:32:02", "throughput": 1690.16, "total_tokens": 82165760} +{"current_steps": 10040, "total_steps": 20825, "loss": 1.0225, "learning_rate": 2.8445542038737245e-05, "epoch": 0.48211284513805525, "percentage": 48.21, "elapsed_time": "13:31:05", "remaining_time": "14:31:16", "throughput": 1690.08, "total_tokens": 82247680} +{"current_steps": 10050, "total_steps": 20825, "loss": 0.9611, "learning_rate": 2.8406299234468915e-05, "epoch": 0.48259303721488594, "percentage": 48.26, "elapsed_time": "13:31:54", "remaining_time": "14:30:29", "throughput": 1690.03, "total_tokens": 82329600} +{"current_steps": 10060, "total_steps": 20825, "loss": 1.0389, "learning_rate": 2.8367047876460305e-05, "epoch": 0.4830732292917167, "percentage": 48.31, "elapsed_time": "13:32:45", "remaining_time": "14:29:42", "throughput": 1689.97, "total_tokens": 82411520} +{"current_steps": 10070, "total_steps": 20825, "loss": 0.9294, "learning_rate": 2.8327788063277594e-05, "epoch": 0.4835534213685474, "percentage": 48.36, "elapsed_time": "13:33:34", "remaining_time": "14:28:55", "throughput": 1689.93, "total_tokens": 82493440} +{"current_steps": 10080, "total_steps": 20825, "loss": 0.8672, "learning_rate": 2.8288519893508212e-05, "epoch": 0.48403361344537815, "percentage": 48.4, "elapsed_time": "13:34:24", "remaining_time": "14:28:08", "throughput": 1689.89, "total_tokens": 82575360} +{"current_steps": 10090, "total_steps": 20825, "loss": 0.805, "learning_rate": 2.8249243465760566e-05, "epoch": 0.4845138055222089, "percentage": 48.45, "elapsed_time": "13:35:14", "remaining_time": "14:27:21", "throughput": 1689.84, "total_tokens": 82657280} +{"current_steps": 10100, "total_steps": 20825, "loss": 0.8885, "learning_rate": 2.8209958878663778e-05, "epoch": 0.4849939975990396, "percentage": 48.5, "elapsed_time": "13:36:04", "remaining_time": "14:26:34", "throughput": 1689.79, "total_tokens": 82739200} +{"current_steps": 10110, "total_steps": 20825, "loss": 0.855, "learning_rate": 2.817066623086748e-05, "epoch": 0.48547418967587036, "percentage": 48.55, "elapsed_time": "13:36:53", "remaining_time": "14:25:46", "throughput": 1689.75, "total_tokens": 82821120} +{"current_steps": 10120, "total_steps": 20825, "loss": 0.8841, "learning_rate": 2.813136562104155e-05, "epoch": 0.48595438175270106, "percentage": 48.6, "elapsed_time": "13:37:43", "remaining_time": "14:24:59", "throughput": 1689.71, "total_tokens": 82903040} +{"current_steps": 10130, "total_steps": 20825, "loss": 0.9228, "learning_rate": 2.8092057147875856e-05, "epoch": 0.4864345738295318, "percentage": 48.64, "elapsed_time": "13:38:33", "remaining_time": "14:24:12", "throughput": 1689.67, "total_tokens": 82984960} +{"current_steps": 10140, "total_steps": 20825, "loss": 0.9771, "learning_rate": 2.8052740910079994e-05, "epoch": 0.48691476590636257, "percentage": 48.69, "elapsed_time": "13:39:22", "remaining_time": "14:23:25", "throughput": 1689.62, "total_tokens": 83066880} +{"current_steps": 10150, "total_steps": 20825, "loss": 0.9318, "learning_rate": 2.8013417006383076e-05, "epoch": 0.48739495798319327, "percentage": 48.74, "elapsed_time": "13:40:13", "remaining_time": "14:22:38", "throughput": 1689.56, "total_tokens": 83148800} +{"current_steps": 10160, "total_steps": 20825, "loss": 0.8569, "learning_rate": 2.7974085535533473e-05, "epoch": 0.487875150060024, "percentage": 48.79, "elapsed_time": "13:41:02", "remaining_time": "14:21:51", "throughput": 1689.52, "total_tokens": 83230720} +{"current_steps": 10170, "total_steps": 20825, "loss": 1.0495, "learning_rate": 2.7934746596298535e-05, "epoch": 0.4883553421368547, "percentage": 48.84, "elapsed_time": "13:41:52", "remaining_time": "14:21:04", "throughput": 1689.47, "total_tokens": 83312640} +{"current_steps": 10180, "total_steps": 20825, "loss": 0.8839, "learning_rate": 2.789540028746438e-05, "epoch": 0.4888355342136855, "percentage": 48.88, "elapsed_time": "13:42:42", "remaining_time": "14:20:17", "throughput": 1689.42, "total_tokens": 83394560} +{"current_steps": 10190, "total_steps": 20825, "loss": 0.9594, "learning_rate": 2.785604670783563e-05, "epoch": 0.48931572629051623, "percentage": 48.93, "elapsed_time": "13:43:32", "remaining_time": "14:19:30", "throughput": 1689.39, "total_tokens": 83476480} +{"current_steps": 10200, "total_steps": 20825, "loss": 0.7835, "learning_rate": 2.7816685956235165e-05, "epoch": 0.4897959183673469, "percentage": 48.98, "elapsed_time": "13:44:21", "remaining_time": "14:18:42", "throughput": 1689.35, "total_tokens": 83558400} +{"current_steps": 10210, "total_steps": 20825, "loss": 0.9379, "learning_rate": 2.7777318131503873e-05, "epoch": 0.4902761104441777, "percentage": 49.03, "elapsed_time": "13:45:11", "remaining_time": "14:17:55", "throughput": 1689.3, "total_tokens": 83640320} +{"current_steps": 10220, "total_steps": 20825, "loss": 0.767, "learning_rate": 2.773794333250041e-05, "epoch": 0.4907563025210084, "percentage": 49.08, "elapsed_time": "13:46:01", "remaining_time": "14:17:08", "throughput": 1689.26, "total_tokens": 83722240} +{"current_steps": 10230, "total_steps": 20825, "loss": 0.9591, "learning_rate": 2.769856165810093e-05, "epoch": 0.49123649459783914, "percentage": 49.12, "elapsed_time": "13:46:51", "remaining_time": "14:16:21", "throughput": 1689.21, "total_tokens": 83804160} +{"current_steps": 10240, "total_steps": 20825, "loss": 0.929, "learning_rate": 2.765917320719887e-05, "epoch": 0.4917166866746699, "percentage": 49.17, "elapsed_time": "13:47:41", "remaining_time": "14:15:34", "throughput": 1689.16, "total_tokens": 83886080} +{"current_steps": 10250, "total_steps": 20825, "loss": 0.8609, "learning_rate": 2.7619778078704685e-05, "epoch": 0.4921968787515006, "percentage": 49.22, "elapsed_time": "13:48:31", "remaining_time": "14:14:47", "throughput": 1689.12, "total_tokens": 83968000} +{"current_steps": 10260, "total_steps": 20825, "loss": 0.7207, "learning_rate": 2.7580376371545573e-05, "epoch": 0.49267707082833134, "percentage": 49.27, "elapsed_time": "13:49:22", "remaining_time": "14:14:01", "throughput": 1689.02, "total_tokens": 84049920} +{"current_steps": 10270, "total_steps": 20825, "loss": 0.8415, "learning_rate": 2.7540968184665283e-05, "epoch": 0.49315726290516204, "percentage": 49.32, "elapsed_time": "13:50:15", "remaining_time": "14:13:17", "throughput": 1688.88, "total_tokens": 84131840} +{"current_steps": 10280, "total_steps": 20825, "loss": 0.9007, "learning_rate": 2.7501553617023816e-05, "epoch": 0.4936374549819928, "percentage": 49.36, "elapsed_time": "13:51:07", "remaining_time": "14:12:32", "throughput": 1688.76, "total_tokens": 84213760} +{"current_steps": 10290, "total_steps": 20825, "loss": 0.8125, "learning_rate": 2.7462132767597205e-05, "epoch": 0.49411764705882355, "percentage": 49.41, "elapsed_time": "13:51:59", "remaining_time": "14:11:47", "throughput": 1688.64, "total_tokens": 84295680} +{"current_steps": 10300, "total_steps": 20825, "loss": 0.8609, "learning_rate": 2.742270573537724e-05, "epoch": 0.49459783913565425, "percentage": 49.46, "elapsed_time": "13:52:50", "remaining_time": "14:11:02", "throughput": 1688.54, "total_tokens": 84377600} +{"current_steps": 10310, "total_steps": 20825, "loss": 0.9997, "learning_rate": 2.7383272619371276e-05, "epoch": 0.495078031212485, "percentage": 49.51, "elapsed_time": "13:53:41", "remaining_time": "14:10:16", "throughput": 1688.45, "total_tokens": 84459520} +{"current_steps": 10320, "total_steps": 20825, "loss": 0.8754, "learning_rate": 2.7343833518601913e-05, "epoch": 0.4955582232893157, "percentage": 49.56, "elapsed_time": "13:54:32", "remaining_time": "14:09:29", "throughput": 1688.4, "total_tokens": 84541440} +{"current_steps": 10330, "total_steps": 20825, "loss": 1.121, "learning_rate": 2.7304388532106768e-05, "epoch": 0.49603841536614646, "percentage": 49.6, "elapsed_time": "13:55:25", "remaining_time": "14:08:45", "throughput": 1688.25, "total_tokens": 84623360} +{"current_steps": 10340, "total_steps": 20825, "loss": 0.7872, "learning_rate": 2.726493775893828e-05, "epoch": 0.4965186074429772, "percentage": 49.65, "elapsed_time": "13:56:15", "remaining_time": "14:07:58", "throughput": 1688.19, "total_tokens": 84705280} +{"current_steps": 10350, "total_steps": 20825, "loss": 0.9003, "learning_rate": 2.7225481298163387e-05, "epoch": 0.4969987995198079, "percentage": 49.7, "elapsed_time": "13:57:06", "remaining_time": "14:07:12", "throughput": 1688.11, "total_tokens": 84787200} +{"current_steps": 10360, "total_steps": 20825, "loss": 1.0785, "learning_rate": 2.718601924886332e-05, "epoch": 0.49747899159663866, "percentage": 49.75, "elapsed_time": "13:57:58", "remaining_time": "14:06:28", "throughput": 1687.97, "total_tokens": 84869120} +{"current_steps": 10370, "total_steps": 20825, "loss": 0.8888, "learning_rate": 2.7146551710133346e-05, "epoch": 0.49795918367346936, "percentage": 49.8, "elapsed_time": "13:58:50", "remaining_time": "14:05:43", "throughput": 1687.86, "total_tokens": 84951040} +{"current_steps": 10380, "total_steps": 20825, "loss": 0.8726, "learning_rate": 2.7107078781082508e-05, "epoch": 0.4984393757503001, "percentage": 49.84, "elapsed_time": "13:59:43", "remaining_time": "14:04:58", "throughput": 1687.72, "total_tokens": 85032960} +{"current_steps": 10390, "total_steps": 20825, "loss": 0.942, "learning_rate": 2.7067600560833384e-05, "epoch": 0.49891956782713087, "percentage": 49.89, "elapsed_time": "14:00:35", "remaining_time": "14:04:14", "throughput": 1687.59, "total_tokens": 85114880} +{"current_steps": 10400, "total_steps": 20825, "loss": 0.8575, "learning_rate": 2.7028117148521863e-05, "epoch": 0.49939975990396157, "percentage": 49.94, "elapsed_time": "14:01:28", "remaining_time": "14:03:29", "throughput": 1687.46, "total_tokens": 85196800} +{"current_steps": 10410, "total_steps": 20825, "loss": 0.9079, "learning_rate": 2.698862864329685e-05, "epoch": 0.4998799519807923, "percentage": 49.99, "elapsed_time": "14:02:21", "remaining_time": "14:02:45", "throughput": 1687.3, "total_tokens": 85278720} +{"current_steps": 10420, "total_steps": 20825, "loss": 0.9877, "learning_rate": 2.6949135144320026e-05, "epoch": 0.5003601440576231, "percentage": 50.04, "elapsed_time": "14:03:12", "remaining_time": "14:02:00", "throughput": 1687.2, "total_tokens": 85360640} +{"current_steps": 10430, "total_steps": 20825, "loss": 0.8622, "learning_rate": 2.6909636750765653e-05, "epoch": 0.5008403361344538, "percentage": 50.08, "elapsed_time": "14:04:03", "remaining_time": "14:01:13", "throughput": 1687.15, "total_tokens": 85442560} +{"current_steps": 10440, "total_steps": 20825, "loss": 0.9352, "learning_rate": 2.6870133561820243e-05, "epoch": 0.5013205282112845, "percentage": 50.13, "elapsed_time": "14:04:53", "remaining_time": "14:00:26", "throughput": 1687.09, "total_tokens": 85524480} +{"current_steps": 10450, "total_steps": 20825, "loss": 1.031, "learning_rate": 2.683062567668238e-05, "epoch": 0.5018007202881153, "percentage": 50.18, "elapsed_time": "14:05:44", "remaining_time": "13:59:39", "throughput": 1687.02, "total_tokens": 85606400} +{"current_steps": 10460, "total_steps": 20825, "loss": 0.8878, "learning_rate": 2.679111319456242e-05, "epoch": 0.502280912364946, "percentage": 50.23, "elapsed_time": "14:06:34", "remaining_time": "13:58:52", "throughput": 1686.97, "total_tokens": 85688320} +{"current_steps": 10470, "total_steps": 20825, "loss": 0.6566, "learning_rate": 2.6751596214682278e-05, "epoch": 0.5027611044417767, "percentage": 50.28, "elapsed_time": "14:07:24", "remaining_time": "13:58:06", "throughput": 1686.91, "total_tokens": 85770240} +{"current_steps": 10480, "total_steps": 20825, "loss": 0.9173, "learning_rate": 2.671207483627515e-05, "epoch": 0.5032412965186075, "percentage": 50.32, "elapsed_time": "14:08:19", "remaining_time": "13:57:23", "throughput": 1686.7, "total_tokens": 85852160} +{"current_steps": 10490, "total_steps": 20825, "loss": 0.8325, "learning_rate": 2.6672549158585293e-05, "epoch": 0.5037214885954382, "percentage": 50.37, "elapsed_time": "14:09:12", "remaining_time": "13:56:39", "throughput": 1686.56, "total_tokens": 85934080} +{"current_steps": 10500, "total_steps": 20825, "loss": 0.7438, "learning_rate": 2.663301928086774e-05, "epoch": 0.5042016806722689, "percentage": 50.42, "elapsed_time": "14:10:06", "remaining_time": "13:55:56", "throughput": 1686.39, "total_tokens": 86016000} +{"current_steps": 10510, "total_steps": 20825, "loss": 0.8527, "learning_rate": 2.6593485302388087e-05, "epoch": 0.5046818727490996, "percentage": 50.47, "elapsed_time": "14:10:58", "remaining_time": "13:55:10", "throughput": 1686.27, "total_tokens": 86097920} +{"current_steps": 10520, "total_steps": 20825, "loss": 0.9448, "learning_rate": 2.6553947322422223e-05, "epoch": 0.5051620648259304, "percentage": 50.52, "elapsed_time": "14:11:51", "remaining_time": "13:54:26", "throughput": 1686.12, "total_tokens": 86179840} +{"current_steps": 10530, "total_steps": 20825, "loss": 0.8656, "learning_rate": 2.6514405440256086e-05, "epoch": 0.5056422569027611, "percentage": 50.56, "elapsed_time": "14:12:44", "remaining_time": "13:53:42", "throughput": 1685.96, "total_tokens": 86261760} +{"current_steps": 10540, "total_steps": 20825, "loss": 0.9212, "learning_rate": 2.6474859755185415e-05, "epoch": 0.5061224489795918, "percentage": 50.61, "elapsed_time": "14:13:38", "remaining_time": "13:52:59", "throughput": 1685.78, "total_tokens": 86343680} +{"current_steps": 10550, "total_steps": 20825, "loss": 0.9893, "learning_rate": 2.6435310366515498e-05, "epoch": 0.5066026410564226, "percentage": 50.66, "elapsed_time": "14:14:32", "remaining_time": "13:52:16", "throughput": 1685.6, "total_tokens": 86425600} +{"current_steps": 10560, "total_steps": 20825, "loss": 1.0323, "learning_rate": 2.6395757373560904e-05, "epoch": 0.5070828331332533, "percentage": 50.71, "elapsed_time": "14:15:27", "remaining_time": "13:51:33", "throughput": 1685.41, "total_tokens": 86507520} +{"current_steps": 10570, "total_steps": 20825, "loss": 0.9709, "learning_rate": 2.6356200875645287e-05, "epoch": 0.507563025210084, "percentage": 50.76, "elapsed_time": "14:16:19", "remaining_time": "13:50:48", "throughput": 1685.29, "total_tokens": 86589440} +{"current_steps": 10580, "total_steps": 20825, "loss": 0.7823, "learning_rate": 2.631664097210108e-05, "epoch": 0.5080432172869148, "percentage": 50.8, "elapsed_time": "14:17:11", "remaining_time": "13:50:03", "throughput": 1685.18, "total_tokens": 86671360} +{"current_steps": 10590, "total_steps": 20825, "loss": 0.7174, "learning_rate": 2.6277077762269276e-05, "epoch": 0.5085234093637455, "percentage": 50.85, "elapsed_time": "14:18:03", "remaining_time": "13:49:17", "throughput": 1685.06, "total_tokens": 86753280} +{"current_steps": 10600, "total_steps": 20825, "loss": 0.8513, "learning_rate": 2.6237511345499167e-05, "epoch": 0.5090036014405762, "percentage": 50.9, "elapsed_time": "14:18:58", "remaining_time": "13:48:34", "throughput": 1684.87, "total_tokens": 86835200} +{"current_steps": 10610, "total_steps": 20825, "loss": 0.8895, "learning_rate": 2.61979418211481e-05, "epoch": 0.5094837935174069, "percentage": 50.95, "elapsed_time": "14:19:52", "remaining_time": "13:47:51", "throughput": 1684.69, "total_tokens": 86917120} +{"current_steps": 10620, "total_steps": 20825, "loss": 0.9501, "learning_rate": 2.615836928858122e-05, "epoch": 0.5099639855942377, "percentage": 51.0, "elapsed_time": "14:20:45", "remaining_time": "13:47:07", "throughput": 1684.53, "total_tokens": 86999040} +{"current_steps": 10630, "total_steps": 20825, "loss": 0.7757, "learning_rate": 2.6118793847171236e-05, "epoch": 0.5104441776710684, "percentage": 51.04, "elapsed_time": "14:21:38", "remaining_time": "13:46:22", "throughput": 1684.4, "total_tokens": 87080960} +{"current_steps": 10640, "total_steps": 20825, "loss": 1.0115, "learning_rate": 2.607921559629816e-05, "epoch": 0.5109243697478991, "percentage": 51.09, "elapsed_time": "14:22:30", "remaining_time": "13:45:37", "throughput": 1684.29, "total_tokens": 87162880} +{"current_steps": 10650, "total_steps": 20825, "loss": 0.9044, "learning_rate": 2.6039634635349043e-05, "epoch": 0.5114045618247299, "percentage": 51.14, "elapsed_time": "14:23:25", "remaining_time": "13:44:54", "throughput": 1684.09, "total_tokens": 87244800} +{"current_steps": 10660, "total_steps": 20825, "loss": 0.8815, "learning_rate": 2.6000051063717767e-05, "epoch": 0.5118847539015606, "percentage": 51.19, "elapsed_time": "14:24:20", "remaining_time": "13:44:12", "throughput": 1683.88, "total_tokens": 87326720} +{"current_steps": 10670, "total_steps": 20825, "loss": 0.8555, "learning_rate": 2.596046498080475e-05, "epoch": 0.5123649459783913, "percentage": 51.24, "elapsed_time": "14:25:14", "remaining_time": "13:43:28", "throughput": 1683.7, "total_tokens": 87408640} +{"current_steps": 10680, "total_steps": 20825, "loss": 0.9126, "learning_rate": 2.5920876486016726e-05, "epoch": 0.5128451380552221, "percentage": 51.28, "elapsed_time": "14:26:13", "remaining_time": "13:42:50", "throughput": 1683.36, "total_tokens": 87490560} +{"current_steps": 10690, "total_steps": 20825, "loss": 0.8932, "learning_rate": 2.5881285678766482e-05, "epoch": 0.5133253301320528, "percentage": 51.33, "elapsed_time": "14:27:06", "remaining_time": "13:42:05", "throughput": 1683.22, "total_tokens": 87572480} +{"current_steps": 10700, "total_steps": 20825, "loss": 0.8166, "learning_rate": 2.5841692658472617e-05, "epoch": 0.5138055222088835, "percentage": 51.38, "elapsed_time": "14:28:00", "remaining_time": "13:41:22", "throughput": 1683.04, "total_tokens": 87654400} +{"current_steps": 10710, "total_steps": 20825, "loss": 1.0928, "learning_rate": 2.5802097524559264e-05, "epoch": 0.5142857142857142, "percentage": 51.43, "elapsed_time": "14:28:55", "remaining_time": "13:40:38", "throughput": 1682.86, "total_tokens": 87736320} +{"current_steps": 10720, "total_steps": 20825, "loss": 0.8714, "learning_rate": 2.5762500376455912e-05, "epoch": 0.514765906362545, "percentage": 51.48, "elapsed_time": "14:29:52", "remaining_time": "13:39:58", "throughput": 1682.57, "total_tokens": 87818240} +{"current_steps": 10730, "total_steps": 20825, "loss": 0.8432, "learning_rate": 2.5722901313597052e-05, "epoch": 0.5152460984393757, "percentage": 51.52, "elapsed_time": "14:30:48", "remaining_time": "13:39:16", "throughput": 1682.35, "total_tokens": 87900160} +{"current_steps": 10740, "total_steps": 20825, "loss": 0.8825, "learning_rate": 2.5683300435422032e-05, "epoch": 0.5157262905162064, "percentage": 51.57, "elapsed_time": "14:31:41", "remaining_time": "13:38:31", "throughput": 1682.2, "total_tokens": 87982080} +{"current_steps": 10750, "total_steps": 20825, "loss": 0.8147, "learning_rate": 2.564369784137472e-05, "epoch": 0.5162064825930373, "percentage": 51.62, "elapsed_time": "14:32:37", "remaining_time": "13:37:49", "throughput": 1681.98, "total_tokens": 88064000} +{"current_steps": 10760, "total_steps": 20825, "loss": 0.8252, "learning_rate": 2.5604093630903307e-05, "epoch": 0.516686674669868, "percentage": 51.67, "elapsed_time": "14:33:35", "remaining_time": "13:37:10", "throughput": 1681.67, "total_tokens": 88145920} +{"current_steps": 10770, "total_steps": 20825, "loss": 0.7476, "learning_rate": 2.556448790346006e-05, "epoch": 0.5171668667466987, "percentage": 51.72, "elapsed_time": "14:34:33", "remaining_time": "13:36:29", "throughput": 1681.39, "total_tokens": 88227840} +{"current_steps": 10780, "total_steps": 20825, "loss": 1.0129, "learning_rate": 2.5524880758501035e-05, "epoch": 0.5176470588235295, "percentage": 51.76, "elapsed_time": "14:35:28", "remaining_time": "13:35:47", "throughput": 1681.17, "total_tokens": 88309760} +{"current_steps": 10790, "total_steps": 20825, "loss": 0.9356, "learning_rate": 2.5485272295485846e-05, "epoch": 0.5181272509003602, "percentage": 51.81, "elapsed_time": "14:36:24", "remaining_time": "13:35:05", "throughput": 1680.93, "total_tokens": 88391680} +{"current_steps": 10800, "total_steps": 20825, "loss": 0.7554, "learning_rate": 2.544566261387743e-05, "epoch": 0.5186074429771909, "percentage": 51.86, "elapsed_time": "14:37:23", "remaining_time": "13:34:25", "throughput": 1680.62, "total_tokens": 88473600} +{"current_steps": 10810, "total_steps": 20825, "loss": 0.8429, "learning_rate": 2.5406051813141773e-05, "epoch": 0.5190876350540216, "percentage": 51.91, "elapsed_time": "14:38:22", "remaining_time": "13:33:46", "throughput": 1680.3, "total_tokens": 88555520} +{"current_steps": 10820, "total_steps": 20825, "loss": 0.8418, "learning_rate": 2.5366439992747688e-05, "epoch": 0.5195678271308524, "percentage": 51.96, "elapsed_time": "14:39:21", "remaining_time": "13:33:07", "throughput": 1679.95, "total_tokens": 88637440} +{"current_steps": 10830, "total_steps": 20825, "loss": 0.873, "learning_rate": 2.5326827252166523e-05, "epoch": 0.5200480192076831, "percentage": 52.0, "elapsed_time": "14:40:12", "remaining_time": "13:32:20", "throughput": 1679.89, "total_tokens": 88719360} +{"current_steps": 10840, "total_steps": 20825, "loss": 0.8453, "learning_rate": 2.5287213690871957e-05, "epoch": 0.5205282112845138, "percentage": 52.05, "elapsed_time": "14:40:59", "remaining_time": "13:31:30", "throughput": 1679.94, "total_tokens": 88801280} +{"current_steps": 10850, "total_steps": 20825, "loss": 0.8937, "learning_rate": 2.5247599408339723e-05, "epoch": 0.5210084033613446, "percentage": 52.1, "elapsed_time": "14:41:47", "remaining_time": "13:30:40", "throughput": 1679.98, "total_tokens": 88883200} +{"current_steps": 10860, "total_steps": 20825, "loss": 0.8389, "learning_rate": 2.5207984504047365e-05, "epoch": 0.5214885954381753, "percentage": 52.15, "elapsed_time": "14:42:35", "remaining_time": "13:29:51", "throughput": 1680.0, "total_tokens": 88965120} +{"current_steps": 10870, "total_steps": 20825, "loss": 0.7679, "learning_rate": 2.5168369077474004e-05, "epoch": 0.521968787515006, "percentage": 52.2, "elapsed_time": "14:43:24", "remaining_time": "13:29:03", "throughput": 1679.98, "total_tokens": 89047040} +{"current_steps": 10880, "total_steps": 20825, "loss": 0.9431, "learning_rate": 2.512875322810002e-05, "epoch": 0.5224489795918368, "percentage": 52.24, "elapsed_time": "14:44:15", "remaining_time": "13:28:16", "throughput": 1679.92, "total_tokens": 89128960} +{"current_steps": 10890, "total_steps": 20825, "loss": 0.8919, "learning_rate": 2.508913705540693e-05, "epoch": 0.5229291716686675, "percentage": 52.29, "elapsed_time": "14:45:06", "remaining_time": "13:27:29", "throughput": 1679.84, "total_tokens": 89210880} +{"current_steps": 10900, "total_steps": 20825, "loss": 0.841, "learning_rate": 2.504952065887701e-05, "epoch": 0.5234093637454982, "percentage": 52.34, "elapsed_time": "14:45:55", "remaining_time": "13:26:40", "throughput": 1679.83, "total_tokens": 89292800} +{"current_steps": 10910, "total_steps": 20825, "loss": 0.904, "learning_rate": 2.5009904137993106e-05, "epoch": 0.5238895558223289, "percentage": 52.39, "elapsed_time": "14:46:43", "remaining_time": "13:25:51", "throughput": 1679.87, "total_tokens": 89374720} +{"current_steps": 10920, "total_steps": 20825, "loss": 1.042, "learning_rate": 2.497028759223839e-05, "epoch": 0.5243697478991597, "percentage": 52.44, "elapsed_time": "14:47:31", "remaining_time": "13:25:01", "throughput": 1679.9, "total_tokens": 89456640} +{"current_steps": 10930, "total_steps": 20825, "loss": 0.9832, "learning_rate": 2.4930671121096105e-05, "epoch": 0.5248499399759904, "percentage": 52.48, "elapsed_time": "14:48:17", "remaining_time": "13:24:10", "throughput": 1679.98, "total_tokens": 89538560} +{"current_steps": 10940, "total_steps": 20825, "loss": 0.7118, "learning_rate": 2.4891054824049264e-05, "epoch": 0.5253301320528211, "percentage": 52.53, "elapsed_time": "14:49:03", "remaining_time": "13:23:19", "throughput": 1680.05, "total_tokens": 89620480} +{"current_steps": 10950, "total_steps": 20825, "loss": 0.864, "learning_rate": 2.485143880058049e-05, "epoch": 0.5258103241296519, "percentage": 52.58, "elapsed_time": "14:49:52", "remaining_time": "13:22:30", "throughput": 1680.05, "total_tokens": 89702400} +{"current_steps": 10960, "total_steps": 20825, "loss": 0.8928, "learning_rate": 2.4811823150171692e-05, "epoch": 0.5262905162064826, "percentage": 52.63, "elapsed_time": "14:50:40", "remaining_time": "13:21:41", "throughput": 1680.08, "total_tokens": 89784320} +{"current_steps": 10970, "total_steps": 20825, "loss": 1.0436, "learning_rate": 2.477220797230385e-05, "epoch": 0.5267707082833133, "percentage": 52.68, "elapsed_time": "14:51:29", "remaining_time": "13:20:52", "throughput": 1680.07, "total_tokens": 89866240} +{"current_steps": 10980, "total_steps": 20825, "loss": 1.1344, "learning_rate": 2.4732593366456755e-05, "epoch": 0.5272509003601441, "percentage": 52.73, "elapsed_time": "14:52:17", "remaining_time": "13:20:03", "throughput": 1680.09, "total_tokens": 89948160} +{"current_steps": 10990, "total_steps": 20825, "loss": 0.9068, "learning_rate": 2.4692979432108777e-05, "epoch": 0.5277310924369748, "percentage": 52.77, "elapsed_time": "14:53:04", "remaining_time": "13:19:13", "throughput": 1680.14, "total_tokens": 90030080} +{"current_steps": 11000, "total_steps": 20825, "loss": 1.0396, "learning_rate": 2.4653366268736565e-05, "epoch": 0.5282112845138055, "percentage": 52.82, "elapsed_time": "14:53:52", "remaining_time": "13:18:23", "throughput": 1680.16, "total_tokens": 90112000} +{"current_steps": 11010, "total_steps": 20825, "loss": 0.7987, "learning_rate": 2.461375397581487e-05, "epoch": 0.5286914765906362, "percentage": 52.87, "elapsed_time": "14:54:43", "remaining_time": "13:17:36", "throughput": 1680.11, "total_tokens": 90193920} +{"current_steps": 11020, "total_steps": 20825, "loss": 0.8519, "learning_rate": 2.4574142652816238e-05, "epoch": 0.529171668667467, "percentage": 52.92, "elapsed_time": "14:55:29", "remaining_time": "13:16:45", "throughput": 1680.19, "total_tokens": 90275840} +{"current_steps": 11030, "total_steps": 20825, "loss": 0.7499, "learning_rate": 2.453453239921077e-05, "epoch": 0.5296518607442977, "percentage": 52.97, "elapsed_time": "14:56:17", "remaining_time": "13:15:56", "throughput": 1680.21, "total_tokens": 90357760} +{"current_steps": 11040, "total_steps": 20825, "loss": 0.7552, "learning_rate": 2.44949233144659e-05, "epoch": 0.5301320528211284, "percentage": 53.01, "elapsed_time": "14:57:06", "remaining_time": "13:15:07", "throughput": 1680.22, "total_tokens": 90439680} +{"current_steps": 11050, "total_steps": 20825, "loss": 0.8187, "learning_rate": 2.4455315498046134e-05, "epoch": 0.5306122448979592, "percentage": 53.06, "elapsed_time": "14:57:52", "remaining_time": "13:14:16", "throughput": 1680.3, "total_tokens": 90521600} +{"current_steps": 11060, "total_steps": 20825, "loss": 0.8756, "learning_rate": 2.4415709049412757e-05, "epoch": 0.5310924369747899, "percentage": 53.11, "elapsed_time": "14:58:41", "remaining_time": "13:13:27", "throughput": 1680.29, "total_tokens": 90603520} +{"current_steps": 11070, "total_steps": 20825, "loss": 0.8821, "learning_rate": 2.437610406802365e-05, "epoch": 0.5315726290516206, "percentage": 53.16, "elapsed_time": "14:59:29", "remaining_time": "13:12:38", "throughput": 1680.3, "total_tokens": 90685440} +{"current_steps": 11080, "total_steps": 20825, "loss": 0.9912, "learning_rate": 2.4336500653333012e-05, "epoch": 0.5320528211284514, "percentage": 53.21, "elapsed_time": "15:00:15", "remaining_time": "13:11:47", "throughput": 1680.38, "total_tokens": 90767360} +{"current_steps": 11090, "total_steps": 20825, "loss": 0.9691, "learning_rate": 2.4296898904791076e-05, "epoch": 0.5325330132052821, "percentage": 53.25, "elapsed_time": "15:01:04", "remaining_time": "13:10:58", "throughput": 1680.39, "total_tokens": 90849280} +{"current_steps": 11100, "total_steps": 20825, "loss": 0.8621, "learning_rate": 2.425729892184393e-05, "epoch": 0.5330132052821128, "percentage": 53.3, "elapsed_time": "15:01:52", "remaining_time": "13:10:09", "throughput": 1680.42, "total_tokens": 90931200} +{"current_steps": 11110, "total_steps": 20825, "loss": 1.1661, "learning_rate": 2.421770080393321e-05, "epoch": 0.5334933973589436, "percentage": 53.35, "elapsed_time": "15:02:40", "remaining_time": "13:09:20", "throughput": 1680.42, "total_tokens": 91013120} +{"current_steps": 11120, "total_steps": 20825, "loss": 0.9819, "learning_rate": 2.417810465049585e-05, "epoch": 0.5339735894357743, "percentage": 53.4, "elapsed_time": "15:03:27", "remaining_time": "13:08:29", "throughput": 1680.5, "total_tokens": 91095040} +{"current_steps": 11130, "total_steps": 20825, "loss": 0.7812, "learning_rate": 2.413851056096388e-05, "epoch": 0.534453781512605, "percentage": 53.45, "elapsed_time": "15:04:15", "remaining_time": "13:07:40", "throughput": 1680.51, "total_tokens": 91176960} +{"current_steps": 11140, "total_steps": 20825, "loss": 0.8706, "learning_rate": 2.4098918634764153e-05, "epoch": 0.5349339735894357, "percentage": 53.49, "elapsed_time": "15:05:03", "remaining_time": "13:06:51", "throughput": 1680.52, "total_tokens": 91258880} +{"current_steps": 11150, "total_steps": 20825, "loss": 1.015, "learning_rate": 2.4059328971318053e-05, "epoch": 0.5354141656662665, "percentage": 53.54, "elapsed_time": "15:05:50", "remaining_time": "13:06:00", "throughput": 1680.58, "total_tokens": 91340800} +{"current_steps": 11160, "total_steps": 20825, "loss": 0.9073, "learning_rate": 2.4019741670041305e-05, "epoch": 0.5358943577430972, "percentage": 53.59, "elapsed_time": "15:06:37", "remaining_time": "13:05:09", "throughput": 1680.66, "total_tokens": 91422720} +{"current_steps": 11170, "total_steps": 20825, "loss": 0.9643, "learning_rate": 2.398015683034371e-05, "epoch": 0.5363745498199279, "percentage": 53.64, "elapsed_time": "15:07:23", "remaining_time": "13:04:19", "throughput": 1680.73, "total_tokens": 91504640} +{"current_steps": 11180, "total_steps": 20825, "loss": 0.6964, "learning_rate": 2.394057455162886e-05, "epoch": 0.5368547418967587, "percentage": 53.69, "elapsed_time": "15:08:10", "remaining_time": "13:03:28", "throughput": 1680.79, "total_tokens": 91586560} +{"current_steps": 11190, "total_steps": 20825, "loss": 0.7903, "learning_rate": 2.3900994933293953e-05, "epoch": 0.5373349339735894, "percentage": 53.73, "elapsed_time": "15:08:57", "remaining_time": "13:02:38", "throughput": 1680.83, "total_tokens": 91668480} +{"current_steps": 11200, "total_steps": 20825, "loss": 0.918, "learning_rate": 2.3861418074729476e-05, "epoch": 0.5378151260504201, "percentage": 53.78, "elapsed_time": "15:09:44", "remaining_time": "13:01:48", "throughput": 1680.88, "total_tokens": 91750400} +{"current_steps": 11210, "total_steps": 20825, "loss": 0.8276, "learning_rate": 2.3821844075318993e-05, "epoch": 0.538295318127251, "percentage": 53.83, "elapsed_time": "15:10:31", "remaining_time": "13:00:58", "throughput": 1680.93, "total_tokens": 91832320} +{"current_steps": 11220, "total_steps": 20825, "loss": 0.9665, "learning_rate": 2.378227303443889e-05, "epoch": 0.5387755102040817, "percentage": 53.88, "elapsed_time": "15:11:19", "remaining_time": "13:00:09", "throughput": 1680.95, "total_tokens": 91914240} +{"current_steps": 11230, "total_steps": 20825, "loss": 0.8118, "learning_rate": 2.3742705051458145e-05, "epoch": 0.5392557022809124, "percentage": 53.93, "elapsed_time": "15:12:09", "remaining_time": "12:59:21", "throughput": 1680.92, "total_tokens": 91996160} +{"current_steps": 11240, "total_steps": 20825, "loss": 0.9285, "learning_rate": 2.3703140225738017e-05, "epoch": 0.539735894357743, "percentage": 53.97, "elapsed_time": "15:12:57", "remaining_time": "12:58:32", "throughput": 1680.94, "total_tokens": 92078080} +{"current_steps": 11250, "total_steps": 20825, "loss": 0.814, "learning_rate": 2.3663578656631858e-05, "epoch": 0.5402160864345739, "percentage": 54.02, "elapsed_time": "15:13:45", "remaining_time": "12:57:42", "throughput": 1680.96, "total_tokens": 92160000} +{"current_steps": 11260, "total_steps": 20825, "loss": 0.8016, "learning_rate": 2.362402044348486e-05, "epoch": 0.5406962785114046, "percentage": 54.07, "elapsed_time": "15:14:32", "remaining_time": "12:56:52", "throughput": 1681.01, "total_tokens": 92241920} +{"current_steps": 11270, "total_steps": 20825, "loss": 0.8771, "learning_rate": 2.3584465685633738e-05, "epoch": 0.5411764705882353, "percentage": 54.12, "elapsed_time": "15:15:19", "remaining_time": "12:56:01", "throughput": 1681.08, "total_tokens": 92323840} +{"current_steps": 11280, "total_steps": 20825, "loss": 0.8791, "learning_rate": 2.3544914482406592e-05, "epoch": 0.5416566626650661, "percentage": 54.17, "elapsed_time": "15:16:06", "remaining_time": "12:55:11", "throughput": 1681.13, "total_tokens": 92405760} +{"current_steps": 11290, "total_steps": 20825, "loss": 0.8822, "learning_rate": 2.350536693312255e-05, "epoch": 0.5421368547418968, "percentage": 54.21, "elapsed_time": "15:16:55", "remaining_time": "12:54:23", "throughput": 1681.13, "total_tokens": 92487680} +{"current_steps": 11300, "total_steps": 20825, "loss": 0.8298, "learning_rate": 2.3465823137091572e-05, "epoch": 0.5426170468187275, "percentage": 54.26, "elapsed_time": "15:17:43", "remaining_time": "12:53:34", "throughput": 1681.14, "total_tokens": 92569600} +{"current_steps": 11310, "total_steps": 20825, "loss": 0.8567, "learning_rate": 2.3426283193614208e-05, "epoch": 0.5430972388955583, "percentage": 54.31, "elapsed_time": "15:18:32", "remaining_time": "12:52:45", "throughput": 1681.14, "total_tokens": 92651520} +{"current_steps": 11320, "total_steps": 20825, "loss": 1.1435, "learning_rate": 2.3386747201981338e-05, "epoch": 0.543577430972389, "percentage": 54.36, "elapsed_time": "15:19:21", "remaining_time": "12:51:56", "throughput": 1681.14, "total_tokens": 92733440} +{"current_steps": 11330, "total_steps": 20825, "loss": 0.8503, "learning_rate": 2.3347215261473887e-05, "epoch": 0.5440576230492197, "percentage": 54.41, "elapsed_time": "15:20:08", "remaining_time": "12:51:07", "throughput": 1681.16, "total_tokens": 92815360} +{"current_steps": 11340, "total_steps": 20825, "loss": 0.9992, "learning_rate": 2.330768747136263e-05, "epoch": 0.5445378151260504, "percentage": 54.45, "elapsed_time": "15:20:56", "remaining_time": "12:50:18", "throughput": 1681.19, "total_tokens": 92897280} +{"current_steps": 11350, "total_steps": 20825, "loss": 0.8629, "learning_rate": 2.3268163930907933e-05, "epoch": 0.5450180072028812, "percentage": 54.5, "elapsed_time": "15:21:46", "remaining_time": "12:49:30", "throughput": 1681.15, "total_tokens": 92979200} +{"current_steps": 11360, "total_steps": 20825, "loss": 0.8107, "learning_rate": 2.3228644739359444e-05, "epoch": 0.5454981992797119, "percentage": 54.55, "elapsed_time": "15:22:37", "remaining_time": "12:48:42", "throughput": 1681.11, "total_tokens": 93061120} +{"current_steps": 11370, "total_steps": 20825, "loss": 0.9255, "learning_rate": 2.3189129995955943e-05, "epoch": 0.5459783913565426, "percentage": 54.6, "elapsed_time": "15:23:40", "remaining_time": "12:48:06", "throughput": 1680.65, "total_tokens": 93143040} +{"current_steps": 11380, "total_steps": 20825, "loss": 0.9589, "learning_rate": 2.314961979992501e-05, "epoch": 0.5464585834333734, "percentage": 54.65, "elapsed_time": "15:24:50", "remaining_time": "12:47:34", "throughput": 1680.03, "total_tokens": 93224960} +{"current_steps": 11390, "total_steps": 20825, "loss": 1.0476, "learning_rate": 2.311011425048281e-05, "epoch": 0.5469387755102041, "percentage": 54.69, "elapsed_time": "15:25:59", "remaining_time": "12:47:03", "throughput": 1679.4, "total_tokens": 93306880} +{"current_steps": 11400, "total_steps": 20825, "loss": 0.9967, "learning_rate": 2.3070613446833842e-05, "epoch": 0.5474189675870348, "percentage": 54.74, "elapsed_time": "15:26:59", "remaining_time": "12:46:23", "throughput": 1679.06, "total_tokens": 93388800} +{"current_steps": 11410, "total_steps": 20825, "loss": 0.9432, "learning_rate": 2.30311174881707e-05, "epoch": 0.5478991596638656, "percentage": 54.79, "elapsed_time": "15:27:50", "remaining_time": "12:45:36", "throughput": 1679.01, "total_tokens": 93470720} +{"current_steps": 11420, "total_steps": 20825, "loss": 0.7797, "learning_rate": 2.2991626473673773e-05, "epoch": 0.5483793517406963, "percentage": 54.84, "elapsed_time": "15:28:36", "remaining_time": "12:44:45", "throughput": 1679.09, "total_tokens": 93552640} +{"current_steps": 11430, "total_steps": 20825, "loss": 0.9207, "learning_rate": 2.295214050251108e-05, "epoch": 0.548859543817527, "percentage": 54.89, "elapsed_time": "15:29:22", "remaining_time": "12:43:54", "throughput": 1679.18, "total_tokens": 93634560} +{"current_steps": 11440, "total_steps": 20825, "loss": 0.7837, "learning_rate": 2.2912659673837965e-05, "epoch": 0.5493397358943577, "percentage": 54.93, "elapsed_time": "15:30:09", "remaining_time": "12:43:03", "throughput": 1679.23, "total_tokens": 93716480} +{"current_steps": 11450, "total_steps": 20825, "loss": 0.8649, "learning_rate": 2.2873184086796824e-05, "epoch": 0.5498199279711885, "percentage": 54.98, "elapsed_time": "15:30:57", "remaining_time": "12:42:14", "throughput": 1679.25, "total_tokens": 93798400} +{"current_steps": 11460, "total_steps": 20825, "loss": 1.2096, "learning_rate": 2.283371384051693e-05, "epoch": 0.5503001200480192, "percentage": 55.03, "elapsed_time": "15:31:46", "remaining_time": "12:41:26", "throughput": 1679.23, "total_tokens": 93880320} +{"current_steps": 11470, "total_steps": 20825, "loss": 0.9088, "learning_rate": 2.2794249034114137e-05, "epoch": 0.5507803121248499, "percentage": 55.08, "elapsed_time": "15:32:35", "remaining_time": "12:40:37", "throughput": 1679.22, "total_tokens": 93962240} +{"current_steps": 11480, "total_steps": 20825, "loss": 1.0068, "learning_rate": 2.275478976669062e-05, "epoch": 0.5512605042016807, "percentage": 55.13, "elapsed_time": "15:33:22", "remaining_time": "12:39:47", "throughput": 1679.29, "total_tokens": 94044160} +{"current_steps": 11490, "total_steps": 20825, "loss": 0.9817, "learning_rate": 2.2715336137334657e-05, "epoch": 0.5517406962785114, "percentage": 55.17, "elapsed_time": "15:34:07", "remaining_time": "12:38:55", "throughput": 1679.39, "total_tokens": 94126080} +{"current_steps": 11500, "total_steps": 20825, "loss": 1.0594, "learning_rate": 2.2675888245120382e-05, "epoch": 0.5522208883553421, "percentage": 55.22, "elapsed_time": "15:34:54", "remaining_time": "12:38:05", "throughput": 1679.46, "total_tokens": 94208000} +{"current_steps": 11510, "total_steps": 20825, "loss": 0.9223, "learning_rate": 2.263644618910749e-05, "epoch": 0.5527010804321729, "percentage": 55.27, "elapsed_time": "15:35:44", "remaining_time": "12:37:17", "throughput": 1679.42, "total_tokens": 94289920} +{"current_steps": 11520, "total_steps": 20825, "loss": 0.6925, "learning_rate": 2.2597010068341052e-05, "epoch": 0.5531812725090036, "percentage": 55.32, "elapsed_time": "15:36:32", "remaining_time": "12:36:27", "throughput": 1679.45, "total_tokens": 94371840} +{"current_steps": 11530, "total_steps": 20825, "loss": 0.9426, "learning_rate": 2.255757998185122e-05, "epoch": 0.5536614645858343, "percentage": 55.37, "elapsed_time": "15:37:22", "remaining_time": "12:35:40", "throughput": 1679.4, "total_tokens": 94453760} +{"current_steps": 11540, "total_steps": 20825, "loss": 0.9247, "learning_rate": 2.2518156028652977e-05, "epoch": 0.554141656662665, "percentage": 55.41, "elapsed_time": "15:38:09", "remaining_time": "12:34:49", "throughput": 1679.47, "total_tokens": 94535680} +{"current_steps": 11550, "total_steps": 20825, "loss": 0.7931, "learning_rate": 2.2478738307745938e-05, "epoch": 0.5546218487394958, "percentage": 55.46, "elapsed_time": "15:38:56", "remaining_time": "12:34:00", "throughput": 1679.5, "total_tokens": 94617600} +{"current_steps": 11560, "total_steps": 20825, "loss": 0.9164, "learning_rate": 2.243932691811405e-05, "epoch": 0.5551020408163265, "percentage": 55.51, "elapsed_time": "15:39:44", "remaining_time": "12:33:10", "throughput": 1679.54, "total_tokens": 94699520} +{"current_steps": 11570, "total_steps": 20825, "loss": 0.9756, "learning_rate": 2.2399921958725364e-05, "epoch": 0.5555822328931572, "percentage": 55.56, "elapsed_time": "15:40:30", "remaining_time": "12:32:19", "throughput": 1679.62, "total_tokens": 94781440} +{"current_steps": 11580, "total_steps": 20825, "loss": 1.0529, "learning_rate": 2.236052352853177e-05, "epoch": 0.556062424969988, "percentage": 55.61, "elapsed_time": "15:41:17", "remaining_time": "12:31:29", "throughput": 1679.67, "total_tokens": 94863360} +{"current_steps": 11590, "total_steps": 20825, "loss": 0.9882, "learning_rate": 2.232113172646878e-05, "epoch": 0.5565426170468187, "percentage": 55.65, "elapsed_time": "15:42:03", "remaining_time": "12:30:38", "throughput": 1679.76, "total_tokens": 94945280} +{"current_steps": 11600, "total_steps": 20825, "loss": 0.8608, "learning_rate": 2.2281746651455272e-05, "epoch": 0.5570228091236494, "percentage": 55.7, "elapsed_time": "15:42:49", "remaining_time": "12:29:47", "throughput": 1679.84, "total_tokens": 95027200} +{"current_steps": 11610, "total_steps": 20825, "loss": 1.0607, "learning_rate": 2.2242368402393198e-05, "epoch": 0.5575030012004802, "percentage": 55.75, "elapsed_time": "15:43:35", "remaining_time": "12:28:56", "throughput": 1679.92, "total_tokens": 95109120} +{"current_steps": 11620, "total_steps": 20825, "loss": 0.8243, "learning_rate": 2.220299707816738e-05, "epoch": 0.5579831932773109, "percentage": 55.8, "elapsed_time": "15:44:20", "remaining_time": "12:28:05", "throughput": 1680.01, "total_tokens": 95191040} +{"current_steps": 11630, "total_steps": 20825, "loss": 0.8224, "learning_rate": 2.2163632777645282e-05, "epoch": 0.5584633853541416, "percentage": 55.85, "elapsed_time": "15:45:07", "remaining_time": "12:27:14", "throughput": 1680.08, "total_tokens": 95272960} +{"current_steps": 11640, "total_steps": 20825, "loss": 0.9011, "learning_rate": 2.2124275599676676e-05, "epoch": 0.5589435774309723, "percentage": 55.89, "elapsed_time": "15:45:58", "remaining_time": "12:26:27", "throughput": 1680.02, "total_tokens": 95354880} +{"current_steps": 11650, "total_steps": 20825, "loss": 0.9039, "learning_rate": 2.20849256430935e-05, "epoch": 0.5594237695078031, "percentage": 55.94, "elapsed_time": "15:46:46", "remaining_time": "12:25:37", "throughput": 1680.04, "total_tokens": 95436800} +{"current_steps": 11660, "total_steps": 20825, "loss": 0.9187, "learning_rate": 2.2045583006709536e-05, "epoch": 0.5599039615846338, "percentage": 55.99, "elapsed_time": "15:47:35", "remaining_time": "12:24:49", "throughput": 1680.03, "total_tokens": 95518720} +{"current_steps": 11670, "total_steps": 20825, "loss": 0.8694, "learning_rate": 2.2006247789320162e-05, "epoch": 0.5603841536614645, "percentage": 56.04, "elapsed_time": "15:48:25", "remaining_time": "12:24:01", "throughput": 1679.98, "total_tokens": 95600640} +{"current_steps": 11680, "total_steps": 20825, "loss": 0.9286, "learning_rate": 2.1966920089702157e-05, "epoch": 0.5608643457382954, "percentage": 56.09, "elapsed_time": "15:49:13", "remaining_time": "12:23:12", "throughput": 1680.03, "total_tokens": 95682560} +{"current_steps": 11690, "total_steps": 20825, "loss": 0.8019, "learning_rate": 2.192760000661343e-05, "epoch": 0.561344537815126, "percentage": 56.13, "elapsed_time": "15:50:07", "remaining_time": "12:22:27", "throughput": 1679.86, "total_tokens": 95764480} +{"current_steps": 11700, "total_steps": 20825, "loss": 0.8267, "learning_rate": 2.1888287638792722e-05, "epoch": 0.5618247298919568, "percentage": 56.18, "elapsed_time": "15:50:54", "remaining_time": "12:21:37", "throughput": 1679.91, "total_tokens": 95846400} +{"current_steps": 11710, "total_steps": 20825, "loss": 0.8884, "learning_rate": 2.184898308495943e-05, "epoch": 0.5623049219687876, "percentage": 56.23, "elapsed_time": "15:52:05", "remaining_time": "12:21:06", "throughput": 1679.26, "total_tokens": 95928320} +{"current_steps": 11720, "total_steps": 20825, "loss": 0.992, "learning_rate": 2.180968644381334e-05, "epoch": 0.5627851140456183, "percentage": 56.28, "elapsed_time": "15:53:24", "remaining_time": "12:20:40", "throughput": 1678.36, "total_tokens": 96010240} +{"current_steps": 11730, "total_steps": 20825, "loss": 0.8166, "learning_rate": 2.1770397814034315e-05, "epoch": 0.563265306122449, "percentage": 56.33, "elapsed_time": "15:54:16", "remaining_time": "12:19:54", "throughput": 1678.28, "total_tokens": 96092160} +{"current_steps": 11740, "total_steps": 20825, "loss": 0.9194, "learning_rate": 2.1731117294282166e-05, "epoch": 0.5637454981992797, "percentage": 56.37, "elapsed_time": "15:55:11", "remaining_time": "12:19:10", "throughput": 1678.11, "total_tokens": 96174080} +{"current_steps": 11750, "total_steps": 20825, "loss": 0.8408, "learning_rate": 2.16918449831963e-05, "epoch": 0.5642256902761105, "percentage": 56.42, "elapsed_time": "15:55:58", "remaining_time": "12:18:20", "throughput": 1678.16, "total_tokens": 96256000} +{"current_steps": 11760, "total_steps": 20825, "loss": 0.8308, "learning_rate": 2.165258097939551e-05, "epoch": 0.5647058823529412, "percentage": 56.47, "elapsed_time": "15:56:47", "remaining_time": "12:17:31", "throughput": 1678.14, "total_tokens": 96337920} +{"current_steps": 11770, "total_steps": 20825, "loss": 0.6813, "learning_rate": 2.1613325381477744e-05, "epoch": 0.5651860744297719, "percentage": 56.52, "elapsed_time": "15:57:34", "remaining_time": "12:16:41", "throughput": 1678.2, "total_tokens": 96419840} +{"current_steps": 11780, "total_steps": 20825, "loss": 0.9842, "learning_rate": 2.1574078288019846e-05, "epoch": 0.5656662665066027, "percentage": 56.57, "elapsed_time": "15:58:22", "remaining_time": "12:15:52", "throughput": 1678.21, "total_tokens": 96501760} +{"current_steps": 11790, "total_steps": 20825, "loss": 1.0156, "learning_rate": 2.1534839797577268e-05, "epoch": 0.5661464585834334, "percentage": 56.61, "elapsed_time": "15:59:15", "remaining_time": "12:15:06", "throughput": 1678.09, "total_tokens": 96583680} +{"current_steps": 11800, "total_steps": 20825, "loss": 0.8119, "learning_rate": 2.14956100086839e-05, "epoch": 0.5666266506602641, "percentage": 56.66, "elapsed_time": "16:00:14", "remaining_time": "12:14:25", "throughput": 1677.8, "total_tokens": 96665600} +{"current_steps": 11810, "total_steps": 20825, "loss": 0.8039, "learning_rate": 2.1456389019851762e-05, "epoch": 0.5671068427370949, "percentage": 56.71, "elapsed_time": "16:01:12", "remaining_time": "12:13:43", "throughput": 1677.53, "total_tokens": 96747520} +{"current_steps": 11820, "total_steps": 20825, "loss": 0.8425, "learning_rate": 2.1417176929570768e-05, "epoch": 0.5675870348139256, "percentage": 56.76, "elapsed_time": "16:02:08", "remaining_time": "12:12:59", "throughput": 1677.33, "total_tokens": 96829440} +{"current_steps": 11830, "total_steps": 20825, "loss": 0.8214, "learning_rate": 2.137797383630851e-05, "epoch": 0.5680672268907563, "percentage": 56.81, "elapsed_time": "16:03:02", "remaining_time": "12:12:15", "throughput": 1677.17, "total_tokens": 96911360} +{"current_steps": 11840, "total_steps": 20825, "loss": 0.8337, "learning_rate": 2.1338779838509965e-05, "epoch": 0.568547418967587, "percentage": 56.85, "elapsed_time": "16:03:55", "remaining_time": "12:11:29", "throughput": 1677.06, "total_tokens": 96993280} +{"current_steps": 11850, "total_steps": 20825, "loss": 1.018, "learning_rate": 2.129959503459728e-05, "epoch": 0.5690276110444178, "percentage": 56.9, "elapsed_time": "16:04:50", "remaining_time": "12:10:45", "throughput": 1676.87, "total_tokens": 97075200} +{"current_steps": 11860, "total_steps": 20825, "loss": 0.8476, "learning_rate": 2.126041952296951e-05, "epoch": 0.5695078031212485, "percentage": 56.95, "elapsed_time": "16:05:40", "remaining_time": "12:09:57", "throughput": 1676.83, "total_tokens": 97157120} +{"current_steps": 11870, "total_steps": 20825, "loss": 1.086, "learning_rate": 2.122125340200239e-05, "epoch": 0.5699879951980792, "percentage": 57.0, "elapsed_time": "16:06:40", "remaining_time": "12:09:16", "throughput": 1676.52, "total_tokens": 97239040} +{"current_steps": 11880, "total_steps": 20825, "loss": 1.1085, "learning_rate": 2.1182096770048045e-05, "epoch": 0.57046818727491, "percentage": 57.05, "elapsed_time": "16:07:29", "remaining_time": "12:08:28", "throughput": 1676.52, "total_tokens": 97320960} +{"current_steps": 11890, "total_steps": 20825, "loss": 0.8716, "learning_rate": 2.11429497254348e-05, "epoch": 0.5709483793517407, "percentage": 57.09, "elapsed_time": "16:08:23", "remaining_time": "12:07:43", "throughput": 1676.37, "total_tokens": 97402880} +{"current_steps": 11900, "total_steps": 20825, "loss": 0.9373, "learning_rate": 2.1103812366466896e-05, "epoch": 0.5714285714285714, "percentage": 57.14, "elapsed_time": "16:09:11", "remaining_time": "12:06:53", "throughput": 1676.41, "total_tokens": 97484800} +{"current_steps": 11910, "total_steps": 20825, "loss": 0.9405, "learning_rate": 2.1064684791424236e-05, "epoch": 0.5719087635054022, "percentage": 57.19, "elapsed_time": "16:10:17", "remaining_time": "12:06:17", "throughput": 1675.91, "total_tokens": 97566720} +{"current_steps": 11920, "total_steps": 20825, "loss": 0.8314, "learning_rate": 2.1025567098562177e-05, "epoch": 0.5723889555822329, "percentage": 57.24, "elapsed_time": "16:11:12", "remaining_time": "12:05:33", "throughput": 1675.73, "total_tokens": 97648640} +{"current_steps": 11930, "total_steps": 20825, "loss": 0.8852, "learning_rate": 2.0986459386111256e-05, "epoch": 0.5728691476590636, "percentage": 57.29, "elapsed_time": "16:11:59", "remaining_time": "12:04:43", "throughput": 1675.78, "total_tokens": 97730560} +{"current_steps": 11940, "total_steps": 20825, "loss": 0.8412, "learning_rate": 2.0947361752276935e-05, "epoch": 0.5733493397358943, "percentage": 57.33, "elapsed_time": "16:12:45", "remaining_time": "12:03:51", "throughput": 1675.86, "total_tokens": 97812480} +{"current_steps": 11950, "total_steps": 20825, "loss": 1.007, "learning_rate": 2.0908274295239365e-05, "epoch": 0.5738295318127251, "percentage": 57.38, "elapsed_time": "16:13:31", "remaining_time": "12:03:00", "throughput": 1675.94, "total_tokens": 97894400} +{"current_steps": 11960, "total_steps": 20825, "loss": 0.882, "learning_rate": 2.0869197113153175e-05, "epoch": 0.5743097238895558, "percentage": 57.43, "elapsed_time": "16:14:18", "remaining_time": "12:02:10", "throughput": 1675.99, "total_tokens": 97976320} +{"current_steps": 11970, "total_steps": 20825, "loss": 0.7298, "learning_rate": 2.083013030414714e-05, "epoch": 0.5747899159663865, "percentage": 57.48, "elapsed_time": "16:15:06", "remaining_time": "12:01:20", "throughput": 1676.03, "total_tokens": 98058240} +{"current_steps": 11980, "total_steps": 20825, "loss": 0.808, "learning_rate": 2.0791073966324037e-05, "epoch": 0.5752701080432173, "percentage": 57.53, "elapsed_time": "16:15:52", "remaining_time": "12:00:30", "throughput": 1676.09, "total_tokens": 98140160} +{"current_steps": 11990, "total_steps": 20825, "loss": 0.729, "learning_rate": 2.0752028197760323e-05, "epoch": 0.575750300120048, "percentage": 57.58, "elapsed_time": "16:16:40", "remaining_time": "11:59:40", "throughput": 1676.12, "total_tokens": 98222080} +{"current_steps": 12000, "total_steps": 20825, "loss": 0.9467, "learning_rate": 2.07129930965059e-05, "epoch": 0.5762304921968787, "percentage": 57.62, "elapsed_time": "16:17:27", "remaining_time": "11:58:50", "throughput": 1676.18, "total_tokens": 98304000} +{"current_steps": 12010, "total_steps": 20825, "loss": 0.8261, "learning_rate": 2.0673968760583912e-05, "epoch": 0.5767106842737095, "percentage": 57.67, "elapsed_time": "16:18:18", "remaining_time": "11:58:03", "throughput": 1676.11, "total_tokens": 98385920} +{"current_steps": 12020, "total_steps": 20825, "loss": 1.0051, "learning_rate": 2.0634955287990465e-05, "epoch": 0.5771908763505402, "percentage": 57.72, "elapsed_time": "16:19:05", "remaining_time": "11:57:12", "throughput": 1676.17, "total_tokens": 98467840} +{"current_steps": 12030, "total_steps": 20825, "loss": 0.7679, "learning_rate": 2.059595277669436e-05, "epoch": 0.5776710684273709, "percentage": 57.77, "elapsed_time": "16:19:52", "remaining_time": "11:56:22", "throughput": 1676.22, "total_tokens": 98549760} +{"current_steps": 12040, "total_steps": 20825, "loss": 0.9756, "learning_rate": 2.0556961324636903e-05, "epoch": 0.5781512605042017, "percentage": 57.82, "elapsed_time": "16:20:39", "remaining_time": "11:55:32", "throughput": 1676.29, "total_tokens": 98631680} +{"current_steps": 12050, "total_steps": 20825, "loss": 0.9699, "learning_rate": 2.0517981029731616e-05, "epoch": 0.5786314525810324, "percentage": 57.86, "elapsed_time": "16:21:25", "remaining_time": "11:54:41", "throughput": 1676.36, "total_tokens": 98713600} +{"current_steps": 12060, "total_steps": 20825, "loss": 1.0828, "learning_rate": 2.0479011989863988e-05, "epoch": 0.5791116446578631, "percentage": 57.91, "elapsed_time": "16:22:12", "remaining_time": "11:53:50", "throughput": 1676.43, "total_tokens": 98795520} +{"current_steps": 12070, "total_steps": 20825, "loss": 0.8873, "learning_rate": 2.0440054302891276e-05, "epoch": 0.5795918367346938, "percentage": 57.96, "elapsed_time": "16:22:58", "remaining_time": "11:53:00", "throughput": 1676.5, "total_tokens": 98877440} +{"current_steps": 12080, "total_steps": 20825, "loss": 0.7899, "learning_rate": 2.0401108066642217e-05, "epoch": 0.5800720288115246, "percentage": 58.01, "elapsed_time": "16:23:45", "remaining_time": "11:52:09", "throughput": 1676.55, "total_tokens": 98959360} +{"current_steps": 12090, "total_steps": 20825, "loss": 0.843, "learning_rate": 2.0362173378916763e-05, "epoch": 0.5805522208883553, "percentage": 58.06, "elapsed_time": "16:24:33", "remaining_time": "11:51:20", "throughput": 1676.59, "total_tokens": 99041280} +{"current_steps": 12100, "total_steps": 20825, "loss": 0.8847, "learning_rate": 2.032325033748591e-05, "epoch": 0.581032412965186, "percentage": 58.1, "elapsed_time": "16:25:20", "remaining_time": "11:50:29", "throughput": 1676.64, "total_tokens": 99123200} +{"current_steps": 12110, "total_steps": 20825, "loss": 0.9604, "learning_rate": 2.0284339040091403e-05, "epoch": 0.5815126050420169, "percentage": 58.15, "elapsed_time": "16:26:07", "remaining_time": "11:49:40", "throughput": 1676.68, "total_tokens": 99205120} +{"current_steps": 12120, "total_steps": 20825, "loss": 0.716, "learning_rate": 2.0245439584445457e-05, "epoch": 0.5819927971188475, "percentage": 58.2, "elapsed_time": "16:26:55", "remaining_time": "11:48:50", "throughput": 1676.7, "total_tokens": 99287040} +{"current_steps": 12130, "total_steps": 20825, "loss": 0.9379, "learning_rate": 2.0206552068230587e-05, "epoch": 0.5824729891956782, "percentage": 58.25, "elapsed_time": "16:27:41", "remaining_time": "11:47:59", "throughput": 1676.79, "total_tokens": 99368960} +{"current_steps": 12140, "total_steps": 20825, "loss": 0.9769, "learning_rate": 2.0167676589099324e-05, "epoch": 0.5829531812725091, "percentage": 58.3, "elapsed_time": "16:28:27", "remaining_time": "11:47:08", "throughput": 1676.87, "total_tokens": 99450880} +{"current_steps": 12150, "total_steps": 20825, "loss": 0.8786, "learning_rate": 2.0128813244673946e-05, "epoch": 0.5834333733493398, "percentage": 58.34, "elapsed_time": "16:29:14", "remaining_time": "11:46:18", "throughput": 1676.91, "total_tokens": 99532800} +{"current_steps": 12160, "total_steps": 20825, "loss": 0.9365, "learning_rate": 2.0089962132546296e-05, "epoch": 0.5839135654261705, "percentage": 58.39, "elapsed_time": "16:30:01", "remaining_time": "11:45:28", "throughput": 1676.98, "total_tokens": 99614720} +{"current_steps": 12170, "total_steps": 20825, "loss": 0.8467, "learning_rate": 2.0051123350277477e-05, "epoch": 0.5843937575030012, "percentage": 58.44, "elapsed_time": "16:30:47", "remaining_time": "11:44:37", "throughput": 1677.04, "total_tokens": 99696640} +{"current_steps": 12180, "total_steps": 20825, "loss": 0.6612, "learning_rate": 2.0012296995397613e-05, "epoch": 0.584873949579832, "percentage": 58.49, "elapsed_time": "16:31:35", "remaining_time": "11:43:47", "throughput": 1677.08, "total_tokens": 99778560} +{"current_steps": 12190, "total_steps": 20825, "loss": 0.7583, "learning_rate": 1.997348316540566e-05, "epoch": 0.5853541416566627, "percentage": 58.54, "elapsed_time": "16:32:22", "remaining_time": "11:42:57", "throughput": 1677.14, "total_tokens": 99860480} +{"current_steps": 12200, "total_steps": 20825, "loss": 0.7988, "learning_rate": 1.9934681957769107e-05, "epoch": 0.5858343337334934, "percentage": 58.58, "elapsed_time": "16:33:09", "remaining_time": "11:42:07", "throughput": 1677.19, "total_tokens": 99942400} +{"current_steps": 12210, "total_steps": 20825, "loss": 0.9576, "learning_rate": 1.9895893469923736e-05, "epoch": 0.5863145258103242, "percentage": 58.63, "elapsed_time": "16:33:56", "remaining_time": "11:41:17", "throughput": 1677.24, "total_tokens": 100024320} +{"current_steps": 12220, "total_steps": 20825, "loss": 1.1025, "learning_rate": 1.985711779927339e-05, "epoch": 0.5867947178871549, "percentage": 58.68, "elapsed_time": "16:34:42", "remaining_time": "11:40:26", "throughput": 1677.32, "total_tokens": 100106240} +{"current_steps": 12230, "total_steps": 20825, "loss": 0.8477, "learning_rate": 1.9818355043189732e-05, "epoch": 0.5872749099639856, "percentage": 58.73, "elapsed_time": "16:35:28", "remaining_time": "11:39:36", "throughput": 1677.38, "total_tokens": 100188160} +{"current_steps": 12240, "total_steps": 20825, "loss": 0.9275, "learning_rate": 1.9779605299012005e-05, "epoch": 0.5877551020408164, "percentage": 58.78, "elapsed_time": "16:36:15", "remaining_time": "11:38:45", "throughput": 1677.45, "total_tokens": 100270080} +{"current_steps": 12250, "total_steps": 20825, "loss": 0.9013, "learning_rate": 1.974086866404675e-05, "epoch": 0.5882352941176471, "percentage": 58.82, "elapsed_time": "16:37:03", "remaining_time": "11:37:56", "throughput": 1677.46, "total_tokens": 100352000} +{"current_steps": 12260, "total_steps": 20825, "loss": 1.0079, "learning_rate": 1.970214523556761e-05, "epoch": 0.5887154861944778, "percentage": 58.87, "elapsed_time": "16:37:51", "remaining_time": "11:37:06", "throughput": 1677.5, "total_tokens": 100433920} +{"current_steps": 12270, "total_steps": 20825, "loss": 0.909, "learning_rate": 1.9663435110815065e-05, "epoch": 0.5891956782713085, "percentage": 58.92, "elapsed_time": "16:38:38", "remaining_time": "11:36:17", "throughput": 1677.53, "total_tokens": 100515840} +{"current_steps": 12280, "total_steps": 20825, "loss": 0.8296, "learning_rate": 1.9624738386996163e-05, "epoch": 0.5896758703481393, "percentage": 58.97, "elapsed_time": "16:39:26", "remaining_time": "11:35:27", "throughput": 1677.57, "total_tokens": 100597760} +{"current_steps": 12290, "total_steps": 20825, "loss": 0.9134, "learning_rate": 1.9586055161284332e-05, "epoch": 0.59015606242497, "percentage": 59.02, "elapsed_time": "16:40:14", "remaining_time": "11:34:38", "throughput": 1677.59, "total_tokens": 100679680} +{"current_steps": 12300, "total_steps": 20825, "loss": 1.115, "learning_rate": 1.954738553081909e-05, "epoch": 0.5906362545018007, "percentage": 59.06, "elapsed_time": "16:41:01", "remaining_time": "11:33:48", "throughput": 1677.63, "total_tokens": 100761600} +{"current_steps": 12310, "total_steps": 20825, "loss": 0.8391, "learning_rate": 1.950872959270581e-05, "epoch": 0.5911164465786315, "percentage": 59.11, "elapsed_time": "16:41:49", "remaining_time": "11:32:58", "throughput": 1677.67, "total_tokens": 100843520} +{"current_steps": 12320, "total_steps": 20825, "loss": 0.897, "learning_rate": 1.9470087444015484e-05, "epoch": 0.5915966386554622, "percentage": 59.16, "elapsed_time": "16:42:37", "remaining_time": "11:32:09", "throughput": 1677.68, "total_tokens": 100925440} +{"current_steps": 12330, "total_steps": 20825, "loss": 1.1514, "learning_rate": 1.9431459181784495e-05, "epoch": 0.5920768307322929, "percentage": 59.21, "elapsed_time": "16:43:25", "remaining_time": "11:31:19", "throughput": 1677.72, "total_tokens": 101007360} +{"current_steps": 12340, "total_steps": 20825, "loss": 0.8289, "learning_rate": 1.939284490301432e-05, "epoch": 0.5925570228091237, "percentage": 59.26, "elapsed_time": "16:44:12", "remaining_time": "11:30:29", "throughput": 1677.76, "total_tokens": 101089280} +{"current_steps": 12350, "total_steps": 20825, "loss": 0.7324, "learning_rate": 1.935424470467135e-05, "epoch": 0.5930372148859544, "percentage": 59.3, "elapsed_time": "16:45:00", "remaining_time": "11:29:40", "throughput": 1677.77, "total_tokens": 101171200} +{"current_steps": 12360, "total_steps": 20825, "loss": 0.9871, "learning_rate": 1.9315658683686615e-05, "epoch": 0.5935174069627851, "percentage": 59.35, "elapsed_time": "16:45:46", "remaining_time": "11:28:49", "throughput": 1677.85, "total_tokens": 101253120} +{"current_steps": 12370, "total_steps": 20825, "loss": 0.8688, "learning_rate": 1.9277086936955517e-05, "epoch": 0.5939975990396158, "percentage": 59.4, "elapsed_time": "16:46:34", "remaining_time": "11:27:59", "throughput": 1677.9, "total_tokens": 101335040} +{"current_steps": 12380, "total_steps": 20825, "loss": 0.8722, "learning_rate": 1.9238529561337646e-05, "epoch": 0.5944777911164466, "percentage": 59.45, "elapsed_time": "16:47:21", "remaining_time": "11:27:10", "throughput": 1677.94, "total_tokens": 101416960} +{"current_steps": 12390, "total_steps": 20825, "loss": 0.9837, "learning_rate": 1.9199986653656502e-05, "epoch": 0.5949579831932773, "percentage": 59.5, "elapsed_time": "16:48:08", "remaining_time": "11:26:20", "throughput": 1677.97, "total_tokens": 101498880} +{"current_steps": 12400, "total_steps": 20825, "loss": 0.8041, "learning_rate": 1.9161458310699225e-05, "epoch": 0.595438175270108, "percentage": 59.54, "elapsed_time": "16:48:54", "remaining_time": "11:25:29", "throughput": 1678.06, "total_tokens": 101580800} +{"current_steps": 12410, "total_steps": 20825, "loss": 0.9768, "learning_rate": 1.9122944629216402e-05, "epoch": 0.5959183673469388, "percentage": 59.59, "elapsed_time": "16:49:39", "remaining_time": "11:24:38", "throughput": 1678.16, "total_tokens": 101662720} +{"current_steps": 12420, "total_steps": 20825, "loss": 0.8343, "learning_rate": 1.9084445705921815e-05, "epoch": 0.5963985594237695, "percentage": 59.64, "elapsed_time": "16:50:25", "remaining_time": "11:23:47", "throughput": 1678.25, "total_tokens": 101744640} +{"current_steps": 12430, "total_steps": 20825, "loss": 1.0443, "learning_rate": 1.9045961637492145e-05, "epoch": 0.5968787515006002, "percentage": 59.69, "elapsed_time": "16:51:10", "remaining_time": "11:22:55", "throughput": 1678.35, "total_tokens": 101826560} +{"current_steps": 12440, "total_steps": 20825, "loss": 0.9608, "learning_rate": 1.9007492520566814e-05, "epoch": 0.597358943577431, "percentage": 59.74, "elapsed_time": "16:51:55", "remaining_time": "11:22:04", "throughput": 1678.45, "total_tokens": 101908480} +{"current_steps": 12450, "total_steps": 20825, "loss": 0.9062, "learning_rate": 1.896903845174768e-05, "epoch": 0.5978391356542617, "percentage": 59.78, "elapsed_time": "16:52:41", "remaining_time": "11:21:13", "throughput": 1678.54, "total_tokens": 101990400} +{"current_steps": 12460, "total_steps": 20825, "loss": 0.815, "learning_rate": 1.8930599527598797e-05, "epoch": 0.5983193277310924, "percentage": 59.83, "elapsed_time": "16:53:26", "remaining_time": "11:20:22", "throughput": 1678.64, "total_tokens": 102072320} +{"current_steps": 12470, "total_steps": 20825, "loss": 1.0498, "learning_rate": 1.8892175844646215e-05, "epoch": 0.5987995198079231, "percentage": 59.88, "elapsed_time": "16:54:12", "remaining_time": "11:19:31", "throughput": 1678.73, "total_tokens": 102154240} +{"current_steps": 12480, "total_steps": 20825, "loss": 0.7995, "learning_rate": 1.8853767499377712e-05, "epoch": 0.5992797118847539, "percentage": 59.93, "elapsed_time": "16:54:58", "remaining_time": "11:18:40", "throughput": 1678.8, "total_tokens": 102236160} +{"current_steps": 12490, "total_steps": 20825, "loss": 0.7581, "learning_rate": 1.8815374588242523e-05, "epoch": 0.5997599039615846, "percentage": 59.98, "elapsed_time": "16:55:44", "remaining_time": "11:17:50", "throughput": 1678.86, "total_tokens": 102318080} +{"current_steps": 12500, "total_steps": 20825, "loss": 0.8486, "learning_rate": 1.877699720765114e-05, "epoch": 0.6002400960384153, "percentage": 60.02, "elapsed_time": "16:56:33", "remaining_time": "11:17:01", "throughput": 1678.86, "total_tokens": 102400000} +{"current_steps": 12510, "total_steps": 20825, "loss": 0.7697, "learning_rate": 1.873863545397507e-05, "epoch": 0.6007202881152461, "percentage": 60.07, "elapsed_time": "16:57:22", "remaining_time": "11:16:12", "throughput": 1678.87, "total_tokens": 102481920} +{"current_steps": 12520, "total_steps": 20825, "loss": 0.9144, "learning_rate": 1.870028942354655e-05, "epoch": 0.6012004801920768, "percentage": 60.12, "elapsed_time": "16:58:08", "remaining_time": "11:15:22", "throughput": 1678.94, "total_tokens": 102563840} +{"current_steps": 12530, "total_steps": 20825, "loss": 0.8182, "learning_rate": 1.8661959212658365e-05, "epoch": 0.6016806722689075, "percentage": 60.17, "elapsed_time": "16:58:55", "remaining_time": "11:14:32", "throughput": 1678.98, "total_tokens": 102645760} +{"current_steps": 12540, "total_steps": 20825, "loss": 0.8923, "learning_rate": 1.862364491756355e-05, "epoch": 0.6021608643457383, "percentage": 60.22, "elapsed_time": "16:59:42", "remaining_time": "11:13:42", "throughput": 1679.02, "total_tokens": 102727680} +{"current_steps": 12550, "total_steps": 20825, "loss": 0.9803, "learning_rate": 1.8585346634475175e-05, "epoch": 0.602641056422569, "percentage": 60.26, "elapsed_time": "17:00:29", "remaining_time": "11:12:52", "throughput": 1679.09, "total_tokens": 102809600} +{"current_steps": 12560, "total_steps": 20825, "loss": 0.9476, "learning_rate": 1.8547064459566117e-05, "epoch": 0.6031212484993997, "percentage": 60.31, "elapsed_time": "17:01:15", "remaining_time": "11:12:01", "throughput": 1679.16, "total_tokens": 102891520} +{"current_steps": 12570, "total_steps": 20825, "loss": 0.7547, "learning_rate": 1.8508798488968803e-05, "epoch": 0.6036014405762304, "percentage": 60.36, "elapsed_time": "17:02:04", "remaining_time": "11:11:12", "throughput": 1679.16, "total_tokens": 102973440} +{"current_steps": 12580, "total_steps": 20825, "loss": 0.9321, "learning_rate": 1.8470548818774942e-05, "epoch": 0.6040816326530613, "percentage": 60.41, "elapsed_time": "17:02:51", "remaining_time": "11:10:23", "throughput": 1679.2, "total_tokens": 103055360} +{"current_steps": 12590, "total_steps": 20825, "loss": 0.8547, "learning_rate": 1.8432315545035328e-05, "epoch": 0.604561824729892, "percentage": 60.46, "elapsed_time": "17:03:37", "remaining_time": "11:09:32", "throughput": 1679.27, "total_tokens": 103137280} +{"current_steps": 12600, "total_steps": 20825, "loss": 0.9036, "learning_rate": 1.83940987637596e-05, "epoch": 0.6050420168067226, "percentage": 60.5, "elapsed_time": "17:04:27", "remaining_time": "11:08:44", "throughput": 1679.24, "total_tokens": 103219200} +{"current_steps": 12610, "total_steps": 20825, "loss": 1.0021, "learning_rate": 1.8355898570915937e-05, "epoch": 0.6055222088835535, "percentage": 60.55, "elapsed_time": "17:05:16", "remaining_time": "11:07:56", "throughput": 1679.24, "total_tokens": 103301120} +{"current_steps": 12620, "total_steps": 20825, "loss": 0.9036, "learning_rate": 1.8317715062430902e-05, "epoch": 0.6060024009603842, "percentage": 60.6, "elapsed_time": "17:06:05", "remaining_time": "11:07:07", "throughput": 1679.25, "total_tokens": 103383040} +{"current_steps": 12630, "total_steps": 20825, "loss": 0.9671, "learning_rate": 1.8279548334189146e-05, "epoch": 0.6064825930372149, "percentage": 60.65, "elapsed_time": "17:06:53", "remaining_time": "11:06:17", "throughput": 1679.26, "total_tokens": 103464960} +{"current_steps": 12640, "total_steps": 20825, "loss": 0.943, "learning_rate": 1.8241398482033185e-05, "epoch": 0.6069627851140457, "percentage": 60.7, "elapsed_time": "17:07:41", "remaining_time": "11:05:28", "throughput": 1679.27, "total_tokens": 103546880} +{"current_steps": 12650, "total_steps": 20825, "loss": 0.9297, "learning_rate": 1.8203265601763136e-05, "epoch": 0.6074429771908764, "percentage": 60.74, "elapsed_time": "17:08:31", "remaining_time": "11:04:40", "throughput": 1679.24, "total_tokens": 103628800} +{"current_steps": 12660, "total_steps": 20825, "loss": 0.8064, "learning_rate": 1.816514978913655e-05, "epoch": 0.6079231692677071, "percentage": 60.79, "elapsed_time": "17:09:20", "remaining_time": "11:03:52", "throughput": 1679.24, "total_tokens": 103710720} +{"current_steps": 12670, "total_steps": 20825, "loss": 0.9639, "learning_rate": 1.8127051139868044e-05, "epoch": 0.6084033613445378, "percentage": 60.84, "elapsed_time": "17:10:10", "remaining_time": "11:03:04", "throughput": 1679.2, "total_tokens": 103792640} +{"current_steps": 12680, "total_steps": 20825, "loss": 0.9895, "learning_rate": 1.8088969749629197e-05, "epoch": 0.6088835534213686, "percentage": 60.89, "elapsed_time": "17:10:59", "remaining_time": "11:02:15", "throughput": 1679.21, "total_tokens": 103874560} +{"current_steps": 12690, "total_steps": 20825, "loss": 1.0683, "learning_rate": 1.8050905714048233e-05, "epoch": 0.6093637454981993, "percentage": 60.94, "elapsed_time": "17:11:45", "remaining_time": "11:01:24", "throughput": 1679.27, "total_tokens": 103956480} +{"current_steps": 12700, "total_steps": 20825, "loss": 0.7629, "learning_rate": 1.8012859128709766e-05, "epoch": 0.60984393757503, "percentage": 60.98, "elapsed_time": "17:12:34", "remaining_time": "11:00:36", "throughput": 1679.28, "total_tokens": 104038400} +{"current_steps": 12710, "total_steps": 20825, "loss": 0.9292, "learning_rate": 1.7974830089154624e-05, "epoch": 0.6103241296518608, "percentage": 61.03, "elapsed_time": "17:13:24", "remaining_time": "10:59:48", "throughput": 1679.24, "total_tokens": 104120320} +{"current_steps": 12720, "total_steps": 20825, "loss": 0.9859, "learning_rate": 1.7936818690879574e-05, "epoch": 0.6108043217286915, "percentage": 61.08, "elapsed_time": "17:14:13", "remaining_time": "10:58:59", "throughput": 1679.22, "total_tokens": 104202240} +{"current_steps": 12730, "total_steps": 20825, "loss": 0.9921, "learning_rate": 1.7898825029337054e-05, "epoch": 0.6112845138055222, "percentage": 61.13, "elapsed_time": "17:15:03", "remaining_time": "10:58:11", "throughput": 1679.19, "total_tokens": 104284160} +{"current_steps": 12740, "total_steps": 20825, "loss": 0.8653, "learning_rate": 1.7860849199934983e-05, "epoch": 0.611764705882353, "percentage": 61.18, "elapsed_time": "17:15:53", "remaining_time": "10:57:23", "throughput": 1679.18, "total_tokens": 104366080} +{"current_steps": 12750, "total_steps": 20825, "loss": 0.9741, "learning_rate": 1.7822891298036515e-05, "epoch": 0.6122448979591837, "percentage": 61.22, "elapsed_time": "17:16:44", "remaining_time": "10:56:35", "throughput": 1679.12, "total_tokens": 104448000} +{"current_steps": 12760, "total_steps": 20825, "loss": 0.9431, "learning_rate": 1.7784951418959747e-05, "epoch": 0.6127250900360144, "percentage": 61.27, "elapsed_time": "17:17:34", "remaining_time": "10:55:48", "throughput": 1679.07, "total_tokens": 104529920} +{"current_steps": 12770, "total_steps": 20825, "loss": 0.9441, "learning_rate": 1.7747029657977556e-05, "epoch": 0.6132052821128451, "percentage": 61.32, "elapsed_time": "17:18:24", "remaining_time": "10:55:00", "throughput": 1679.05, "total_tokens": 104611840} +{"current_steps": 12780, "total_steps": 20825, "loss": 1.0325, "learning_rate": 1.7709126110317297e-05, "epoch": 0.6136854741896759, "percentage": 61.37, "elapsed_time": "17:19:13", "remaining_time": "10:54:11", "throughput": 1679.02, "total_tokens": 104693760} +{"current_steps": 12790, "total_steps": 20825, "loss": 0.9102, "learning_rate": 1.7671240871160593e-05, "epoch": 0.6141656662665066, "percentage": 61.42, "elapsed_time": "17:20:04", "remaining_time": "10:53:23", "throughput": 1678.99, "total_tokens": 104775680} +{"current_steps": 12800, "total_steps": 20825, "loss": 0.817, "learning_rate": 1.76333740356431e-05, "epoch": 0.6146458583433373, "percentage": 61.46, "elapsed_time": "17:20:53", "remaining_time": "10:52:35", "throughput": 1678.98, "total_tokens": 104857600} +{"current_steps": 12810, "total_steps": 20825, "loss": 0.8403, "learning_rate": 1.7595525698854263e-05, "epoch": 0.6151260504201681, "percentage": 61.51, "elapsed_time": "17:21:41", "remaining_time": "10:51:46", "throughput": 1678.99, "total_tokens": 104939520} +{"current_steps": 12820, "total_steps": 20825, "loss": 0.8923, "learning_rate": 1.7557695955837063e-05, "epoch": 0.6156062424969988, "percentage": 61.56, "elapsed_time": "17:22:32", "remaining_time": "10:50:58", "throughput": 1678.92, "total_tokens": 105021440} +{"current_steps": 12830, "total_steps": 20825, "loss": 0.8347, "learning_rate": 1.7519884901587772e-05, "epoch": 0.6160864345738295, "percentage": 61.61, "elapsed_time": "17:23:23", "remaining_time": "10:50:11", "throughput": 1678.88, "total_tokens": 105103360} +{"current_steps": 12840, "total_steps": 20825, "loss": 1.0152, "learning_rate": 1.748209263105577e-05, "epoch": 0.6165666266506603, "percentage": 61.66, "elapsed_time": "17:24:11", "remaining_time": "10:49:22", "throughput": 1678.89, "total_tokens": 105185280} +{"current_steps": 12850, "total_steps": 20825, "loss": 0.9691, "learning_rate": 1.744431923914326e-05, "epoch": 0.617046818727491, "percentage": 61.7, "elapsed_time": "17:24:58", "remaining_time": "10:48:32", "throughput": 1678.93, "total_tokens": 105267200} +{"current_steps": 12860, "total_steps": 20825, "loss": 0.9528, "learning_rate": 1.7406564820705e-05, "epoch": 0.6175270108043217, "percentage": 61.75, "elapsed_time": "17:25:46", "remaining_time": "10:47:42", "throughput": 1678.96, "total_tokens": 105349120} +{"current_steps": 12870, "total_steps": 20825, "loss": 0.8165, "learning_rate": 1.736882947054815e-05, "epoch": 0.6180072028811524, "percentage": 61.8, "elapsed_time": "17:26:32", "remaining_time": "10:46:52", "throughput": 1679.03, "total_tokens": 105431040} +{"current_steps": 12880, "total_steps": 20825, "loss": 0.9941, "learning_rate": 1.7331113283431966e-05, "epoch": 0.6184873949579832, "percentage": 61.85, "elapsed_time": "17:27:20", "remaining_time": "10:46:03", "throughput": 1679.05, "total_tokens": 105512960} +{"current_steps": 12890, "total_steps": 20825, "loss": 0.7875, "learning_rate": 1.729341635406757e-05, "epoch": 0.6189675870348139, "percentage": 61.9, "elapsed_time": "17:28:09", "remaining_time": "10:45:14", "throughput": 1679.06, "total_tokens": 105594880} +{"current_steps": 12900, "total_steps": 20825, "loss": 0.9376, "learning_rate": 1.725573877711776e-05, "epoch": 0.6194477791116446, "percentage": 61.94, "elapsed_time": "17:28:58", "remaining_time": "10:44:25", "throughput": 1679.06, "total_tokens": 105676800} +{"current_steps": 12910, "total_steps": 20825, "loss": 0.9336, "learning_rate": 1.7218080647196698e-05, "epoch": 0.6199279711884754, "percentage": 61.99, "elapsed_time": "17:29:48", "remaining_time": "10:43:37", "throughput": 1679.01, "total_tokens": 105758720} +{"current_steps": 12920, "total_steps": 20825, "loss": 0.8139, "learning_rate": 1.7180442058869732e-05, "epoch": 0.6204081632653061, "percentage": 62.04, "elapsed_time": "17:30:39", "remaining_time": "10:42:50", "throughput": 1678.96, "total_tokens": 105840640} +{"current_steps": 12930, "total_steps": 20825, "loss": 0.8121, "learning_rate": 1.7142823106653135e-05, "epoch": 0.6208883553421368, "percentage": 62.09, "elapsed_time": "17:31:28", "remaining_time": "10:42:01", "throughput": 1678.96, "total_tokens": 105922560} +{"current_steps": 12940, "total_steps": 20825, "loss": 0.8867, "learning_rate": 1.7105223885013884e-05, "epoch": 0.6213685474189676, "percentage": 62.14, "elapsed_time": "17:32:16", "remaining_time": "10:41:12", "throughput": 1678.98, "total_tokens": 106004480} +{"current_steps": 12950, "total_steps": 20825, "loss": 0.9163, "learning_rate": 1.706764448836938e-05, "epoch": 0.6218487394957983, "percentage": 62.18, "elapsed_time": "17:33:07", "remaining_time": "10:40:25", "throughput": 1678.9, "total_tokens": 106086400} +{"current_steps": 12960, "total_steps": 20825, "loss": 0.969, "learning_rate": 1.703008501108726e-05, "epoch": 0.622328931572629, "percentage": 62.23, "elapsed_time": "17:33:56", "remaining_time": "10:39:36", "throughput": 1678.91, "total_tokens": 106168320} +{"current_steps": 12970, "total_steps": 20825, "loss": 0.9426, "learning_rate": 1.699254554748515e-05, "epoch": 0.6228091236494598, "percentage": 62.28, "elapsed_time": "17:34:44", "remaining_time": "10:38:46", "throughput": 1678.94, "total_tokens": 106250240} +{"current_steps": 12980, "total_steps": 20825, "loss": 0.8038, "learning_rate": 1.6955026191830385e-05, "epoch": 0.6232893157262905, "percentage": 62.33, "elapsed_time": "17:35:32", "remaining_time": "10:37:57", "throughput": 1678.95, "total_tokens": 106332160} +{"current_steps": 12990, "total_steps": 20825, "loss": 0.9071, "learning_rate": 1.691752703833984e-05, "epoch": 0.6237695078031212, "percentage": 62.38, "elapsed_time": "17:36:17", "remaining_time": "10:37:06", "throughput": 1679.05, "total_tokens": 106414080} +{"current_steps": 13000, "total_steps": 20825, "loss": 0.8317, "learning_rate": 1.6880048181179652e-05, "epoch": 0.6242496998799519, "percentage": 62.42, "elapsed_time": "17:37:02", "remaining_time": "10:36:15", "throughput": 1679.14, "total_tokens": 106496000} +{"current_steps": 13010, "total_steps": 20825, "loss": 0.938, "learning_rate": 1.684258971446497e-05, "epoch": 0.6247298919567827, "percentage": 62.47, "elapsed_time": "17:37:51", "remaining_time": "10:35:26", "throughput": 1679.16, "total_tokens": 106577920} +{"current_steps": 13020, "total_steps": 20825, "loss": 0.8077, "learning_rate": 1.6805151732259755e-05, "epoch": 0.6252100840336134, "percentage": 62.52, "elapsed_time": "17:38:36", "remaining_time": "10:34:35", "throughput": 1679.25, "total_tokens": 106659840} +{"current_steps": 13030, "total_steps": 20825, "loss": 0.8399, "learning_rate": 1.6767734328576544e-05, "epoch": 0.6256902761104441, "percentage": 62.57, "elapsed_time": "17:39:21", "remaining_time": "10:33:44", "throughput": 1679.34, "total_tokens": 106741760} +{"current_steps": 13040, "total_steps": 20825, "loss": 0.8906, "learning_rate": 1.6730337597376165e-05, "epoch": 0.626170468187275, "percentage": 62.62, "elapsed_time": "17:40:07", "remaining_time": "10:32:54", "throughput": 1679.43, "total_tokens": 106823680} +{"current_steps": 13050, "total_steps": 20825, "loss": 0.7171, "learning_rate": 1.669296163256755e-05, "epoch": 0.6266506602641057, "percentage": 62.67, "elapsed_time": "17:40:52", "remaining_time": "10:32:03", "throughput": 1679.51, "total_tokens": 106905600} +{"current_steps": 13060, "total_steps": 20825, "loss": 1.0005, "learning_rate": 1.6655606528007505e-05, "epoch": 0.6271308523409364, "percentage": 62.71, "elapsed_time": "17:41:38", "remaining_time": "10:31:12", "throughput": 1679.6, "total_tokens": 106987520} +{"current_steps": 13070, "total_steps": 20825, "loss": 0.9795, "learning_rate": 1.6618272377500406e-05, "epoch": 0.6276110444177672, "percentage": 62.76, "elapsed_time": "17:42:23", "remaining_time": "10:30:21", "throughput": 1679.69, "total_tokens": 107069440} +{"current_steps": 13080, "total_steps": 20825, "loss": 0.7443, "learning_rate": 1.658095927479805e-05, "epoch": 0.6280912364945979, "percentage": 62.81, "elapsed_time": "17:43:08", "remaining_time": "10:29:30", "throughput": 1679.79, "total_tokens": 107151360} +{"current_steps": 13090, "total_steps": 20825, "loss": 1.141, "learning_rate": 1.6543667313599365e-05, "epoch": 0.6285714285714286, "percentage": 62.86, "elapsed_time": "17:43:54", "remaining_time": "10:28:40", "throughput": 1679.87, "total_tokens": 107233280} +{"current_steps": 13100, "total_steps": 20825, "loss": 0.8862, "learning_rate": 1.6506396587550188e-05, "epoch": 0.6290516206482593, "percentage": 62.91, "elapsed_time": "17:44:39", "remaining_time": "10:27:49", "throughput": 1679.96, "total_tokens": 107315200} +{"current_steps": 13110, "total_steps": 20825, "loss": 0.8555, "learning_rate": 1.6469147190243027e-05, "epoch": 0.6295318127250901, "percentage": 62.95, "elapsed_time": "17:45:25", "remaining_time": "10:26:58", "throughput": 1680.04, "total_tokens": 107397120} +{"current_steps": 13120, "total_steps": 20825, "loss": 0.8369, "learning_rate": 1.6431919215216862e-05, "epoch": 0.6300120048019208, "percentage": 63.0, "elapsed_time": "17:46:10", "remaining_time": "10:26:08", "throughput": 1680.14, "total_tokens": 107479040} +{"current_steps": 13130, "total_steps": 20825, "loss": 0.9955, "learning_rate": 1.6394712755956817e-05, "epoch": 0.6304921968787515, "percentage": 63.05, "elapsed_time": "17:46:55", "remaining_time": "10:25:17", "throughput": 1680.23, "total_tokens": 107560960} +{"current_steps": 13140, "total_steps": 20825, "loss": 0.8961, "learning_rate": 1.635752790589405e-05, "epoch": 0.6309723889555823, "percentage": 63.1, "elapsed_time": "17:47:40", "remaining_time": "10:24:26", "throughput": 1680.32, "total_tokens": 107642880} +{"current_steps": 13150, "total_steps": 20825, "loss": 0.987, "learning_rate": 1.6320364758405422e-05, "epoch": 0.631452581032413, "percentage": 63.15, "elapsed_time": "17:48:26", "remaining_time": "10:23:35", "throughput": 1680.41, "total_tokens": 107724800} +{"current_steps": 13160, "total_steps": 20825, "loss": 0.9919, "learning_rate": 1.628322340681329e-05, "epoch": 0.6319327731092437, "percentage": 63.19, "elapsed_time": "17:49:11", "remaining_time": "10:22:44", "throughput": 1680.51, "total_tokens": 107806720} +{"current_steps": 13170, "total_steps": 20825, "loss": 1.0279, "learning_rate": 1.6246103944385295e-05, "epoch": 0.6324129651860745, "percentage": 63.24, "elapsed_time": "17:49:56", "remaining_time": "10:21:53", "throughput": 1680.6, "total_tokens": 107888640} +{"current_steps": 13180, "total_steps": 20825, "loss": 0.8903, "learning_rate": 1.620900646433412e-05, "epoch": 0.6328931572629052, "percentage": 63.29, "elapsed_time": "17:50:41", "remaining_time": "10:21:03", "throughput": 1680.69, "total_tokens": 107970560} +{"current_steps": 13190, "total_steps": 20825, "loss": 0.9969, "learning_rate": 1.6171931059817214e-05, "epoch": 0.6333733493397359, "percentage": 63.34, "elapsed_time": "17:51:27", "remaining_time": "10:20:12", "throughput": 1680.77, "total_tokens": 108052480} +{"current_steps": 13200, "total_steps": 20825, "loss": 0.6298, "learning_rate": 1.613487782393661e-05, "epoch": 0.6338535414165666, "percentage": 63.39, "elapsed_time": "17:52:12", "remaining_time": "10:19:21", "throughput": 1680.86, "total_tokens": 108134400} +{"current_steps": 13210, "total_steps": 20825, "loss": 0.7394, "learning_rate": 1.6097846849738685e-05, "epoch": 0.6343337334933974, "percentage": 63.43, "elapsed_time": "17:52:58", "remaining_time": "10:18:31", "throughput": 1680.95, "total_tokens": 108216320} +{"current_steps": 13220, "total_steps": 20825, "loss": 0.9739, "learning_rate": 1.6060838230213883e-05, "epoch": 0.6348139255702281, "percentage": 63.48, "elapsed_time": "17:53:43", "remaining_time": "10:17:40", "throughput": 1681.04, "total_tokens": 108298240} +{"current_steps": 13230, "total_steps": 20825, "loss": 1.0424, "learning_rate": 1.6023852058296544e-05, "epoch": 0.6352941176470588, "percentage": 63.53, "elapsed_time": "17:54:28", "remaining_time": "10:16:49", "throughput": 1681.13, "total_tokens": 108380160} +{"current_steps": 13240, "total_steps": 20825, "loss": 0.897, "learning_rate": 1.5986888426864617e-05, "epoch": 0.6357743097238896, "percentage": 63.58, "elapsed_time": "17:55:13", "remaining_time": "10:15:58", "throughput": 1681.22, "total_tokens": 108462080} +{"current_steps": 13250, "total_steps": 20825, "loss": 0.8078, "learning_rate": 1.5949947428739448e-05, "epoch": 0.6362545018007203, "percentage": 63.63, "elapsed_time": "17:55:58", "remaining_time": "10:15:08", "throughput": 1681.32, "total_tokens": 108544000} +{"current_steps": 13260, "total_steps": 20825, "loss": 0.7465, "learning_rate": 1.591302915668556e-05, "epoch": 0.636734693877551, "percentage": 63.67, "elapsed_time": "17:56:44", "remaining_time": "10:14:17", "throughput": 1681.39, "total_tokens": 108625920} +{"current_steps": 13270, "total_steps": 20825, "loss": 0.9428, "learning_rate": 1.5876133703410412e-05, "epoch": 0.6372148859543818, "percentage": 63.72, "elapsed_time": "17:57:30", "remaining_time": "10:13:27", "throughput": 1681.48, "total_tokens": 108707840} +{"current_steps": 13280, "total_steps": 20825, "loss": 1.0362, "learning_rate": 1.5839261161564138e-05, "epoch": 0.6376950780312125, "percentage": 63.77, "elapsed_time": "17:58:15", "remaining_time": "10:12:36", "throughput": 1681.57, "total_tokens": 108789760} +{"current_steps": 13290, "total_steps": 20825, "loss": 0.9749, "learning_rate": 1.5802411623739345e-05, "epoch": 0.6381752701080432, "percentage": 63.82, "elapsed_time": "17:59:00", "remaining_time": "10:11:45", "throughput": 1681.65, "total_tokens": 108871680} +{"current_steps": 13300, "total_steps": 20825, "loss": 0.8378, "learning_rate": 1.57655851824709e-05, "epoch": 0.6386554621848739, "percentage": 63.87, "elapsed_time": "17:59:45", "remaining_time": "10:10:55", "throughput": 1681.75, "total_tokens": 108953600} +{"current_steps": 13310, "total_steps": 20825, "loss": 0.9856, "learning_rate": 1.5728781930235627e-05, "epoch": 0.6391356542617047, "percentage": 63.91, "elapsed_time": "18:00:31", "remaining_time": "10:10:04", "throughput": 1681.83, "total_tokens": 109035520} +{"current_steps": 13320, "total_steps": 20825, "loss": 1.0489, "learning_rate": 1.5692001959452164e-05, "epoch": 0.6396158463385354, "percentage": 63.96, "elapsed_time": "18:01:16", "remaining_time": "10:09:13", "throughput": 1681.92, "total_tokens": 109117440} +{"current_steps": 13330, "total_steps": 20825, "loss": 0.8971, "learning_rate": 1.5655245362480654e-05, "epoch": 0.6400960384153661, "percentage": 64.01, "elapsed_time": "18:02:01", "remaining_time": "10:08:23", "throughput": 1682.01, "total_tokens": 109199360} +{"current_steps": 13340, "total_steps": 20825, "loss": 0.8842, "learning_rate": 1.561851223162254e-05, "epoch": 0.6405762304921969, "percentage": 64.06, "elapsed_time": "18:02:46", "remaining_time": "10:07:32", "throughput": 1682.1, "total_tokens": 109281280} +{"current_steps": 13350, "total_steps": 20825, "loss": 0.9354, "learning_rate": 1.558180265912037e-05, "epoch": 0.6410564225690276, "percentage": 64.11, "elapsed_time": "18:03:32", "remaining_time": "10:06:41", "throughput": 1682.2, "total_tokens": 109363200} +{"current_steps": 13360, "total_steps": 20825, "loss": 0.9725, "learning_rate": 1.5545116737157522e-05, "epoch": 0.6415366146458583, "percentage": 64.15, "elapsed_time": "18:04:17", "remaining_time": "10:05:51", "throughput": 1682.29, "total_tokens": 109445120} +{"current_steps": 13370, "total_steps": 20825, "loss": 0.7562, "learning_rate": 1.5508454557857966e-05, "epoch": 0.6420168067226891, "percentage": 64.2, "elapsed_time": "18:05:02", "remaining_time": "10:05:00", "throughput": 1682.38, "total_tokens": 109527040} +{"current_steps": 13380, "total_steps": 20825, "loss": 0.8151, "learning_rate": 1.5471816213286054e-05, "epoch": 0.6424969987995198, "percentage": 64.25, "elapsed_time": "18:05:47", "remaining_time": "10:04:10", "throughput": 1682.46, "total_tokens": 109608960} +{"current_steps": 13390, "total_steps": 20825, "loss": 0.9497, "learning_rate": 1.5435201795446317e-05, "epoch": 0.6429771908763505, "percentage": 64.3, "elapsed_time": "18:06:33", "remaining_time": "10:03:19", "throughput": 1682.55, "total_tokens": 109690880} +{"current_steps": 13400, "total_steps": 20825, "loss": 0.8651, "learning_rate": 1.5398611396283153e-05, "epoch": 0.6434573829531812, "percentage": 64.35, "elapsed_time": "18:07:18", "remaining_time": "10:02:29", "throughput": 1682.63, "total_tokens": 109772800} +{"current_steps": 13410, "total_steps": 20825, "loss": 0.8622, "learning_rate": 1.536204510768069e-05, "epoch": 0.643937575030012, "percentage": 64.39, "elapsed_time": "18:08:04", "remaining_time": "10:01:38", "throughput": 1682.72, "total_tokens": 109854720} +{"current_steps": 13420, "total_steps": 20825, "loss": 0.8377, "learning_rate": 1.532550302146249e-05, "epoch": 0.6444177671068427, "percentage": 64.44, "elapsed_time": "18:08:55", "remaining_time": "10:00:51", "throughput": 1682.65, "total_tokens": 109936640} +{"current_steps": 13430, "total_steps": 20825, "loss": 0.7773, "learning_rate": 1.528898522939133e-05, "epoch": 0.6448979591836734, "percentage": 64.49, "elapsed_time": "18:10:00", "remaining_time": "10:00:11", "throughput": 1682.22, "total_tokens": 110018560} +{"current_steps": 13440, "total_steps": 20825, "loss": 0.9058, "learning_rate": 1.5252491823168994e-05, "epoch": 0.6453781512605042, "percentage": 64.54, "elapsed_time": "18:10:50", "remaining_time": "9:59:23", "throughput": 1682.19, "total_tokens": 110100480} +{"current_steps": 13450, "total_steps": 20825, "loss": 0.9108, "learning_rate": 1.5216022894436043e-05, "epoch": 0.6458583433373349, "percentage": 64.59, "elapsed_time": "18:11:41", "remaining_time": "9:58:36", "throughput": 1682.14, "total_tokens": 110182400} +{"current_steps": 13460, "total_steps": 20825, "loss": 0.9771, "learning_rate": 1.517957853477154e-05, "epoch": 0.6463385354141656, "percentage": 64.63, "elapsed_time": "18:12:31", "remaining_time": "9:57:48", "throughput": 1682.11, "total_tokens": 110264320} +{"current_steps": 13470, "total_steps": 20825, "loss": 0.8984, "learning_rate": 1.5143158835692866e-05, "epoch": 0.6468187274909964, "percentage": 64.68, "elapsed_time": "18:13:18", "remaining_time": "9:56:58", "throughput": 1682.15, "total_tokens": 110346240} +{"current_steps": 13480, "total_steps": 20825, "loss": 1.1943, "learning_rate": 1.5106763888655478e-05, "epoch": 0.6472989195678271, "percentage": 64.73, "elapsed_time": "18:14:04", "remaining_time": "9:56:08", "throughput": 1682.23, "total_tokens": 110428160} +{"current_steps": 13490, "total_steps": 20825, "loss": 0.9233, "learning_rate": 1.5070393785052695e-05, "epoch": 0.6477791116446578, "percentage": 64.78, "elapsed_time": "18:14:49", "remaining_time": "9:55:17", "throughput": 1682.3, "total_tokens": 110510080} +{"current_steps": 13500, "total_steps": 20825, "loss": 0.7714, "learning_rate": 1.5034048616215402e-05, "epoch": 0.6482593037214885, "percentage": 64.83, "elapsed_time": "18:15:35", "remaining_time": "9:54:27", "throughput": 1682.37, "total_tokens": 110592000} +{"current_steps": 13510, "total_steps": 20825, "loss": 1.0867, "learning_rate": 1.4997728473411903e-05, "epoch": 0.6487394957983194, "percentage": 64.87, "elapsed_time": "18:16:21", "remaining_time": "9:53:37", "throughput": 1682.44, "total_tokens": 110673920} +{"current_steps": 13520, "total_steps": 20825, "loss": 0.8682, "learning_rate": 1.4961433447847672e-05, "epoch": 0.64921968787515, "percentage": 64.92, "elapsed_time": "18:17:07", "remaining_time": "9:52:47", "throughput": 1682.52, "total_tokens": 110755840} +{"current_steps": 13530, "total_steps": 20825, "loss": 0.8386, "learning_rate": 1.4925163630665065e-05, "epoch": 0.6496998799519808, "percentage": 64.97, "elapsed_time": "18:17:52", "remaining_time": "9:51:56", "throughput": 1682.6, "total_tokens": 110837760} +{"current_steps": 13540, "total_steps": 20825, "loss": 0.9952, "learning_rate": 1.4888919112943173e-05, "epoch": 0.6501800720288116, "percentage": 65.02, "elapsed_time": "18:18:38", "remaining_time": "9:51:06", "throughput": 1682.68, "total_tokens": 110919680} +{"current_steps": 13550, "total_steps": 20825, "loss": 0.8368, "learning_rate": 1.4852699985697546e-05, "epoch": 0.6506602641056423, "percentage": 65.07, "elapsed_time": "18:19:24", "remaining_time": "9:50:16", "throughput": 1682.76, "total_tokens": 111001600} +{"current_steps": 13560, "total_steps": 20825, "loss": 0.8539, "learning_rate": 1.4816506339879965e-05, "epoch": 0.651140456182473, "percentage": 65.11, "elapsed_time": "18:20:10", "remaining_time": "9:49:26", "throughput": 1682.82, "total_tokens": 111083520} +{"current_steps": 13570, "total_steps": 20825, "loss": 0.8573, "learning_rate": 1.4780338266378232e-05, "epoch": 0.6516206482593038, "percentage": 65.16, "elapsed_time": "18:20:56", "remaining_time": "9:48:36", "throughput": 1682.88, "total_tokens": 111165440} +{"current_steps": 13580, "total_steps": 20825, "loss": 0.6835, "learning_rate": 1.4744195856015947e-05, "epoch": 0.6521008403361345, "percentage": 65.21, "elapsed_time": "18:21:44", "remaining_time": "9:47:47", "throughput": 1682.9, "total_tokens": 111247360} +{"current_steps": 13590, "total_steps": 20825, "loss": 0.8532, "learning_rate": 1.4708079199552221e-05, "epoch": 0.6525810324129652, "percentage": 65.26, "elapsed_time": "18:22:30", "remaining_time": "9:46:56", "throughput": 1682.97, "total_tokens": 111329280} +{"current_steps": 13600, "total_steps": 20825, "loss": 1.038, "learning_rate": 1.4671988387681549e-05, "epoch": 0.6530612244897959, "percentage": 65.31, "elapsed_time": "18:23:16", "remaining_time": "9:46:06", "throughput": 1683.04, "total_tokens": 111411200} +{"current_steps": 13610, "total_steps": 20825, "loss": 0.9945, "learning_rate": 1.4635923511033494e-05, "epoch": 0.6535414165666267, "percentage": 65.35, "elapsed_time": "18:24:02", "remaining_time": "9:45:16", "throughput": 1683.11, "total_tokens": 111493120} +{"current_steps": 13620, "total_steps": 20825, "loss": 1.7508, "learning_rate": 1.4599884660172485e-05, "epoch": 0.6540216086434574, "percentage": 65.4, "elapsed_time": "18:24:48", "remaining_time": "9:44:26", "throughput": 1683.17, "total_tokens": 111575040} +{"current_steps": 13630, "total_steps": 20825, "loss": 0.8786, "learning_rate": 1.4563871925597622e-05, "epoch": 0.6545018007202881, "percentage": 65.45, "elapsed_time": "18:25:34", "remaining_time": "9:43:36", "throughput": 1683.25, "total_tokens": 111656960} +{"current_steps": 13640, "total_steps": 20825, "loss": 0.6227, "learning_rate": 1.452788539774241e-05, "epoch": 0.6549819927971189, "percentage": 65.5, "elapsed_time": "18:26:20", "remaining_time": "9:42:46", "throughput": 1683.3, "total_tokens": 111738880} +{"current_steps": 13650, "total_steps": 20825, "loss": 0.8651, "learning_rate": 1.4491925166974532e-05, "epoch": 0.6554621848739496, "percentage": 65.55, "elapsed_time": "18:27:06", "remaining_time": "9:41:56", "throughput": 1683.37, "total_tokens": 111820800} +{"current_steps": 13660, "total_steps": 20825, "loss": 0.8945, "learning_rate": 1.4455991323595655e-05, "epoch": 0.6559423769507803, "percentage": 65.59, "elapsed_time": "18:27:52", "remaining_time": "9:41:06", "throughput": 1683.44, "total_tokens": 111902720} +{"current_steps": 13670, "total_steps": 20825, "loss": 0.8423, "learning_rate": 1.4420083957841185e-05, "epoch": 0.6564225690276111, "percentage": 65.64, "elapsed_time": "18:28:38", "remaining_time": "9:40:16", "throughput": 1683.51, "total_tokens": 111984640} +{"current_steps": 13680, "total_steps": 20825, "loss": 0.8682, "learning_rate": 1.4384203159880017e-05, "epoch": 0.6569027611044418, "percentage": 65.69, "elapsed_time": "18:29:24", "remaining_time": "9:39:26", "throughput": 1683.58, "total_tokens": 112066560} +{"current_steps": 13690, "total_steps": 20825, "loss": 1.1063, "learning_rate": 1.4348349019814344e-05, "epoch": 0.6573829531812725, "percentage": 65.74, "elapsed_time": "18:30:10", "remaining_time": "9:38:36", "throughput": 1683.64, "total_tokens": 112148480} +{"current_steps": 13700, "total_steps": 20825, "loss": 0.9632, "learning_rate": 1.4312521627679428e-05, "epoch": 0.6578631452581032, "percentage": 65.79, "elapsed_time": "18:30:56", "remaining_time": "9:37:46", "throughput": 1683.72, "total_tokens": 112230400} +{"current_steps": 13710, "total_steps": 20825, "loss": 0.804, "learning_rate": 1.4276721073443344e-05, "epoch": 0.658343337334934, "percentage": 65.83, "elapsed_time": "18:31:41", "remaining_time": "9:36:55", "throughput": 1683.79, "total_tokens": 112312320} +{"current_steps": 13720, "total_steps": 20825, "loss": 1.0239, "learning_rate": 1.4240947447006764e-05, "epoch": 0.6588235294117647, "percentage": 65.88, "elapsed_time": "18:32:28", "remaining_time": "9:36:05", "throughput": 1683.86, "total_tokens": 112394240} +{"current_steps": 13730, "total_steps": 20825, "loss": 1.049, "learning_rate": 1.4205200838202782e-05, "epoch": 0.6593037214885954, "percentage": 65.93, "elapsed_time": "18:33:13", "remaining_time": "9:35:15", "throughput": 1683.93, "total_tokens": 112476160} +{"current_steps": 13740, "total_steps": 20825, "loss": 1.0863, "learning_rate": 1.4169481336796597e-05, "epoch": 0.6597839135654262, "percentage": 65.98, "elapsed_time": "18:33:59", "remaining_time": "9:34:25", "throughput": 1684.01, "total_tokens": 112558080} +{"current_steps": 13750, "total_steps": 20825, "loss": 0.9013, "learning_rate": 1.4133789032485367e-05, "epoch": 0.6602641056422569, "percentage": 66.03, "elapsed_time": "18:34:45", "remaining_time": "9:33:35", "throughput": 1684.08, "total_tokens": 112640000} +{"current_steps": 13760, "total_steps": 20825, "loss": 0.8773, "learning_rate": 1.4098124014897961e-05, "epoch": 0.6607442977190876, "percentage": 66.07, "elapsed_time": "18:35:31", "remaining_time": "9:32:45", "throughput": 1684.15, "total_tokens": 112721920} +{"current_steps": 13770, "total_steps": 20825, "loss": 0.7995, "learning_rate": 1.4062486373594694e-05, "epoch": 0.6612244897959184, "percentage": 66.12, "elapsed_time": "18:36:16", "remaining_time": "9:31:55", "throughput": 1684.22, "total_tokens": 112803840} +{"current_steps": 13780, "total_steps": 20825, "loss": 1.0093, "learning_rate": 1.4026876198067163e-05, "epoch": 0.6617046818727491, "percentage": 66.17, "elapsed_time": "18:37:02", "remaining_time": "9:31:05", "throughput": 1684.29, "total_tokens": 112885760} +{"current_steps": 13790, "total_steps": 20825, "loss": 0.9332, "learning_rate": 1.399129357773799e-05, "epoch": 0.6621848739495798, "percentage": 66.22, "elapsed_time": "18:37:48", "remaining_time": "9:30:15", "throughput": 1684.37, "total_tokens": 112967680} +{"current_steps": 13800, "total_steps": 20825, "loss": 0.8836, "learning_rate": 1.3955738601960588e-05, "epoch": 0.6626650660264105, "percentage": 66.27, "elapsed_time": "18:38:34", "remaining_time": "9:29:24", "throughput": 1684.44, "total_tokens": 113049600} +{"current_steps": 13810, "total_steps": 20825, "loss": 0.7864, "learning_rate": 1.392021136001897e-05, "epoch": 0.6631452581032413, "percentage": 66.31, "elapsed_time": "18:39:20", "remaining_time": "9:28:34", "throughput": 1684.51, "total_tokens": 113131520} +{"current_steps": 13820, "total_steps": 20825, "loss": 0.9925, "learning_rate": 1.3884711941127487e-05, "epoch": 0.663625450180072, "percentage": 66.36, "elapsed_time": "18:40:05", "remaining_time": "9:27:44", "throughput": 1684.58, "total_tokens": 113213440} +{"current_steps": 13830, "total_steps": 20825, "loss": 0.7822, "learning_rate": 1.384924043443062e-05, "epoch": 0.6641056422569027, "percentage": 66.41, "elapsed_time": "18:40:51", "remaining_time": "9:26:54", "throughput": 1684.65, "total_tokens": 113295360} +{"current_steps": 13840, "total_steps": 20825, "loss": 0.7278, "learning_rate": 1.3813796929002779e-05, "epoch": 0.6645858343337335, "percentage": 66.46, "elapsed_time": "18:41:37", "remaining_time": "9:26:04", "throughput": 1684.72, "total_tokens": 113377280} +{"current_steps": 13850, "total_steps": 20825, "loss": 0.7792, "learning_rate": 1.3778381513848055e-05, "epoch": 0.6650660264105642, "percentage": 66.51, "elapsed_time": "18:42:23", "remaining_time": "9:25:14", "throughput": 1684.78, "total_tokens": 113459200} +{"current_steps": 13860, "total_steps": 20825, "loss": 0.7843, "learning_rate": 1.3742994277899967e-05, "epoch": 0.6655462184873949, "percentage": 66.55, "elapsed_time": "18:43:09", "remaining_time": "9:24:24", "throughput": 1684.85, "total_tokens": 113541120} +{"current_steps": 13870, "total_steps": 20825, "loss": 1.2019, "learning_rate": 1.370763531002132e-05, "epoch": 0.6660264105642257, "percentage": 66.6, "elapsed_time": "18:43:55", "remaining_time": "9:23:34", "throughput": 1684.92, "total_tokens": 113623040} +{"current_steps": 13880, "total_steps": 20825, "loss": 0.7672, "learning_rate": 1.3672304699003908e-05, "epoch": 0.6665066026410564, "percentage": 66.65, "elapsed_time": "18:44:41", "remaining_time": "9:22:45", "throughput": 1684.98, "total_tokens": 113704960} +{"current_steps": 13890, "total_steps": 20825, "loss": 0.847, "learning_rate": 1.3637002533568302e-05, "epoch": 0.6669867947178871, "percentage": 66.7, "elapsed_time": "18:45:27", "remaining_time": "9:21:55", "throughput": 1685.05, "total_tokens": 113786880} +{"current_steps": 13900, "total_steps": 20825, "loss": 1.1898, "learning_rate": 1.3601728902363681e-05, "epoch": 0.6674669867947179, "percentage": 66.75, "elapsed_time": "18:46:13", "remaining_time": "9:21:05", "throughput": 1685.11, "total_tokens": 113868800} +{"current_steps": 13910, "total_steps": 20825, "loss": 0.9134, "learning_rate": 1.356648389396754e-05, "epoch": 0.6679471788715486, "percentage": 66.79, "elapsed_time": "18:46:59", "remaining_time": "9:20:15", "throughput": 1685.19, "total_tokens": 113950720} +{"current_steps": 13920, "total_steps": 20825, "loss": 1.1422, "learning_rate": 1.3531267596885488e-05, "epoch": 0.6684273709483793, "percentage": 66.84, "elapsed_time": "18:47:44", "remaining_time": "9:19:25", "throughput": 1685.26, "total_tokens": 114032640} +{"current_steps": 13930, "total_steps": 20825, "loss": 0.7922, "learning_rate": 1.349608009955107e-05, "epoch": 0.66890756302521, "percentage": 66.89, "elapsed_time": "18:48:30", "remaining_time": "9:18:35", "throughput": 1685.33, "total_tokens": 114114560} +{"current_steps": 13940, "total_steps": 20825, "loss": 0.8027, "learning_rate": 1.34609214903255e-05, "epoch": 0.6693877551020408, "percentage": 66.94, "elapsed_time": "18:49:16", "remaining_time": "9:17:45", "throughput": 1685.4, "total_tokens": 114196480} +{"current_steps": 13950, "total_steps": 20825, "loss": 0.9642, "learning_rate": 1.3425791857497422e-05, "epoch": 0.6698679471788715, "percentage": 66.99, "elapsed_time": "18:50:02", "remaining_time": "9:16:55", "throughput": 1685.47, "total_tokens": 114278400} +{"current_steps": 13960, "total_steps": 20825, "loss": 0.8414, "learning_rate": 1.3390691289282754e-05, "epoch": 0.6703481392557022, "percentage": 67.03, "elapsed_time": "18:50:48", "remaining_time": "9:16:05", "throughput": 1685.54, "total_tokens": 114360320} +{"current_steps": 13970, "total_steps": 20825, "loss": 0.9272, "learning_rate": 1.335561987382441e-05, "epoch": 0.6708283313325331, "percentage": 67.08, "elapsed_time": "18:51:33", "remaining_time": "9:15:15", "throughput": 1685.61, "total_tokens": 114442240} +{"current_steps": 13980, "total_steps": 20825, "loss": 0.7937, "learning_rate": 1.3320577699192086e-05, "epoch": 0.6713085234093638, "percentage": 67.13, "elapsed_time": "18:52:19", "remaining_time": "9:14:25", "throughput": 1685.68, "total_tokens": 114524160} +{"current_steps": 13990, "total_steps": 20825, "loss": 0.9645, "learning_rate": 1.3285564853382076e-05, "epoch": 0.6717887154861945, "percentage": 67.18, "elapsed_time": "18:53:04", "remaining_time": "9:13:34", "throughput": 1685.76, "total_tokens": 114606080} +{"current_steps": 14000, "total_steps": 20825, "loss": 0.8027, "learning_rate": 1.325058142431701e-05, "epoch": 0.6722689075630253, "percentage": 67.23, "elapsed_time": "18:53:50", "remaining_time": "9:12:44", "throughput": 1685.83, "total_tokens": 114688000} +{"current_steps": 14010, "total_steps": 20825, "loss": 0.7335, "learning_rate": 1.321562749984563e-05, "epoch": 0.672749099639856, "percentage": 67.27, "elapsed_time": "18:54:39", "remaining_time": "9:11:56", "throughput": 1685.82, "total_tokens": 114769920} +{"current_steps": 14020, "total_steps": 20825, "loss": 0.9804, "learning_rate": 1.318070316774262e-05, "epoch": 0.6732292917166867, "percentage": 67.32, "elapsed_time": "18:55:25", "remaining_time": "9:11:06", "throughput": 1685.88, "total_tokens": 114851840} +{"current_steps": 14030, "total_steps": 20825, "loss": 0.7016, "learning_rate": 1.3145808515708347e-05, "epoch": 0.6737094837935174, "percentage": 67.37, "elapsed_time": "18:56:11", "remaining_time": "9:10:16", "throughput": 1685.95, "total_tokens": 114933760} +{"current_steps": 14040, "total_steps": 20825, "loss": 0.9825, "learning_rate": 1.3110943631368616e-05, "epoch": 0.6741896758703482, "percentage": 67.42, "elapsed_time": "18:56:57", "remaining_time": "9:09:26", "throughput": 1686.02, "total_tokens": 115015680} +{"current_steps": 14050, "total_steps": 20825, "loss": 0.7027, "learning_rate": 1.3076108602274522e-05, "epoch": 0.6746698679471789, "percentage": 67.47, "elapsed_time": "18:57:42", "remaining_time": "9:08:36", "throughput": 1686.09, "total_tokens": 115097600} +{"current_steps": 14060, "total_steps": 20825, "loss": 0.8251, "learning_rate": 1.3041303515902179e-05, "epoch": 0.6751500600240096, "percentage": 67.52, "elapsed_time": "18:58:28", "remaining_time": "9:07:46", "throughput": 1686.17, "total_tokens": 115179520} +{"current_steps": 14070, "total_steps": 20825, "loss": 1.0897, "learning_rate": 1.3006528459652476e-05, "epoch": 0.6756302521008404, "percentage": 67.56, "elapsed_time": "18:59:14", "remaining_time": "9:06:56", "throughput": 1686.24, "total_tokens": 115261440} +{"current_steps": 14080, "total_steps": 20825, "loss": 0.9864, "learning_rate": 1.2971783520850939e-05, "epoch": 0.6761104441776711, "percentage": 67.61, "elapsed_time": "18:59:59", "remaining_time": "9:06:06", "throughput": 1686.31, "total_tokens": 115343360} +{"current_steps": 14090, "total_steps": 20825, "loss": 0.9467, "learning_rate": 1.2937068786747438e-05, "epoch": 0.6765906362545018, "percentage": 67.66, "elapsed_time": "19:00:45", "remaining_time": "9:05:16", "throughput": 1686.38, "total_tokens": 115425280} +{"current_steps": 14100, "total_steps": 20825, "loss": 0.971, "learning_rate": 1.2902384344515986e-05, "epoch": 0.6770708283313326, "percentage": 67.71, "elapsed_time": "19:01:31", "remaining_time": "9:04:26", "throughput": 1686.45, "total_tokens": 115507200} +{"current_steps": 14110, "total_steps": 20825, "loss": 0.7835, "learning_rate": 1.286773028125455e-05, "epoch": 0.6775510204081633, "percentage": 67.76, "elapsed_time": "19:02:16", "remaining_time": "9:03:36", "throughput": 1686.52, "total_tokens": 115589120} +{"current_steps": 14120, "total_steps": 20825, "loss": 0.9291, "learning_rate": 1.2833106683984808e-05, "epoch": 0.678031212484994, "percentage": 67.8, "elapsed_time": "19:03:02", "remaining_time": "9:02:46", "throughput": 1686.6, "total_tokens": 115671040} +{"current_steps": 14130, "total_steps": 20825, "loss": 0.8278, "learning_rate": 1.279851363965193e-05, "epoch": 0.6785114045618247, "percentage": 67.85, "elapsed_time": "19:03:48", "remaining_time": "9:01:57", "throughput": 1686.67, "total_tokens": 115752960} +{"current_steps": 14140, "total_steps": 20825, "loss": 0.8757, "learning_rate": 1.2763951235124346e-05, "epoch": 0.6789915966386555, "percentage": 67.9, "elapsed_time": "19:04:33", "remaining_time": "9:01:07", "throughput": 1686.74, "total_tokens": 115834880} +{"current_steps": 14150, "total_steps": 20825, "loss": 0.9235, "learning_rate": 1.2729419557193573e-05, "epoch": 0.6794717887154862, "percentage": 67.95, "elapsed_time": "19:05:19", "remaining_time": "9:00:17", "throughput": 1686.81, "total_tokens": 115916800} +{"current_steps": 14160, "total_steps": 20825, "loss": 0.7965, "learning_rate": 1.2694918692573954e-05, "epoch": 0.6799519807923169, "percentage": 68.0, "elapsed_time": "19:06:05", "remaining_time": "8:59:27", "throughput": 1686.88, "total_tokens": 115998720} +{"current_steps": 14170, "total_steps": 20825, "loss": 0.7966, "learning_rate": 1.2660448727902457e-05, "epoch": 0.6804321728691477, "percentage": 68.04, "elapsed_time": "19:06:50", "remaining_time": "8:58:37", "throughput": 1686.95, "total_tokens": 116080640} +{"current_steps": 14180, "total_steps": 20825, "loss": 0.7681, "learning_rate": 1.2626009749738444e-05, "epoch": 0.6809123649459784, "percentage": 68.09, "elapsed_time": "19:07:36", "remaining_time": "8:57:47", "throughput": 1687.03, "total_tokens": 116162560} +{"current_steps": 14190, "total_steps": 20825, "loss": 0.8936, "learning_rate": 1.2591601844563488e-05, "epoch": 0.6813925570228091, "percentage": 68.14, "elapsed_time": "19:08:22", "remaining_time": "8:56:57", "throughput": 1687.09, "total_tokens": 116244480} +{"current_steps": 14200, "total_steps": 20825, "loss": 0.9239, "learning_rate": 1.2557225098781105e-05, "epoch": 0.6818727490996399, "percentage": 68.19, "elapsed_time": "19:09:08", "remaining_time": "8:56:07", "throughput": 1687.16, "total_tokens": 116326400} +{"current_steps": 14210, "total_steps": 20825, "loss": 0.8666, "learning_rate": 1.2522879598716595e-05, "epoch": 0.6823529411764706, "percentage": 68.24, "elapsed_time": "19:09:54", "remaining_time": "8:55:17", "throughput": 1687.22, "total_tokens": 116408320} +{"current_steps": 14220, "total_steps": 20825, "loss": 0.873, "learning_rate": 1.2488565430616785e-05, "epoch": 0.6828331332533013, "percentage": 68.28, "elapsed_time": "19:10:40", "remaining_time": "8:54:28", "throughput": 1687.28, "total_tokens": 116490240} +{"current_steps": 14230, "total_steps": 20825, "loss": 0.6743, "learning_rate": 1.2454282680649804e-05, "epoch": 0.683313325330132, "percentage": 68.33, "elapsed_time": "19:11:26", "remaining_time": "8:53:38", "throughput": 1687.34, "total_tokens": 116572160} +{"current_steps": 14240, "total_steps": 20825, "loss": 0.8642, "learning_rate": 1.2420031434904906e-05, "epoch": 0.6837935174069628, "percentage": 68.38, "elapsed_time": "19:12:12", "remaining_time": "8:52:48", "throughput": 1687.41, "total_tokens": 116654080} +{"current_steps": 14250, "total_steps": 20825, "loss": 0.8987, "learning_rate": 1.2385811779392236e-05, "epoch": 0.6842737094837935, "percentage": 68.43, "elapsed_time": "19:12:58", "remaining_time": "8:51:59", "throughput": 1687.47, "total_tokens": 116736000} +{"current_steps": 14260, "total_steps": 20825, "loss": 0.9379, "learning_rate": 1.2351623800042587e-05, "epoch": 0.6847539015606242, "percentage": 68.48, "elapsed_time": "19:13:43", "remaining_time": "8:51:09", "throughput": 1687.54, "total_tokens": 116817920} +{"current_steps": 14270, "total_steps": 20825, "loss": 0.9432, "learning_rate": 1.2317467582707238e-05, "epoch": 0.685234093637455, "percentage": 68.52, "elapsed_time": "19:14:29", "remaining_time": "8:50:19", "throughput": 1687.61, "total_tokens": 116899840} +{"current_steps": 14280, "total_steps": 20825, "loss": 0.854, "learning_rate": 1.2283343213157688e-05, "epoch": 0.6857142857142857, "percentage": 68.57, "elapsed_time": "19:15:15", "remaining_time": "8:49:29", "throughput": 1687.68, "total_tokens": 116981760} +{"current_steps": 14290, "total_steps": 20825, "loss": 0.8973, "learning_rate": 1.2249250777085456e-05, "epoch": 0.6861944777911164, "percentage": 68.62, "elapsed_time": "19:16:00", "remaining_time": "8:48:39", "throughput": 1687.75, "total_tokens": 117063680} +{"current_steps": 14300, "total_steps": 20825, "loss": 0.9893, "learning_rate": 1.221519036010189e-05, "epoch": 0.6866746698679472, "percentage": 68.67, "elapsed_time": "19:16:46", "remaining_time": "8:47:49", "throughput": 1687.82, "total_tokens": 117145600} +{"current_steps": 14310, "total_steps": 20825, "loss": 0.7582, "learning_rate": 1.2181162047737942e-05, "epoch": 0.6871548619447779, "percentage": 68.72, "elapsed_time": "19:17:32", "remaining_time": "8:46:59", "throughput": 1687.89, "total_tokens": 117227520} +{"current_steps": 14320, "total_steps": 20825, "loss": 1.0281, "learning_rate": 1.2147165925443904e-05, "epoch": 0.6876350540216086, "percentage": 68.76, "elapsed_time": "19:18:18", "remaining_time": "8:46:10", "throughput": 1687.95, "total_tokens": 117309440} +{"current_steps": 14330, "total_steps": 20825, "loss": 0.84, "learning_rate": 1.2113202078589267e-05, "epoch": 0.6881152460984393, "percentage": 68.81, "elapsed_time": "19:19:04", "remaining_time": "8:45:20", "throughput": 1688.01, "total_tokens": 117391360} +{"current_steps": 14340, "total_steps": 20825, "loss": 0.8581, "learning_rate": 1.2079270592462475e-05, "epoch": 0.6885954381752701, "percentage": 68.86, "elapsed_time": "19:19:49", "remaining_time": "8:44:30", "throughput": 1688.08, "total_tokens": 117473280} +{"current_steps": 14350, "total_steps": 20825, "loss": 0.8766, "learning_rate": 1.204537155227068e-05, "epoch": 0.6890756302521008, "percentage": 68.91, "elapsed_time": "19:20:35", "remaining_time": "8:43:40", "throughput": 1688.15, "total_tokens": 117555200} +{"current_steps": 14360, "total_steps": 20825, "loss": 0.985, "learning_rate": 1.201150504313959e-05, "epoch": 0.6895558223289315, "percentage": 68.96, "elapsed_time": "19:21:21", "remaining_time": "8:42:51", "throughput": 1688.22, "total_tokens": 117637120} +{"current_steps": 14370, "total_steps": 20825, "loss": 0.8981, "learning_rate": 1.1977671150113206e-05, "epoch": 0.6900360144057623, "percentage": 69.0, "elapsed_time": "19:22:06", "remaining_time": "8:42:01", "throughput": 1688.29, "total_tokens": 117719040} +{"current_steps": 14380, "total_steps": 20825, "loss": 0.9291, "learning_rate": 1.1943869958153613e-05, "epoch": 0.690516206482593, "percentage": 69.05, "elapsed_time": "19:22:52", "remaining_time": "8:41:11", "throughput": 1688.35, "total_tokens": 117800960} +{"current_steps": 14390, "total_steps": 20825, "loss": 0.9612, "learning_rate": 1.1910101552140806e-05, "epoch": 0.6909963985594237, "percentage": 69.1, "elapsed_time": "19:23:38", "remaining_time": "8:40:21", "throughput": 1688.42, "total_tokens": 117882880} +{"current_steps": 14400, "total_steps": 20825, "loss": 0.9258, "learning_rate": 1.1876366016872445e-05, "epoch": 0.6914765906362546, "percentage": 69.15, "elapsed_time": "19:24:24", "remaining_time": "8:39:31", "throughput": 1688.49, "total_tokens": 117964800} +{"current_steps": 14410, "total_steps": 20825, "loss": 0.783, "learning_rate": 1.1842663437063613e-05, "epoch": 0.6919567827130852, "percentage": 69.2, "elapsed_time": "19:25:09", "remaining_time": "8:38:42", "throughput": 1688.56, "total_tokens": 118046720} +{"current_steps": 14420, "total_steps": 20825, "loss": 0.9465, "learning_rate": 1.180899389734668e-05, "epoch": 0.692436974789916, "percentage": 69.24, "elapsed_time": "19:25:55", "remaining_time": "8:37:52", "throughput": 1688.62, "total_tokens": 118128640} +{"current_steps": 14430, "total_steps": 20825, "loss": 0.8717, "learning_rate": 1.1775357482271032e-05, "epoch": 0.6929171668667466, "percentage": 69.29, "elapsed_time": "19:26:41", "remaining_time": "8:37:02", "throughput": 1688.69, "total_tokens": 118210560} +{"current_steps": 14440, "total_steps": 20825, "loss": 0.8557, "learning_rate": 1.1741754276302851e-05, "epoch": 0.6933973589435775, "percentage": 69.34, "elapsed_time": "19:27:27", "remaining_time": "8:36:13", "throughput": 1688.76, "total_tokens": 118292480} +{"current_steps": 14450, "total_steps": 20825, "loss": 0.9129, "learning_rate": 1.170818436382497e-05, "epoch": 0.6938775510204082, "percentage": 69.39, "elapsed_time": "19:28:12", "remaining_time": "8:35:23", "throughput": 1688.82, "total_tokens": 118374400} +{"current_steps": 14460, "total_steps": 20825, "loss": 0.9353, "learning_rate": 1.1674647829136581e-05, "epoch": 0.6943577430972389, "percentage": 69.44, "elapsed_time": "19:28:58", "remaining_time": "8:34:33", "throughput": 1688.9, "total_tokens": 118456320} +{"current_steps": 14470, "total_steps": 20825, "loss": 0.9419, "learning_rate": 1.164114475645306e-05, "epoch": 0.6948379351740697, "percentage": 69.48, "elapsed_time": "19:29:43", "remaining_time": "8:33:43", "throughput": 1688.97, "total_tokens": 118538240} +{"current_steps": 14480, "total_steps": 20825, "loss": 0.8269, "learning_rate": 1.1607675229905776e-05, "epoch": 0.6953181272509004, "percentage": 69.53, "elapsed_time": "19:30:29", "remaining_time": "8:32:53", "throughput": 1689.03, "total_tokens": 118620160} +{"current_steps": 14490, "total_steps": 20825, "loss": 0.8265, "learning_rate": 1.1574239333541856e-05, "epoch": 0.6957983193277311, "percentage": 69.58, "elapsed_time": "19:31:15", "remaining_time": "8:32:04", "throughput": 1689.09, "total_tokens": 118702080} +{"current_steps": 14500, "total_steps": 20825, "loss": 1.0225, "learning_rate": 1.1540837151323951e-05, "epoch": 0.6962785114045619, "percentage": 69.63, "elapsed_time": "19:32:01", "remaining_time": "8:31:14", "throughput": 1689.15, "total_tokens": 118784000} +{"current_steps": 14510, "total_steps": 20825, "loss": 1.0267, "learning_rate": 1.150746876713008e-05, "epoch": 0.6967587034813926, "percentage": 69.68, "elapsed_time": "19:32:49", "remaining_time": "8:30:25", "throughput": 1689.17, "total_tokens": 118865920} +{"current_steps": 14520, "total_steps": 20825, "loss": 0.9422, "learning_rate": 1.1474134264753384e-05, "epoch": 0.6972388955582233, "percentage": 69.72, "elapsed_time": "19:33:35", "remaining_time": "8:29:36", "throughput": 1689.23, "total_tokens": 118947840} +{"current_steps": 14530, "total_steps": 20825, "loss": 0.8435, "learning_rate": 1.1440833727901894e-05, "epoch": 0.697719087635054, "percentage": 69.77, "elapsed_time": "19:34:20", "remaining_time": "8:28:46", "throughput": 1689.3, "total_tokens": 119029760} +{"current_steps": 14540, "total_steps": 20825, "loss": 0.7872, "learning_rate": 1.1407567240198397e-05, "epoch": 0.6981992797118848, "percentage": 69.82, "elapsed_time": "19:35:07", "remaining_time": "8:27:57", "throughput": 1689.36, "total_tokens": 119111680} +{"current_steps": 14550, "total_steps": 20825, "loss": 0.8584, "learning_rate": 1.1374334885180135e-05, "epoch": 0.6986794717887155, "percentage": 69.87, "elapsed_time": "19:35:52", "remaining_time": "8:27:07", "throughput": 1689.43, "total_tokens": 119193600} +{"current_steps": 14560, "total_steps": 20825, "loss": 0.9188, "learning_rate": 1.1341136746298647e-05, "epoch": 0.6991596638655462, "percentage": 69.92, "elapsed_time": "19:36:38", "remaining_time": "8:26:17", "throughput": 1689.49, "total_tokens": 119275520} +{"current_steps": 14570, "total_steps": 20825, "loss": 0.8331, "learning_rate": 1.1307972906919562e-05, "epoch": 0.699639855942377, "percentage": 69.96, "elapsed_time": "19:37:24", "remaining_time": "8:25:27", "throughput": 1689.56, "total_tokens": 119357440} +{"current_steps": 14580, "total_steps": 20825, "loss": 0.8539, "learning_rate": 1.1274843450322381e-05, "epoch": 0.7001200480192077, "percentage": 70.01, "elapsed_time": "19:38:09", "remaining_time": "8:24:38", "throughput": 1689.63, "total_tokens": 119439360} +{"current_steps": 14590, "total_steps": 20825, "loss": 0.8792, "learning_rate": 1.1241748459700241e-05, "epoch": 0.7006002400960384, "percentage": 70.06, "elapsed_time": "19:38:55", "remaining_time": "8:23:48", "throughput": 1689.7, "total_tokens": 119521280} +{"current_steps": 14600, "total_steps": 20825, "loss": 0.9642, "learning_rate": 1.1208688018159746e-05, "epoch": 0.7010804321728692, "percentage": 70.11, "elapsed_time": "19:39:40", "remaining_time": "8:22:58", "throughput": 1689.77, "total_tokens": 119603200} +{"current_steps": 14610, "total_steps": 20825, "loss": 1.0876, "learning_rate": 1.1175662208720758e-05, "epoch": 0.7015606242496999, "percentage": 70.16, "elapsed_time": "19:40:26", "remaining_time": "8:22:09", "throughput": 1689.84, "total_tokens": 119685120} +{"current_steps": 14620, "total_steps": 20825, "loss": 0.941, "learning_rate": 1.1142671114316127e-05, "epoch": 0.7020408163265306, "percentage": 70.2, "elapsed_time": "19:41:11", "remaining_time": "8:21:19", "throughput": 1689.91, "total_tokens": 119767040} +{"current_steps": 14630, "total_steps": 20825, "loss": 0.9637, "learning_rate": 1.1109714817791584e-05, "epoch": 0.7025210084033613, "percentage": 70.25, "elapsed_time": "19:41:57", "remaining_time": "8:20:29", "throughput": 1689.98, "total_tokens": 119848960} +{"current_steps": 14640, "total_steps": 20825, "loss": 0.8024, "learning_rate": 1.1076793401905419e-05, "epoch": 0.7030012004801921, "percentage": 70.3, "elapsed_time": "19:42:42", "remaining_time": "8:19:39", "throughput": 1690.05, "total_tokens": 119930880} +{"current_steps": 14650, "total_steps": 20825, "loss": 0.8844, "learning_rate": 1.1043906949328387e-05, "epoch": 0.7034813925570228, "percentage": 70.35, "elapsed_time": "19:43:28", "remaining_time": "8:18:50", "throughput": 1690.12, "total_tokens": 120012800} +{"current_steps": 14660, "total_steps": 20825, "loss": 0.8125, "learning_rate": 1.1011055542643398e-05, "epoch": 0.7039615846338535, "percentage": 70.4, "elapsed_time": "19:44:13", "remaining_time": "8:18:00", "throughput": 1690.19, "total_tokens": 120094720} +{"current_steps": 14670, "total_steps": 20825, "loss": 0.9473, "learning_rate": 1.0978239264345397e-05, "epoch": 0.7044417767106843, "percentage": 70.44, "elapsed_time": "19:44:59", "remaining_time": "8:17:10", "throughput": 1690.27, "total_tokens": 120176640} +{"current_steps": 14680, "total_steps": 20825, "loss": 0.9443, "learning_rate": 1.0945458196841078e-05, "epoch": 0.704921968787515, "percentage": 70.49, "elapsed_time": "19:45:44", "remaining_time": "8:16:21", "throughput": 1690.33, "total_tokens": 120258560} +{"current_steps": 14690, "total_steps": 20825, "loss": 1.0888, "learning_rate": 1.0912712422448737e-05, "epoch": 0.7054021608643457, "percentage": 70.54, "elapsed_time": "19:46:30", "remaining_time": "8:15:31", "throughput": 1690.4, "total_tokens": 120340480} +{"current_steps": 14700, "total_steps": 20825, "loss": 0.8219, "learning_rate": 1.0880002023398058e-05, "epoch": 0.7058823529411765, "percentage": 70.59, "elapsed_time": "19:47:15", "remaining_time": "8:14:41", "throughput": 1690.47, "total_tokens": 120422400} +{"current_steps": 14710, "total_steps": 20825, "loss": 0.8348, "learning_rate": 1.0847327081829853e-05, "epoch": 0.7063625450180072, "percentage": 70.64, "elapsed_time": "19:48:01", "remaining_time": "8:13:51", "throughput": 1690.55, "total_tokens": 120504320} +{"current_steps": 14720, "total_steps": 20825, "loss": 1.4222, "learning_rate": 1.0814687679795924e-05, "epoch": 0.7068427370948379, "percentage": 70.68, "elapsed_time": "19:48:47", "remaining_time": "8:13:02", "throughput": 1690.61, "total_tokens": 120586240} +{"current_steps": 14730, "total_steps": 20825, "loss": 0.9349, "learning_rate": 1.0782083899258827e-05, "epoch": 0.7073229291716686, "percentage": 70.73, "elapsed_time": "19:49:32", "remaining_time": "8:12:12", "throughput": 1690.67, "total_tokens": 120668160} +{"current_steps": 14740, "total_steps": 20825, "loss": 0.871, "learning_rate": 1.0749515822091658e-05, "epoch": 0.7078031212484994, "percentage": 70.78, "elapsed_time": "19:50:18", "remaining_time": "8:11:23", "throughput": 1690.74, "total_tokens": 120750080} +{"current_steps": 14750, "total_steps": 20825, "loss": 1.2482, "learning_rate": 1.0716983530077843e-05, "epoch": 0.7082833133253301, "percentage": 70.83, "elapsed_time": "19:51:04", "remaining_time": "8:10:33", "throughput": 1690.8, "total_tokens": 120832000} +{"current_steps": 14760, "total_steps": 20825, "loss": 0.7965, "learning_rate": 1.0684487104910974e-05, "epoch": 0.7087635054021608, "percentage": 70.88, "elapsed_time": "19:51:49", "remaining_time": "8:09:43", "throughput": 1690.87, "total_tokens": 120913920} +{"current_steps": 14770, "total_steps": 20825, "loss": 0.8365, "learning_rate": 1.0652026628194567e-05, "epoch": 0.7092436974789916, "percentage": 70.92, "elapsed_time": "19:52:35", "remaining_time": "8:08:54", "throughput": 1690.93, "total_tokens": 120995840} +{"current_steps": 14780, "total_steps": 20825, "loss": 0.8743, "learning_rate": 1.0619602181441848e-05, "epoch": 0.7097238895558223, "percentage": 70.97, "elapsed_time": "19:53:21", "remaining_time": "8:08:04", "throughput": 1691.0, "total_tokens": 121077760} +{"current_steps": 14790, "total_steps": 20825, "loss": 0.7954, "learning_rate": 1.0587213846075591e-05, "epoch": 0.710204081632653, "percentage": 71.02, "elapsed_time": "19:54:06", "remaining_time": "8:07:15", "throughput": 1691.07, "total_tokens": 121159680} +{"current_steps": 14800, "total_steps": 20825, "loss": 0.9451, "learning_rate": 1.0554861703427884e-05, "epoch": 0.7106842737094838, "percentage": 71.07, "elapsed_time": "19:54:52", "remaining_time": "8:06:25", "throughput": 1691.13, "total_tokens": 121241600} +{"current_steps": 14810, "total_steps": 20825, "loss": 1.0584, "learning_rate": 1.0522545834739908e-05, "epoch": 0.7111644657863145, "percentage": 71.12, "elapsed_time": "19:55:38", "remaining_time": "8:05:36", "throughput": 1691.19, "total_tokens": 121323520} +{"current_steps": 14820, "total_steps": 20825, "loss": 0.9405, "learning_rate": 1.0490266321161785e-05, "epoch": 0.7116446578631452, "percentage": 71.16, "elapsed_time": "19:56:24", "remaining_time": "8:04:46", "throughput": 1691.25, "total_tokens": 121405440} +{"current_steps": 14830, "total_steps": 20825, "loss": 0.9526, "learning_rate": 1.0458023243752321e-05, "epoch": 0.712124849939976, "percentage": 71.21, "elapsed_time": "19:57:09", "remaining_time": "8:03:57", "throughput": 1691.32, "total_tokens": 121487360} +{"current_steps": 14840, "total_steps": 20825, "loss": 1.1452, "learning_rate": 1.0425816683478823e-05, "epoch": 0.7126050420168067, "percentage": 71.26, "elapsed_time": "19:57:55", "remaining_time": "8:03:07", "throughput": 1691.38, "total_tokens": 121569280} +{"current_steps": 14850, "total_steps": 20825, "loss": 0.9537, "learning_rate": 1.039364672121692e-05, "epoch": 0.7130852340936374, "percentage": 71.31, "elapsed_time": "19:58:41", "remaining_time": "8:02:18", "throughput": 1691.45, "total_tokens": 121651200} +{"current_steps": 14860, "total_steps": 20825, "loss": 1.0094, "learning_rate": 1.0361513437750333e-05, "epoch": 0.7135654261704681, "percentage": 71.36, "elapsed_time": "19:59:26", "remaining_time": "8:01:28", "throughput": 1691.52, "total_tokens": 121733120} +{"current_steps": 14870, "total_steps": 20825, "loss": 0.8121, "learning_rate": 1.0329416913770651e-05, "epoch": 0.714045618247299, "percentage": 71.4, "elapsed_time": "20:00:12", "remaining_time": "8:00:39", "throughput": 1691.57, "total_tokens": 121815040} +{"current_steps": 14880, "total_steps": 20825, "loss": 0.8583, "learning_rate": 1.0297357229877183e-05, "epoch": 0.7145258103241297, "percentage": 71.45, "elapsed_time": "20:00:58", "remaining_time": "7:59:49", "throughput": 1691.64, "total_tokens": 121896960} +{"current_steps": 14890, "total_steps": 20825, "loss": 0.9234, "learning_rate": 1.0265334466576723e-05, "epoch": 0.7150060024009603, "percentage": 71.5, "elapsed_time": "20:01:44", "remaining_time": "7:59:00", "throughput": 1691.7, "total_tokens": 121978880} +{"current_steps": 14900, "total_steps": 20825, "loss": 0.7661, "learning_rate": 1.0233348704283332e-05, "epoch": 0.7154861944777912, "percentage": 71.55, "elapsed_time": "20:02:30", "remaining_time": "7:58:10", "throughput": 1691.76, "total_tokens": 122060800} +{"current_steps": 14910, "total_steps": 20825, "loss": 0.8836, "learning_rate": 1.0201400023318184e-05, "epoch": 0.7159663865546219, "percentage": 71.6, "elapsed_time": "20:03:15", "remaining_time": "7:57:20", "throughput": 1691.83, "total_tokens": 122142720} +{"current_steps": 14920, "total_steps": 20825, "loss": 0.9656, "learning_rate": 1.0169488503909313e-05, "epoch": 0.7164465786314526, "percentage": 71.64, "elapsed_time": "20:04:01", "remaining_time": "7:56:31", "throughput": 1691.9, "total_tokens": 122224640} +{"current_steps": 14930, "total_steps": 20825, "loss": 1.1411, "learning_rate": 1.0137614226191434e-05, "epoch": 0.7169267707082834, "percentage": 71.69, "elapsed_time": "20:04:46", "remaining_time": "7:55:41", "throughput": 1691.96, "total_tokens": 122306560} +{"current_steps": 14940, "total_steps": 20825, "loss": 1.0296, "learning_rate": 1.010577727020576e-05, "epoch": 0.7174069627851141, "percentage": 71.74, "elapsed_time": "20:05:32", "remaining_time": "7:54:52", "throughput": 1692.02, "total_tokens": 122388480} +{"current_steps": 14950, "total_steps": 20825, "loss": 1.0557, "learning_rate": 1.0073977715899785e-05, "epoch": 0.7178871548619448, "percentage": 71.79, "elapsed_time": "20:06:17", "remaining_time": "7:54:02", "throughput": 1692.09, "total_tokens": 122470400} +{"current_steps": 14960, "total_steps": 20825, "loss": 0.857, "learning_rate": 1.0042215643127051e-05, "epoch": 0.7183673469387755, "percentage": 71.84, "elapsed_time": "20:07:03", "remaining_time": "7:53:13", "throughput": 1692.16, "total_tokens": 122552320} +{"current_steps": 14970, "total_steps": 20825, "loss": 0.9649, "learning_rate": 1.0010491131647013e-05, "epoch": 0.7188475390156063, "percentage": 71.88, "elapsed_time": "20:07:48", "remaining_time": "7:52:23", "throughput": 1692.23, "total_tokens": 122634240} +{"current_steps": 14980, "total_steps": 20825, "loss": 1.0374, "learning_rate": 9.978804261124792e-06, "epoch": 0.719327731092437, "percentage": 71.93, "elapsed_time": "20:08:35", "remaining_time": "7:51:34", "throughput": 1692.28, "total_tokens": 122716160} +{"current_steps": 14990, "total_steps": 20825, "loss": 0.8151, "learning_rate": 9.947155111130969e-06, "epoch": 0.7198079231692677, "percentage": 71.98, "elapsed_time": "20:09:20", "remaining_time": "7:50:44", "throughput": 1692.35, "total_tokens": 122798080} +{"current_steps": 15000, "total_steps": 20825, "loss": 0.9461, "learning_rate": 9.915543761141432e-06, "epoch": 0.7202881152460985, "percentage": 72.03, "elapsed_time": "20:10:06", "remaining_time": "7:49:55", "throughput": 1692.42, "total_tokens": 122880000} +{"current_steps": 15010, "total_steps": 20825, "loss": 0.7584, "learning_rate": 9.883970290537134e-06, "epoch": 0.7207683073229292, "percentage": 72.08, "elapsed_time": "20:10:55", "remaining_time": "7:49:07", "throughput": 1692.4, "total_tokens": 122961920} +{"current_steps": 15020, "total_steps": 20825, "loss": 0.9356, "learning_rate": 9.852434778603888e-06, "epoch": 0.7212484993997599, "percentage": 72.12, "elapsed_time": "20:11:40", "remaining_time": "7:48:17", "throughput": 1692.47, "total_tokens": 123043840} +{"current_steps": 15030, "total_steps": 20825, "loss": 0.821, "learning_rate": 9.820937304532221e-06, "epoch": 0.7217286914765907, "percentage": 72.17, "elapsed_time": "20:12:26", "remaining_time": "7:47:28", "throughput": 1692.53, "total_tokens": 123125760} +{"current_steps": 15040, "total_steps": 20825, "loss": 1.0243, "learning_rate": 9.789477947417131e-06, "epoch": 0.7222088835534214, "percentage": 72.22, "elapsed_time": "20:13:12", "remaining_time": "7:46:39", "throughput": 1692.58, "total_tokens": 123207680} +{"current_steps": 15050, "total_steps": 20825, "loss": 0.8123, "learning_rate": 9.758056786257874e-06, "epoch": 0.7226890756302521, "percentage": 72.27, "elapsed_time": "20:13:58", "remaining_time": "7:45:49", "throughput": 1692.64, "total_tokens": 123289600} +{"current_steps": 15060, "total_steps": 20825, "loss": 0.9684, "learning_rate": 9.726673899957823e-06, "epoch": 0.7231692677070828, "percentage": 72.32, "elapsed_time": "20:14:44", "remaining_time": "7:45:00", "throughput": 1692.7, "total_tokens": 123371520} +{"current_steps": 15070, "total_steps": 20825, "loss": 0.8307, "learning_rate": 9.695329367324226e-06, "epoch": 0.7236494597839136, "percentage": 72.36, "elapsed_time": "20:15:29", "remaining_time": "7:44:10", "throughput": 1692.77, "total_tokens": 123453440} +{"current_steps": 15080, "total_steps": 20825, "loss": 0.7508, "learning_rate": 9.664023267068007e-06, "epoch": 0.7241296518607443, "percentage": 72.41, "elapsed_time": "20:16:15", "remaining_time": "7:43:21", "throughput": 1692.84, "total_tokens": 123535360} +{"current_steps": 15090, "total_steps": 20825, "loss": 0.9069, "learning_rate": 9.632755677803595e-06, "epoch": 0.724609843937575, "percentage": 72.46, "elapsed_time": "20:17:00", "remaining_time": "7:42:31", "throughput": 1692.91, "total_tokens": 123617280} +{"current_steps": 15100, "total_steps": 20825, "loss": 0.9597, "learning_rate": 9.601526678048701e-06, "epoch": 0.7250900360144058, "percentage": 72.51, "elapsed_time": "20:17:46", "remaining_time": "7:41:42", "throughput": 1692.98, "total_tokens": 123699200} +{"current_steps": 15110, "total_steps": 20825, "loss": 0.8658, "learning_rate": 9.570336346224145e-06, "epoch": 0.7255702280912365, "percentage": 72.56, "elapsed_time": "20:18:31", "remaining_time": "7:40:52", "throughput": 1693.04, "total_tokens": 123781120} +{"current_steps": 15120, "total_steps": 20825, "loss": 0.9606, "learning_rate": 9.53918476065363e-06, "epoch": 0.7260504201680672, "percentage": 72.61, "elapsed_time": "20:19:17", "remaining_time": "7:40:03", "throughput": 1693.11, "total_tokens": 123863040} +{"current_steps": 15130, "total_steps": 20825, "loss": 0.8755, "learning_rate": 9.508071999563578e-06, "epoch": 0.726530612244898, "percentage": 72.65, "elapsed_time": "20:20:03", "remaining_time": "7:39:13", "throughput": 1693.17, "total_tokens": 123944960} +{"current_steps": 15140, "total_steps": 20825, "loss": 0.8532, "learning_rate": 9.476998141082896e-06, "epoch": 0.7270108043217287, "percentage": 72.7, "elapsed_time": "20:20:48", "remaining_time": "7:38:24", "throughput": 1693.23, "total_tokens": 124026880} +{"current_steps": 15150, "total_steps": 20825, "loss": 0.8118, "learning_rate": 9.445963263242822e-06, "epoch": 0.7274909963985594, "percentage": 72.75, "elapsed_time": "20:21:34", "remaining_time": "7:37:35", "throughput": 1693.29, "total_tokens": 124108800} +{"current_steps": 15160, "total_steps": 20825, "loss": 0.8174, "learning_rate": 9.414967443976705e-06, "epoch": 0.7279711884753901, "percentage": 72.8, "elapsed_time": "20:22:20", "remaining_time": "7:36:45", "throughput": 1693.35, "total_tokens": 124190720} +{"current_steps": 15170, "total_steps": 20825, "loss": 0.7558, "learning_rate": 9.384010761119787e-06, "epoch": 0.7284513805522209, "percentage": 72.85, "elapsed_time": "20:23:05", "remaining_time": "7:35:56", "throughput": 1693.41, "total_tokens": 124272640} +{"current_steps": 15180, "total_steps": 20825, "loss": 1.0988, "learning_rate": 9.353093292409063e-06, "epoch": 0.7289315726290516, "percentage": 72.89, "elapsed_time": "20:23:51", "remaining_time": "7:35:06", "throughput": 1693.48, "total_tokens": 124354560} +{"current_steps": 15190, "total_steps": 20825, "loss": 0.9021, "learning_rate": 9.322215115483049e-06, "epoch": 0.7294117647058823, "percentage": 72.94, "elapsed_time": "20:24:36", "remaining_time": "7:34:17", "throughput": 1693.55, "total_tokens": 124436480} +{"current_steps": 15200, "total_steps": 20825, "loss": 0.7027, "learning_rate": 9.291376307881577e-06, "epoch": 0.7298919567827131, "percentage": 72.99, "elapsed_time": "20:25:22", "remaining_time": "7:33:28", "throughput": 1693.61, "total_tokens": 124518400} +{"current_steps": 15210, "total_steps": 20825, "loss": 0.7578, "learning_rate": 9.260576947045624e-06, "epoch": 0.7303721488595438, "percentage": 73.04, "elapsed_time": "20:26:08", "remaining_time": "7:32:38", "throughput": 1693.67, "total_tokens": 124600320} +{"current_steps": 15220, "total_steps": 20825, "loss": 0.8909, "learning_rate": 9.229817110317126e-06, "epoch": 0.7308523409363745, "percentage": 73.09, "elapsed_time": "20:26:53", "remaining_time": "7:31:49", "throughput": 1693.73, "total_tokens": 124682240} +{"current_steps": 15230, "total_steps": 20825, "loss": 0.8751, "learning_rate": 9.19909687493874e-06, "epoch": 0.7313325330132053, "percentage": 73.13, "elapsed_time": "20:27:39", "remaining_time": "7:30:59", "throughput": 1693.8, "total_tokens": 124764160} +{"current_steps": 15240, "total_steps": 20825, "loss": 0.7469, "learning_rate": 9.168416318053701e-06, "epoch": 0.731812725090036, "percentage": 73.18, "elapsed_time": "20:28:24", "remaining_time": "7:30:10", "throughput": 1693.86, "total_tokens": 124846080} +{"current_steps": 15250, "total_steps": 20825, "loss": 0.7833, "learning_rate": 9.137775516705604e-06, "epoch": 0.7322929171668667, "percentage": 73.23, "elapsed_time": "20:29:10", "remaining_time": "7:29:21", "throughput": 1693.93, "total_tokens": 124928000} +{"current_steps": 15260, "total_steps": 20825, "loss": 0.9773, "learning_rate": 9.107174547838188e-06, "epoch": 0.7327731092436974, "percentage": 73.28, "elapsed_time": "20:29:55", "remaining_time": "7:28:31", "throughput": 1694.0, "total_tokens": 125009920} +{"current_steps": 15270, "total_steps": 20825, "loss": 0.9884, "learning_rate": 9.076613488295193e-06, "epoch": 0.7332533013205282, "percentage": 73.33, "elapsed_time": "20:30:41", "remaining_time": "7:27:42", "throughput": 1694.06, "total_tokens": 125091840} +{"current_steps": 15280, "total_steps": 20825, "loss": 0.916, "learning_rate": 9.04609241482014e-06, "epoch": 0.7337334933973589, "percentage": 73.37, "elapsed_time": "20:31:27", "remaining_time": "7:26:53", "throughput": 1694.12, "total_tokens": 125173760} +{"current_steps": 15290, "total_steps": 20825, "loss": 0.945, "learning_rate": 9.015611404056121e-06, "epoch": 0.7342136854741896, "percentage": 73.42, "elapsed_time": "20:32:13", "remaining_time": "7:26:03", "throughput": 1694.18, "total_tokens": 125255680} +{"current_steps": 15300, "total_steps": 20825, "loss": 0.9736, "learning_rate": 8.985170532545622e-06, "epoch": 0.7346938775510204, "percentage": 73.47, "elapsed_time": "20:32:58", "remaining_time": "7:25:14", "throughput": 1694.24, "total_tokens": 125337600} +{"current_steps": 15310, "total_steps": 20825, "loss": 1.0286, "learning_rate": 8.954769876730368e-06, "epoch": 0.7351740696278511, "percentage": 73.52, "elapsed_time": "20:33:44", "remaining_time": "7:24:25", "throughput": 1694.3, "total_tokens": 125419520} +{"current_steps": 15320, "total_steps": 20825, "loss": 0.8448, "learning_rate": 8.924409512951045e-06, "epoch": 0.7356542617046818, "percentage": 73.57, "elapsed_time": "20:34:29", "remaining_time": "7:23:35", "throughput": 1694.37, "total_tokens": 125501440} +{"current_steps": 15330, "total_steps": 20825, "loss": 1.0115, "learning_rate": 8.894089517447206e-06, "epoch": 0.7361344537815127, "percentage": 73.61, "elapsed_time": "20:35:15", "remaining_time": "7:22:46", "throughput": 1694.43, "total_tokens": 125583360} +{"current_steps": 15340, "total_steps": 20825, "loss": 0.9291, "learning_rate": 8.863809966357017e-06, "epoch": 0.7366146458583434, "percentage": 73.66, "elapsed_time": "20:36:00", "remaining_time": "7:21:57", "throughput": 1694.5, "total_tokens": 125665280} +{"current_steps": 15350, "total_steps": 20825, "loss": 0.8129, "learning_rate": 8.833570935717064e-06, "epoch": 0.737094837935174, "percentage": 73.71, "elapsed_time": "20:36:46", "remaining_time": "7:21:07", "throughput": 1694.56, "total_tokens": 125747200} +{"current_steps": 15360, "total_steps": 20825, "loss": 0.8452, "learning_rate": 8.803372501462203e-06, "epoch": 0.7375750300120048, "percentage": 73.76, "elapsed_time": "20:37:32", "remaining_time": "7:20:18", "throughput": 1694.62, "total_tokens": 125829120} +{"current_steps": 15370, "total_steps": 20825, "loss": 0.7171, "learning_rate": 8.773214739425346e-06, "epoch": 0.7380552220888356, "percentage": 73.81, "elapsed_time": "20:38:18", "remaining_time": "7:19:29", "throughput": 1694.67, "total_tokens": 125911040} +{"current_steps": 15380, "total_steps": 20825, "loss": 0.5982, "learning_rate": 8.743097725337255e-06, "epoch": 0.7385354141656663, "percentage": 73.85, "elapsed_time": "20:39:04", "remaining_time": "7:18:40", "throughput": 1694.72, "total_tokens": 125992960} +{"current_steps": 15390, "total_steps": 20825, "loss": 0.8511, "learning_rate": 8.713021534826366e-06, "epoch": 0.739015606242497, "percentage": 73.9, "elapsed_time": "20:39:50", "remaining_time": "7:17:50", "throughput": 1694.78, "total_tokens": 126074880} +{"current_steps": 15400, "total_steps": 20825, "loss": 1.0259, "learning_rate": 8.68298624341862e-06, "epoch": 0.7394957983193278, "percentage": 73.95, "elapsed_time": "20:40:35", "remaining_time": "7:17:01", "throughput": 1694.84, "total_tokens": 126156800} +{"current_steps": 15410, "total_steps": 20825, "loss": 0.9125, "learning_rate": 8.652991926537254e-06, "epoch": 0.7399759903961585, "percentage": 74.0, "elapsed_time": "20:41:21", "remaining_time": "7:16:12", "throughput": 1694.91, "total_tokens": 126238720} +{"current_steps": 15420, "total_steps": 20825, "loss": 0.9149, "learning_rate": 8.623038659502583e-06, "epoch": 0.7404561824729892, "percentage": 74.05, "elapsed_time": "20:42:07", "remaining_time": "7:15:23", "throughput": 1694.96, "total_tokens": 126320640} +{"current_steps": 15430, "total_steps": 20825, "loss": 0.7081, "learning_rate": 8.59312651753187e-06, "epoch": 0.74093637454982, "percentage": 74.09, "elapsed_time": "20:42:52", "remaining_time": "7:14:33", "throughput": 1695.02, "total_tokens": 126402560} +{"current_steps": 15440, "total_steps": 20825, "loss": 0.9284, "learning_rate": 8.5632555757391e-06, "epoch": 0.7414165666266507, "percentage": 74.14, "elapsed_time": "20:43:38", "remaining_time": "7:13:44", "throughput": 1695.07, "total_tokens": 126484480} +{"current_steps": 15450, "total_steps": 20825, "loss": 0.8449, "learning_rate": 8.53342590913478e-06, "epoch": 0.7418967587034814, "percentage": 74.19, "elapsed_time": "20:44:24", "remaining_time": "7:12:55", "throughput": 1695.14, "total_tokens": 126566400} +{"current_steps": 15460, "total_steps": 20825, "loss": 0.8641, "learning_rate": 8.503637592625796e-06, "epoch": 0.7423769507803121, "percentage": 74.24, "elapsed_time": "20:45:09", "remaining_time": "7:12:06", "throughput": 1695.21, "total_tokens": 126648320} +{"current_steps": 15470, "total_steps": 20825, "loss": 0.9529, "learning_rate": 8.473890701015177e-06, "epoch": 0.7428571428571429, "percentage": 74.29, "elapsed_time": "20:45:55", "remaining_time": "7:11:16", "throughput": 1695.27, "total_tokens": 126730240} +{"current_steps": 15480, "total_steps": 20825, "loss": 1.0765, "learning_rate": 8.444185309001926e-06, "epoch": 0.7433373349339736, "percentage": 74.33, "elapsed_time": "20:46:41", "remaining_time": "7:10:27", "throughput": 1695.32, "total_tokens": 126812160} +{"current_steps": 15490, "total_steps": 20825, "loss": 0.7986, "learning_rate": 8.41452149118085e-06, "epoch": 0.7438175270108043, "percentage": 74.38, "elapsed_time": "20:47:27", "remaining_time": "7:09:38", "throughput": 1695.37, "total_tokens": 126894080} +{"current_steps": 15500, "total_steps": 20825, "loss": 0.8623, "learning_rate": 8.384899322042356e-06, "epoch": 0.7442977190876351, "percentage": 74.43, "elapsed_time": "20:48:12", "remaining_time": "7:08:49", "throughput": 1695.44, "total_tokens": 126976000} +{"current_steps": 15510, "total_steps": 20825, "loss": 0.8208, "learning_rate": 8.355318875972243e-06, "epoch": 0.7447779111644658, "percentage": 74.48, "elapsed_time": "20:48:58", "remaining_time": "7:08:00", "throughput": 1695.5, "total_tokens": 127057920} +{"current_steps": 15520, "total_steps": 20825, "loss": 0.7385, "learning_rate": 8.325780227251562e-06, "epoch": 0.7452581032412965, "percentage": 74.53, "elapsed_time": "20:49:43", "remaining_time": "7:07:10", "throughput": 1695.56, "total_tokens": 127139840} +{"current_steps": 15530, "total_steps": 20825, "loss": 0.9799, "learning_rate": 8.2962834500564e-06, "epoch": 0.7457382953181273, "percentage": 74.57, "elapsed_time": "20:50:29", "remaining_time": "7:06:21", "throughput": 1695.62, "total_tokens": 127221760} +{"current_steps": 15540, "total_steps": 20825, "loss": 0.9194, "learning_rate": 8.266828618457678e-06, "epoch": 0.746218487394958, "percentage": 74.62, "elapsed_time": "20:51:14", "remaining_time": "7:05:32", "throughput": 1695.69, "total_tokens": 127303680} +{"current_steps": 15550, "total_steps": 20825, "loss": 1.1017, "learning_rate": 8.237415806421015e-06, "epoch": 0.7466986794717887, "percentage": 74.67, "elapsed_time": "20:52:00", "remaining_time": "7:04:42", "throughput": 1695.75, "total_tokens": 127385600} +{"current_steps": 15560, "total_steps": 20825, "loss": 0.7884, "learning_rate": 8.20804508780648e-06, "epoch": 0.7471788715486194, "percentage": 74.72, "elapsed_time": "20:52:46", "remaining_time": "7:03:53", "throughput": 1695.81, "total_tokens": 127467520} +{"current_steps": 15570, "total_steps": 20825, "loss": 1.0092, "learning_rate": 8.178716536368475e-06, "epoch": 0.7476590636254502, "percentage": 74.77, "elapsed_time": "20:53:31", "remaining_time": "7:03:04", "throughput": 1695.88, "total_tokens": 127549440} +{"current_steps": 15580, "total_steps": 20825, "loss": 0.9778, "learning_rate": 8.149430225755476e-06, "epoch": 0.7481392557022809, "percentage": 74.81, "elapsed_time": "20:54:17", "remaining_time": "7:02:15", "throughput": 1695.93, "total_tokens": 127631360} +{"current_steps": 15590, "total_steps": 20825, "loss": 0.8936, "learning_rate": 8.120186229509922e-06, "epoch": 0.7486194477791116, "percentage": 74.86, "elapsed_time": "20:55:02", "remaining_time": "7:01:26", "throughput": 1696.0, "total_tokens": 127713280} +{"current_steps": 15600, "total_steps": 20825, "loss": 1.0426, "learning_rate": 8.090984621067963e-06, "epoch": 0.7490996398559424, "percentage": 74.91, "elapsed_time": "20:55:48", "remaining_time": "7:00:36", "throughput": 1696.06, "total_tokens": 127795200} +{"current_steps": 15610, "total_steps": 20825, "loss": 0.8386, "learning_rate": 8.061825473759324e-06, "epoch": 0.7495798319327731, "percentage": 74.96, "elapsed_time": "20:56:34", "remaining_time": "6:59:47", "throughput": 1696.12, "total_tokens": 127877120} +{"current_steps": 15010, "total_steps": 20825, "loss": 0.7584, "learning_rate": 9.883970290537134e-06, "epoch": 0.7207683073229292, "percentage": 72.08, "elapsed_time": "0:00:51", "remaining_time": "0:00:20", "throughput": 2369202.75, "total_tokens": 122961920} +{"current_steps": 15020, "total_steps": 20825, "loss": 0.9357, "learning_rate": 9.852434778603888e-06, "epoch": 0.7212484993997599, "percentage": 72.12, "elapsed_time": "0:01:37", "remaining_time": "0:00:37", "throughput": 1264082.75, "total_tokens": 123043840} +{"current_steps": 15030, "total_steps": 20825, "loss": 0.8206, "learning_rate": 9.820937304532221e-06, "epoch": 0.7217286914765907, "percentage": 72.17, "elapsed_time": "0:02:22", "remaining_time": "0:00:55", "throughput": 861368.75, "total_tokens": 123125760} +{"current_steps": 15040, "total_steps": 20825, "loss": 1.0253, "learning_rate": 9.789477947417131e-06, "epoch": 0.7222088835534214, "percentage": 72.22, "elapsed_time": "0:03:08", "remaining_time": "0:01:12", "throughput": 652031.63, "total_tokens": 123207680} +{"current_steps": 15050, "total_steps": 20825, "loss": 0.8122, "learning_rate": 9.758056786257874e-06, "epoch": 0.7226890756302521, "percentage": 72.27, "elapsed_time": "0:03:54", "remaining_time": "0:01:30", "throughput": 524936.53, "total_tokens": 123289600} +{"current_steps": 15060, "total_steps": 20825, "loss": 0.9684, "learning_rate": 9.726673899957823e-06, "epoch": 0.7231692677070828, "percentage": 72.32, "elapsed_time": "0:04:40", "remaining_time": "0:01:47", "throughput": 440232.85, "total_tokens": 123371520} +{"current_steps": 15070, "total_steps": 20825, "loss": 0.8309, "learning_rate": 9.695329367324226e-06, "epoch": 0.7236494597839136, "percentage": 72.36, "elapsed_time": "0:05:25", "remaining_time": "0:02:04", "throughput": 379027.39, "total_tokens": 123453440} +{"current_steps": 15080, "total_steps": 20825, "loss": 0.7509, "learning_rate": 9.664023267068007e-06, "epoch": 0.7241296518607443, "percentage": 72.41, "elapsed_time": "0:06:10", "remaining_time": "0:02:21", "throughput": 332999.27, "total_tokens": 123535360} +{"current_steps": 15090, "total_steps": 20825, "loss": 0.9072, "learning_rate": 9.632755677803595e-06, "epoch": 0.724609843937575, "percentage": 72.46, "elapsed_time": "0:06:56", "remaining_time": "0:02:38", "throughput": 296988.59, "total_tokens": 123617280} +{"current_steps": 15100, "total_steps": 20825, "loss": 0.9596, "learning_rate": 9.601526678048701e-06, "epoch": 0.7250900360144058, "percentage": 72.51, "elapsed_time": "0:07:41", "remaining_time": "0:02:54", "throughput": 268067.63, "total_tokens": 123699200} +{"current_steps": 15110, "total_steps": 20825, "loss": 0.8658, "learning_rate": 9.570336346224145e-06, "epoch": 0.7255702280912365, "percentage": 72.56, "elapsed_time": "0:08:26", "remaining_time": "0:03:11", "throughput": 244207.17, "total_tokens": 123781120} +{"current_steps": 15120, "total_steps": 20825, "loss": 0.9609, "learning_rate": 9.53918476065363e-06, "epoch": 0.7260504201680672, "percentage": 72.61, "elapsed_time": "0:09:12", "remaining_time": "0:03:28", "throughput": 224300.55, "total_tokens": 123863040} +{"current_steps": 15130, "total_steps": 20825, "loss": 0.8759, "learning_rate": 9.508071999563578e-06, "epoch": 0.726530612244898, "percentage": 72.65, "elapsed_time": "0:09:58", "remaining_time": "0:03:45", "throughput": 207258.87, "total_tokens": 123944960} +{"current_steps": 15140, "total_steps": 20825, "loss": 0.8535, "learning_rate": 9.476998141082896e-06, "epoch": 0.7270108043217287, "percentage": 72.7, "elapsed_time": "0:10:43", "remaining_time": "0:04:01", "throughput": 192726.73, "total_tokens": 124026880} +{"current_steps": 15150, "total_steps": 20825, "loss": 0.8117, "learning_rate": 9.445963263242822e-06, "epoch": 0.7274909963985594, "percentage": 72.75, "elapsed_time": "0:11:29", "remaining_time": "0:04:18", "throughput": 180093.35, "total_tokens": 124108800} +{"current_steps": 15160, "total_steps": 20825, "loss": 0.8172, "learning_rate": 9.414967443976705e-06, "epoch": 0.7279711884753901, "percentage": 72.8, "elapsed_time": "0:12:14", "remaining_time": "0:04:34", "throughput": 169029.7, "total_tokens": 124190720} +{"current_steps": 15170, "total_steps": 20825, "loss": 0.7557, "learning_rate": 9.384010761119787e-06, "epoch": 0.7284513805522209, "percentage": 72.85, "elapsed_time": "0:13:00", "remaining_time": "0:04:50", "throughput": 159252.01, "total_tokens": 124272640} +{"current_steps": 15180, "total_steps": 20825, "loss": 1.0988, "learning_rate": 9.353093292409063e-06, "epoch": 0.7289315726290516, "percentage": 72.89, "elapsed_time": "0:13:45", "remaining_time": "0:05:07", "throughput": 150604.84, "total_tokens": 124354560} +{"current_steps": 15190, "total_steps": 20825, "loss": 0.9023, "learning_rate": 9.322215115483049e-06, "epoch": 0.7294117647058823, "percentage": 72.94, "elapsed_time": "0:14:31", "remaining_time": "0:05:23", "throughput": 142863.05, "total_tokens": 124436480} +{"current_steps": 15200, "total_steps": 20825, "loss": 0.7027, "learning_rate": 9.291376307881577e-06, "epoch": 0.7298919567827131, "percentage": 72.99, "elapsed_time": "0:15:16", "remaining_time": "0:05:39", "throughput": 135855.5, "total_tokens": 124518400} +{"current_steps": 15210, "total_steps": 20825, "loss": 0.7578, "learning_rate": 9.260576947045624e-06, "epoch": 0.7303721488595438, "percentage": 73.04, "elapsed_time": "0:16:02", "remaining_time": "0:05:55", "throughput": 129492.68, "total_tokens": 124600320} +{"current_steps": 15220, "total_steps": 20825, "loss": 0.8909, "learning_rate": 9.229817110317126e-06, "epoch": 0.7308523409363745, "percentage": 73.09, "elapsed_time": "0:16:47", "remaining_time": "0:06:11", "throughput": 123733.21, "total_tokens": 124682240} +{"current_steps": 15230, "total_steps": 20825, "loss": 0.8752, "learning_rate": 9.19909687493874e-06, "epoch": 0.7313325330132053, "percentage": 73.13, "elapsed_time": "0:17:32", "remaining_time": "0:06:26", "throughput": 118494.47, "total_tokens": 124764160} +{"current_steps": 15240, "total_steps": 20825, "loss": 0.7467, "learning_rate": 9.168416318053701e-06, "epoch": 0.731812725090036, "percentage": 73.18, "elapsed_time": "0:18:18", "remaining_time": "0:06:42", "throughput": 113655.92, "total_tokens": 124846080} +{"current_steps": 15250, "total_steps": 20825, "loss": 0.7833, "learning_rate": 9.137775516705604e-06, "epoch": 0.7322929171668667, "percentage": 73.23, "elapsed_time": "0:19:03", "remaining_time": "0:06:58", "throughput": 109231.0, "total_tokens": 124928000} +{"current_steps": 15260, "total_steps": 20825, "loss": 0.9774, "learning_rate": 9.107174547838188e-06, "epoch": 0.7327731092436974, "percentage": 73.28, "elapsed_time": "0:19:49", "remaining_time": "0:07:13", "throughput": 105124.64, "total_tokens": 125009920} +{"current_steps": 15270, "total_steps": 20825, "loss": 0.9886, "learning_rate": 9.076613488295193e-06, "epoch": 0.7332533013205282, "percentage": 73.33, "elapsed_time": "0:20:34", "remaining_time": "0:07:29", "throughput": 101291.18, "total_tokens": 125091840} +{"current_steps": 15280, "total_steps": 20825, "loss": 0.9161, "learning_rate": 9.04609241482014e-06, "epoch": 0.7337334933973589, "percentage": 73.37, "elapsed_time": "0:21:20", "remaining_time": "0:07:44", "throughput": 97757.55, "total_tokens": 125173760} +{"current_steps": 15290, "total_steps": 20825, "loss": 0.9453, "learning_rate": 9.015611404056121e-06, "epoch": 0.7342136854741896, "percentage": 73.42, "elapsed_time": "0:22:05", "remaining_time": "0:07:59", "throughput": 94468.19, "total_tokens": 125255680} +{"current_steps": 15300, "total_steps": 20825, "loss": 0.9736, "learning_rate": 8.985170532545622e-06, "epoch": 0.7346938775510204, "percentage": 73.47, "elapsed_time": "0:22:51", "remaining_time": "0:08:15", "throughput": 91389.37, "total_tokens": 125337600} +{"current_steps": 15310, "total_steps": 20825, "loss": 1.0289, "learning_rate": 8.954769876730368e-06, "epoch": 0.7351740696278511, "percentage": 73.52, "elapsed_time": "0:23:36", "remaining_time": "0:08:30", "throughput": 88532.0, "total_tokens": 125419520} +{"current_steps": 15320, "total_steps": 20825, "loss": 0.8446, "learning_rate": 8.924409512951045e-06, "epoch": 0.7356542617046818, "percentage": 73.57, "elapsed_time": "0:24:21", "remaining_time": "0:08:45", "throughput": 85847.7, "total_tokens": 125501440} +{"current_steps": 15330, "total_steps": 20825, "loss": 1.0116, "learning_rate": 8.894089517447206e-06, "epoch": 0.7361344537815127, "percentage": 73.61, "elapsed_time": "0:25:07", "remaining_time": "0:09:00", "throughput": 83313.65, "total_tokens": 125583360} +{"current_steps": 15340, "total_steps": 20825, "loss": 0.9291, "learning_rate": 8.863809966357017e-06, "epoch": 0.7366146458583434, "percentage": 73.66, "elapsed_time": "0:25:52", "remaining_time": "0:09:15", "throughput": 80937.9, "total_tokens": 125665280} +{"current_steps": 15350, "total_steps": 20825, "loss": 0.8133, "learning_rate": 8.833570935717064e-06, "epoch": 0.737094837935174, "percentage": 73.71, "elapsed_time": "0:26:38", "remaining_time": "0:09:30", "throughput": 78675.72, "total_tokens": 125747200} +{"current_steps": 15360, "total_steps": 20825, "loss": 0.845, "learning_rate": 8.803372501462203e-06, "epoch": 0.7375750300120048, "percentage": 73.76, "elapsed_time": "0:27:23", "remaining_time": "0:09:44", "throughput": 76558.16, "total_tokens": 125829120} +{"current_steps": 15370, "total_steps": 20825, "loss": 0.7169, "learning_rate": 8.773214739425346e-06, "epoch": 0.7380552220888356, "percentage": 73.81, "elapsed_time": "0:28:09", "remaining_time": "0:09:59", "throughput": 74519.92, "total_tokens": 125911040} +{"current_steps": 15380, "total_steps": 20825, "loss": 0.599, "learning_rate": 8.743097725337255e-06, "epoch": 0.7385354141656663, "percentage": 73.85, "elapsed_time": "0:28:55", "remaining_time": "0:10:14", "throughput": 72588.5, "total_tokens": 125992960} +{"current_steps": 15390, "total_steps": 20825, "loss": 0.8508, "learning_rate": 8.713021534826366e-06, "epoch": 0.739015606242497, "percentage": 73.9, "elapsed_time": "0:29:41", "remaining_time": "0:10:29", "throughput": 70779.03, "total_tokens": 126074880} +{"current_steps": 15400, "total_steps": 20825, "loss": 1.0262, "learning_rate": 8.68298624341862e-06, "epoch": 0.7394957983193278, "percentage": 73.95, "elapsed_time": "0:30:27", "remaining_time": "0:10:43", "throughput": 69019.08, "total_tokens": 126156800} +{"current_steps": 15410, "total_steps": 20825, "loss": 0.9126, "learning_rate": 8.652991926537254e-06, "epoch": 0.7399759903961585, "percentage": 74.0, "elapsed_time": "0:31:15", "remaining_time": "0:10:59", "throughput": 67301.55, "total_tokens": 126238720} +{"current_steps": 15420, "total_steps": 20825, "loss": 0.9147, "learning_rate": 8.623038659502583e-06, "epoch": 0.7404561824729892, "percentage": 74.05, "elapsed_time": "0:32:07", "remaining_time": "0:11:15", "throughput": 65544.68, "total_tokens": 126320640} +{"current_steps": 15430, "total_steps": 20825, "loss": 0.7083, "learning_rate": 8.59312651753187e-06, "epoch": 0.74093637454982, "percentage": 74.09, "elapsed_time": "0:32:56", "remaining_time": "0:11:31", "throughput": 63955.44, "total_tokens": 126402560} +{"current_steps": 15440, "total_steps": 20825, "loss": 0.9287, "learning_rate": 8.5632555757391e-06, "epoch": 0.7414165666266507, "percentage": 74.14, "elapsed_time": "0:33:42", "remaining_time": "0:11:45", "throughput": 62531.07, "total_tokens": 126484480} +{"current_steps": 15450, "total_steps": 20825, "loss": 0.845, "learning_rate": 8.53342590913478e-06, "epoch": 0.7418967587034814, "percentage": 74.19, "elapsed_time": "0:34:29", "remaining_time": "0:12:00", "throughput": 61150.82, "total_tokens": 126566400} +{"current_steps": 15460, "total_steps": 20825, "loss": 0.8641, "learning_rate": 8.503637592625796e-06, "epoch": 0.7423769507803121, "percentage": 74.24, "elapsed_time": "0:35:16", "remaining_time": "0:12:14", "throughput": 59844.95, "total_tokens": 126648320} +{"current_steps": 15470, "total_steps": 20825, "loss": 0.9529, "learning_rate": 8.473890701015177e-06, "epoch": 0.7428571428571429, "percentage": 74.29, "elapsed_time": "0:36:01", "remaining_time": "0:12:28", "throughput": 58634.13, "total_tokens": 126730240} +{"current_steps": 15480, "total_steps": 20825, "loss": 1.0765, "learning_rate": 8.444185309001926e-06, "epoch": 0.7433373349339736, "percentage": 74.33, "elapsed_time": "0:36:47", "remaining_time": "0:12:42", "throughput": 57458.33, "total_tokens": 126812160} +{"current_steps": 15490, "total_steps": 20825, "loss": 0.7988, "learning_rate": 8.41452149118085e-06, "epoch": 0.7438175270108043, "percentage": 74.38, "elapsed_time": "0:37:32", "remaining_time": "0:12:55", "throughput": 56328.4, "total_tokens": 126894080} +{"current_steps": 15500, "total_steps": 20825, "loss": 0.8623, "learning_rate": 8.384899322042356e-06, "epoch": 0.7442977190876351, "percentage": 74.43, "elapsed_time": "0:38:17", "remaining_time": "0:13:09", "throughput": 55260.49, "total_tokens": 126976000} +{"current_steps": 15510, "total_steps": 20825, "loss": 0.8205, "learning_rate": 8.355318875972243e-06, "epoch": 0.7447779111644658, "percentage": 74.48, "elapsed_time": "0:39:03", "remaining_time": "0:13:22", "throughput": 54227.28, "total_tokens": 127057920} +{"current_steps": 15520, "total_steps": 20825, "loss": 0.7383, "learning_rate": 8.325780227251562e-06, "epoch": 0.7452581032412965, "percentage": 74.53, "elapsed_time": "0:39:48", "remaining_time": "0:13:36", "throughput": 53232.72, "total_tokens": 127139840} +{"current_steps": 15530, "total_steps": 20825, "loss": 0.9802, "learning_rate": 8.2962834500564e-06, "epoch": 0.7457382953181273, "percentage": 74.57, "elapsed_time": "0:40:33", "remaining_time": "0:13:49", "throughput": 52278.31, "total_tokens": 127221760} +{"current_steps": 15540, "total_steps": 20825, "loss": 0.9196, "learning_rate": 8.266828618457678e-06, "epoch": 0.746218487394958, "percentage": 74.62, "elapsed_time": "0:41:18", "remaining_time": "0:14:02", "throughput": 51362.38, "total_tokens": 127303680} +{"current_steps": 15550, "total_steps": 20825, "loss": 1.1014, "learning_rate": 8.237415806421015e-06, "epoch": 0.7466986794717887, "percentage": 74.67, "elapsed_time": "0:42:03", "remaining_time": "0:14:16", "throughput": 50474.05, "total_tokens": 127385600} +{"current_steps": 15560, "total_steps": 20825, "loss": 0.7883, "learning_rate": 8.20804508780648e-06, "epoch": 0.7471788715486194, "percentage": 74.72, "elapsed_time": "0:42:49", "remaining_time": "0:14:29", "throughput": 49614.78, "total_tokens": 127467520} +{"current_steps": 15570, "total_steps": 20825, "loss": 1.0093, "learning_rate": 8.178716536368475e-06, "epoch": 0.7476590636254502, "percentage": 74.77, "elapsed_time": "0:43:34", "remaining_time": "0:14:42", "throughput": 48786.53, "total_tokens": 127549440} +{"current_steps": 15580, "total_steps": 20825, "loss": 0.978, "learning_rate": 8.149430225755476e-06, "epoch": 0.7481392557022809, "percentage": 74.81, "elapsed_time": "0:44:20", "remaining_time": "0:14:55", "throughput": 47981.08, "total_tokens": 127631360} +{"current_steps": 15590, "total_steps": 20825, "loss": 0.8938, "learning_rate": 8.120186229509922e-06, "epoch": 0.7486194477791116, "percentage": 74.86, "elapsed_time": "0:45:05", "remaining_time": "0:15:08", "throughput": 47209.72, "total_tokens": 127713280} +{"current_steps": 15600, "total_steps": 20825, "loss": 1.0422, "learning_rate": 8.090984621067963e-06, "epoch": 0.7490996398559424, "percentage": 74.91, "elapsed_time": "0:45:50", "remaining_time": "0:15:21", "throughput": 46457.61, "total_tokens": 127795200} +{"current_steps": 15610, "total_steps": 20825, "loss": 0.8388, "learning_rate": 8.061825473759324e-06, "epoch": 0.7495798319327731, "percentage": 74.96, "elapsed_time": "0:46:36", "remaining_time": "0:15:34", "throughput": 45733.63, "total_tokens": 127877120} +{"current_steps": 15620, "total_steps": 20825, "loss": 0.8558, "learning_rate": 8.032708860807111e-06, "epoch": 0.7500600240096038, "percentage": 75.01, "elapsed_time": "0:47:21", "remaining_time": "0:15:46", "throughput": 45033.76, "total_tokens": 127959040} +{"current_steps": 15630, "total_steps": 20825, "loss": 0.7606, "learning_rate": 8.003634855327594e-06, "epoch": 0.7505402160864346, "percentage": 75.05, "elapsed_time": "0:48:06", "remaining_time": "0:15:59", "throughput": 44357.44, "total_tokens": 128040960} +{"current_steps": 15640, "total_steps": 20825, "loss": 0.7422, "learning_rate": 7.974603530330069e-06, "epoch": 0.7510204081632653, "percentage": 75.1, "elapsed_time": "0:48:52", "remaining_time": "0:16:12", "throughput": 43690.67, "total_tokens": 128122880} +{"current_steps": 15650, "total_steps": 20825, "loss": 0.7774, "learning_rate": 7.945614958716658e-06, "epoch": 0.751500600240096, "percentage": 75.15, "elapsed_time": "0:49:40", "remaining_time": "0:16:25", "throughput": 43010.07, "total_tokens": 128204800} +{"current_steps": 15660, "total_steps": 20825, "loss": 0.831, "learning_rate": 7.916669213282107e-06, "epoch": 0.7519807923169267, "percentage": 75.2, "elapsed_time": "0:50:27", "remaining_time": "0:16:38", "throughput": 42373.51, "total_tokens": 128286720} +{"current_steps": 15670, "total_steps": 20825, "loss": 1.1006, "learning_rate": 7.88776636671362e-06, "epoch": 0.7524609843937575, "percentage": 75.25, "elapsed_time": "0:51:12", "remaining_time": "0:16:50", "throughput": 41774.44, "total_tokens": 128368640} +{"current_steps": 15680, "total_steps": 20825, "loss": 0.903, "learning_rate": 7.858906491590697e-06, "epoch": 0.7529411764705882, "percentage": 75.29, "elapsed_time": "0:51:58", "remaining_time": "0:17:03", "throughput": 41193.01, "total_tokens": 128450560} +{"current_steps": 15690, "total_steps": 20825, "loss": 0.8458, "learning_rate": 7.830089660384895e-06, "epoch": 0.7534213685474189, "percentage": 75.34, "elapsed_time": "0:52:44", "remaining_time": "0:17:15", "throughput": 40623.2, "total_tokens": 128532480} +{"current_steps": 15700, "total_steps": 20825, "loss": 1.3148, "learning_rate": 7.801315945459714e-06, "epoch": 0.7539015606242497, "percentage": 75.39, "elapsed_time": "0:53:31", "remaining_time": "0:17:28", "throughput": 40046.94, "total_tokens": 128614400} +{"current_steps": 15710, "total_steps": 20825, "loss": 0.9315, "learning_rate": 7.772585419070374e-06, "epoch": 0.7543817527010804, "percentage": 75.44, "elapsed_time": "0:54:17", "remaining_time": "0:17:40", "throughput": 39512.69, "total_tokens": 128696320} +{"current_steps": 15720, "total_steps": 20825, "loss": 0.7756, "learning_rate": 7.743898153363625e-06, "epoch": 0.7548619447779111, "percentage": 75.49, "elapsed_time": "0:55:02", "remaining_time": "0:17:52", "throughput": 38989.88, "total_tokens": 128778240} +{"current_steps": 15730, "total_steps": 20825, "loss": 0.8351, "learning_rate": 7.715254220377596e-06, "epoch": 0.7553421368547419, "percentage": 75.53, "elapsed_time": "0:55:51", "remaining_time": "0:18:05", "throughput": 38452.78, "total_tokens": 128860160} +{"current_steps": 15740, "total_steps": 20825, "loss": 0.7978, "learning_rate": 7.686653692041615e-06, "epoch": 0.7558223289315726, "percentage": 75.58, "elapsed_time": "0:56:36", "remaining_time": "0:18:17", "throughput": 37963.63, "total_tokens": 128942080} +{"current_steps": 15750, "total_steps": 20825, "loss": 0.8335, "learning_rate": 7.658096640175988e-06, "epoch": 0.7563025210084033, "percentage": 75.63, "elapsed_time": "0:57:21", "remaining_time": "0:18:29", "throughput": 37487.9, "total_tokens": 129024000} +{"current_steps": 15760, "total_steps": 20825, "loss": 0.7803, "learning_rate": 7.629583136491844e-06, "epoch": 0.7567827130852341, "percentage": 75.68, "elapsed_time": "0:58:08", "remaining_time": "0:18:41", "throughput": 37006.23, "total_tokens": 129105920} +{"current_steps": 15770, "total_steps": 20825, "loss": 0.8551, "learning_rate": 7.601113252590991e-06, "epoch": 0.7572629051620648, "percentage": 75.73, "elapsed_time": "0:58:55", "remaining_time": "0:18:53", "throughput": 36545.07, "total_tokens": 129187840} +{"current_steps": 15780, "total_steps": 20825, "loss": 1.0544, "learning_rate": 7.572687059965661e-06, "epoch": 0.7577430972388955, "percentage": 75.77, "elapsed_time": "0:59:40", "remaining_time": "0:19:04", "throughput": 36105.6, "total_tokens": 129269760} +{"current_steps": 15790, "total_steps": 20825, "loss": 0.9997, "learning_rate": 7.544304629998389e-06, "epoch": 0.7582232893157262, "percentage": 75.82, "elapsed_time": "1:00:26", "remaining_time": "0:19:16", "throughput": 35671.61, "total_tokens": 129351680} +{"current_steps": 15800, "total_steps": 20825, "loss": 0.8806, "learning_rate": 7.51596603396183e-06, "epoch": 0.758703481392557, "percentage": 75.87, "elapsed_time": "1:01:13", "remaining_time": "0:19:28", "throughput": 35235.39, "total_tokens": 129433600} +{"current_steps": 15810, "total_steps": 20825, "loss": 0.9649, "learning_rate": 7.4876713430185265e-06, "epoch": 0.7591836734693878, "percentage": 75.92, "elapsed_time": "1:01:58", "remaining_time": "0:19:39", "throughput": 34827.46, "total_tokens": 129515520} +{"current_steps": 15820, "total_steps": 20825, "loss": 0.926, "learning_rate": 7.4594206282208e-06, "epoch": 0.7596638655462185, "percentage": 75.97, "elapsed_time": "1:02:44", "remaining_time": "0:19:50", "throughput": 34428.5, "total_tokens": 129597440} +{"current_steps": 15830, "total_steps": 20825, "loss": 0.8361, "learning_rate": 7.431213960510544e-06, "epoch": 0.7601440576230493, "percentage": 76.01, "elapsed_time": "1:03:29", "remaining_time": "0:20:02", "throughput": 34038.05, "total_tokens": 129679360} +{"current_steps": 15840, "total_steps": 20825, "loss": 1.068, "learning_rate": 7.40305141071902e-06, "epoch": 0.76062424969988, "percentage": 76.06, "elapsed_time": "1:04:15", "remaining_time": "0:20:13", "throughput": 33658.8, "total_tokens": 129761280} +{"current_steps": 15850, "total_steps": 20825, "loss": 0.724, "learning_rate": 7.374933049566704e-06, "epoch": 0.7611044417767107, "percentage": 76.11, "elapsed_time": "1:05:00", "remaining_time": "0:20:24", "throughput": 33287.73, "total_tokens": 129843200} +{"current_steps": 15860, "total_steps": 20825, "loss": 0.8833, "learning_rate": 7.346858947663138e-06, "epoch": 0.7615846338535415, "percentage": 76.16, "elapsed_time": "1:05:52", "remaining_time": "0:20:37", "throughput": 32872.77, "total_tokens": 129925120} +{"current_steps": 15870, "total_steps": 20825, "loss": 1.0074, "learning_rate": 7.318829175506684e-06, "epoch": 0.7620648259303722, "percentage": 76.21, "elapsed_time": "1:06:41", "remaining_time": "0:20:49", "throughput": 32488.82, "total_tokens": 130007040} +{"current_steps": 15880, "total_steps": 20825, "loss": 0.9735, "learning_rate": 7.290843803484409e-06, "epoch": 0.7625450180072029, "percentage": 76.25, "elapsed_time": "1:07:29", "remaining_time": "0:21:01", "throughput": 32124.5, "total_tokens": 130088960} +{"current_steps": 15890, "total_steps": 20825, "loss": 0.9231, "learning_rate": 7.262902901871885e-06, "epoch": 0.7630252100840336, "percentage": 76.3, "elapsed_time": "1:08:15", "remaining_time": "0:21:11", "throughput": 31784.88, "total_tokens": 130170880} +{"current_steps": 15900, "total_steps": 20825, "loss": 0.9472, "learning_rate": 7.235006540832995e-06, "epoch": 0.7635054021608644, "percentage": 76.35, "elapsed_time": "1:09:01", "remaining_time": "0:21:22", "throughput": 31452.74, "total_tokens": 130252800} +{"current_steps": 15910, "total_steps": 20825, "loss": 0.8525, "learning_rate": 7.207154790419784e-06, "epoch": 0.7639855942376951, "percentage": 76.4, "elapsed_time": "1:09:46", "remaining_time": "0:21:33", "throughput": 31128.53, "total_tokens": 130334720} +{"current_steps": 15920, "total_steps": 20825, "loss": 1.0461, "learning_rate": 7.179347720572288e-06, "epoch": 0.7644657863145258, "percentage": 76.45, "elapsed_time": "1:10:33", "remaining_time": "0:21:44", "throughput": 30804.67, "total_tokens": 130416640} +{"current_steps": 15930, "total_steps": 20825, "loss": 0.77, "learning_rate": 7.151585401118316e-06, "epoch": 0.7649459783913566, "percentage": 76.49, "elapsed_time": "1:11:19", "remaining_time": "0:21:55", "throughput": 30492.74, "total_tokens": 130498560} +{"current_steps": 15940, "total_steps": 20825, "loss": 0.8252, "learning_rate": 7.12386790177331e-06, "epoch": 0.7654261704681873, "percentage": 76.54, "elapsed_time": "1:12:05", "remaining_time": "0:22:05", "throughput": 30190.35, "total_tokens": 130580480} +{"current_steps": 15950, "total_steps": 20825, "loss": 0.8723, "learning_rate": 7.096195292140173e-06, "epoch": 0.765906362545018, "percentage": 76.59, "elapsed_time": "1:12:51", "remaining_time": "0:22:16", "throughput": 29891.21, "total_tokens": 130662400} +{"current_steps": 15960, "total_steps": 20825, "loss": 0.7436, "learning_rate": 7.06856764170907e-06, "epoch": 0.7663865546218488, "percentage": 76.64, "elapsed_time": "1:13:36", "remaining_time": "0:22:26", "throughput": 29601.52, "total_tokens": 130744320} +{"current_steps": 15970, "total_steps": 20825, "loss": 0.959, "learning_rate": 7.040985019857274e-06, "epoch": 0.7668667466986795, "percentage": 76.69, "elapsed_time": "1:14:22", "remaining_time": "0:22:36", "throughput": 29316.54, "total_tokens": 130826240} +{"current_steps": 15980, "total_steps": 20825, "loss": 1.1143, "learning_rate": 7.013447495848996e-06, "epoch": 0.7673469387755102, "percentage": 76.73, "elapsed_time": "1:15:08", "remaining_time": "0:22:46", "throughput": 29036.93, "total_tokens": 130908160} +{"current_steps": 15990, "total_steps": 20825, "loss": 0.9102, "learning_rate": 6.985955138835162e-06, "epoch": 0.7678271308523409, "percentage": 76.78, "elapsed_time": "1:15:53", "remaining_time": "0:22:57", "throughput": 28763.85, "total_tokens": 130990080} +{"current_steps": 16000, "total_steps": 20825, "loss": 0.9424, "learning_rate": 6.958508017853319e-06, "epoch": 0.7683073229291717, "percentage": 76.83, "elapsed_time": "1:16:39", "remaining_time": "0:23:07", "throughput": 28496.33, "total_tokens": 131072000} +{"current_steps": 16010, "total_steps": 20825, "loss": 0.905, "learning_rate": 6.931106201827397e-06, "epoch": 0.7687875150060024, "percentage": 76.88, "elapsed_time": "1:17:28", "remaining_time": "0:23:17", "throughput": 28216.48, "total_tokens": 131153920} +{"current_steps": 16020, "total_steps": 20825, "loss": 0.8972, "learning_rate": 6.903749759567557e-06, "epoch": 0.7692677070828331, "percentage": 76.93, "elapsed_time": "1:18:13", "remaining_time": "0:23:27", "throughput": 27959.23, "total_tokens": 131235840} +{"current_steps": 16030, "total_steps": 20825, "loss": 0.8669, "learning_rate": 6.876438759770037e-06, "epoch": 0.7697478991596639, "percentage": 76.97, "elapsed_time": "1:18:59", "remaining_time": "0:23:37", "throughput": 27706.63, "total_tokens": 131317760} +{"current_steps": 16040, "total_steps": 20825, "loss": 1.0239, "learning_rate": 6.8491732710169344e-06, "epoch": 0.7702280912364946, "percentage": 77.02, "elapsed_time": "1:19:47", "remaining_time": "0:23:48", "throughput": 27448.36, "total_tokens": 131399680} +{"current_steps": 16050, "total_steps": 20825, "loss": 0.7977, "learning_rate": 6.821953361776093e-06, "epoch": 0.7707082833133253, "percentage": 77.07, "elapsed_time": "1:20:33", "remaining_time": "0:23:58", "throughput": 27202.1, "total_tokens": 131481600} +{"current_steps": 16060, "total_steps": 20825, "loss": 0.8704, "learning_rate": 6.7947791004008665e-06, "epoch": 0.7711884753901561, "percentage": 77.12, "elapsed_time": "1:21:20", "remaining_time": "0:24:07", "throughput": 26958.47, "total_tokens": 131563520} +{"current_steps": 16070, "total_steps": 20825, "loss": 0.8018, "learning_rate": 6.767650555130009e-06, "epoch": 0.7716686674669868, "percentage": 77.17, "elapsed_time": "1:22:05", "remaining_time": "0:24:17", "throughput": 26724.72, "total_tokens": 131645440} +{"current_steps": 16080, "total_steps": 20825, "loss": 0.9043, "learning_rate": 6.740567794087463e-06, "epoch": 0.7721488595438175, "percentage": 77.21, "elapsed_time": "1:22:51", "remaining_time": "0:24:27", "throughput": 26496.1, "total_tokens": 131727360} +{"current_steps": 16090, "total_steps": 20825, "loss": 1.1105, "learning_rate": 6.713530885282188e-06, "epoch": 0.7726290516206482, "percentage": 77.26, "elapsed_time": "1:23:37", "remaining_time": "0:24:36", "throughput": 26271.37, "total_tokens": 131809280} +{"current_steps": 16100, "total_steps": 20825, "loss": 0.781, "learning_rate": 6.686539896608016e-06, "epoch": 0.773109243697479, "percentage": 77.31, "elapsed_time": "1:24:23", "remaining_time": "0:24:45", "throughput": 26049.99, "total_tokens": 131891200} +{"current_steps": 16110, "total_steps": 20825, "loss": 0.7886, "learning_rate": 6.659594895843477e-06, "epoch": 0.7735894357743097, "percentage": 77.36, "elapsed_time": "1:25:08", "remaining_time": "0:24:55", "throughput": 25833.0, "total_tokens": 131973120} +{"current_steps": 16120, "total_steps": 20825, "loss": 0.8849, "learning_rate": 6.632695950651594e-06, "epoch": 0.7740696278511404, "percentage": 77.41, "elapsed_time": "1:25:54", "remaining_time": "0:25:04", "throughput": 25620.6, "total_tokens": 132055040} +{"current_steps": 16130, "total_steps": 20825, "loss": 0.9594, "learning_rate": 6.605843128579739e-06, "epoch": 0.7745498199279712, "percentage": 77.45, "elapsed_time": "1:26:40", "remaining_time": "0:25:13", "throughput": 25410.03, "total_tokens": 132136960} +{"current_steps": 16140, "total_steps": 20825, "loss": 0.8384, "learning_rate": 6.579036497059482e-06, "epoch": 0.7750300120048019, "percentage": 77.5, "elapsed_time": "1:27:25", "remaining_time": "0:25:22", "throughput": 25204.64, "total_tokens": 132218880} +{"current_steps": 16150, "total_steps": 20825, "loss": 0.8364, "learning_rate": 6.552276123406384e-06, "epoch": 0.7755102040816326, "percentage": 77.55, "elapsed_time": "1:28:11", "remaining_time": "0:25:31", "throughput": 25002.21, "total_tokens": 132300800} +{"current_steps": 16160, "total_steps": 20825, "loss": 1.0425, "learning_rate": 6.525562074819852e-06, "epoch": 0.7759903961584634, "percentage": 77.6, "elapsed_time": "1:28:57", "remaining_time": "0:25:40", "throughput": 24801.01, "total_tokens": 132382720} +{"current_steps": 16170, "total_steps": 20825, "loss": 0.9449, "learning_rate": 6.4988944183829695e-06, "epoch": 0.7764705882352941, "percentage": 77.65, "elapsed_time": "1:29:45", "remaining_time": "0:25:50", "throughput": 24594.85, "total_tokens": 132464640} +{"current_steps": 16180, "total_steps": 20825, "loss": 1.1211, "learning_rate": 6.472273221062305e-06, "epoch": 0.7769507803121248, "percentage": 77.7, "elapsed_time": "1:30:34", "remaining_time": "0:26:00", "throughput": 24390.1, "total_tokens": 132546560} +{"current_steps": 16190, "total_steps": 20825, "loss": 1.0615, "learning_rate": 6.445698549707776e-06, "epoch": 0.7774309723889555, "percentage": 77.74, "elapsed_time": "1:31:25", "remaining_time": "0:26:10", "throughput": 24176.05, "total_tokens": 132628480} +{"current_steps": 16200, "total_steps": 20825, "loss": 0.7958, "learning_rate": 6.419170471052472e-06, "epoch": 0.7779111644657863, "percentage": 77.79, "elapsed_time": "1:32:16", "remaining_time": "0:26:20", "throughput": 23969.15, "total_tokens": 132710400} +{"current_steps": 16210, "total_steps": 20825, "loss": 0.9789, "learning_rate": 6.392689051712458e-06, "epoch": 0.778391356542617, "percentage": 77.84, "elapsed_time": "1:33:03", "remaining_time": "0:26:29", "throughput": 23783.44, "total_tokens": 132792320} +{"current_steps": 16220, "total_steps": 20825, "loss": 1.0557, "learning_rate": 6.3662543581866405e-06, "epoch": 0.7788715486194477, "percentage": 77.89, "elapsed_time": "1:33:51", "remaining_time": "0:26:38", "throughput": 23596.01, "total_tokens": 132874240} +{"current_steps": 16230, "total_steps": 20825, "loss": 0.7892, "learning_rate": 6.339866456856608e-06, "epoch": 0.7793517406962785, "percentage": 77.94, "elapsed_time": "1:34:39", "remaining_time": "0:26:47", "throughput": 23409.46, "total_tokens": 132956160} +{"current_steps": 16240, "total_steps": 20825, "loss": 0.9853, "learning_rate": 6.313525413986415e-06, "epoch": 0.7798319327731092, "percentage": 77.98, "elapsed_time": "1:35:27", "remaining_time": "0:26:57", "throughput": 23227.29, "total_tokens": 133038080} +{"current_steps": 16250, "total_steps": 20825, "loss": 0.8806, "learning_rate": 6.28723129572247e-06, "epoch": 0.78031212484994, "percentage": 78.03, "elapsed_time": "1:36:15", "remaining_time": "0:27:05", "throughput": 23050.21, "total_tokens": 133120000} +{"current_steps": 16260, "total_steps": 20825, "loss": 0.8576, "learning_rate": 6.260984168093353e-06, "epoch": 0.7807923169267708, "percentage": 78.08, "elapsed_time": "1:37:01", "remaining_time": "0:27:14", "throughput": 22881.61, "total_tokens": 133201920} +{"current_steps": 16270, "total_steps": 20825, "loss": 0.9178, "learning_rate": 6.234784097009608e-06, "epoch": 0.7812725090036015, "percentage": 78.13, "elapsed_time": "1:37:49", "remaining_time": "0:27:23", "throughput": 22708.63, "total_tokens": 133283840} +{"current_steps": 16280, "total_steps": 20825, "loss": 0.8479, "learning_rate": 6.208631148263649e-06, "epoch": 0.7817527010804322, "percentage": 78.18, "elapsed_time": "1:38:36", "remaining_time": "0:27:31", "throughput": 22539.65, "total_tokens": 133365760} +{"current_steps": 16290, "total_steps": 20825, "loss": 0.6448, "learning_rate": 6.18252538752955e-06, "epoch": 0.7822328931572629, "percentage": 78.22, "elapsed_time": "1:39:24", "remaining_time": "0:27:40", "throughput": 22373.4, "total_tokens": 133447680} +{"current_steps": 16300, "total_steps": 20825, "loss": 0.7555, "learning_rate": 6.156466880362877e-06, "epoch": 0.7827130852340937, "percentage": 78.27, "elapsed_time": "1:40:10", "remaining_time": "0:27:48", "throughput": 22215.07, "total_tokens": 133529600} +{"current_steps": 16310, "total_steps": 20825, "loss": 0.8473, "learning_rate": 6.1304556922005315e-06, "epoch": 0.7831932773109244, "percentage": 78.32, "elapsed_time": "1:40:57", "remaining_time": "0:27:56", "throughput": 22055.79, "total_tokens": 133611520} +{"current_steps": 16320, "total_steps": 20825, "loss": 0.8754, "learning_rate": 6.1044918883606225e-06, "epoch": 0.7836734693877551, "percentage": 78.37, "elapsed_time": "1:41:43", "remaining_time": "0:28:04", "throughput": 21903.86, "total_tokens": 133693440} +{"current_steps": 16330, "total_steps": 20825, "loss": 0.9731, "learning_rate": 6.078575534042222e-06, "epoch": 0.7841536614645859, "percentage": 78.42, "elapsed_time": "1:42:30", "remaining_time": "0:28:13", "throughput": 21749.98, "total_tokens": 133775360} +{"current_steps": 16340, "total_steps": 20825, "loss": 0.952, "learning_rate": 6.052706694325292e-06, "epoch": 0.7846338535414166, "percentage": 78.46, "elapsed_time": "1:43:19", "remaining_time": "0:28:21", "throughput": 21592.08, "total_tokens": 133857280} +{"current_steps": 16350, "total_steps": 20825, "loss": 0.9592, "learning_rate": 6.026885434170457e-06, "epoch": 0.7851140456182473, "percentage": 78.51, "elapsed_time": "1:44:05", "remaining_time": "0:28:29", "throughput": 21444.5, "total_tokens": 133939200} +{"current_steps": 16360, "total_steps": 20825, "loss": 0.9753, "learning_rate": 6.001111818418859e-06, "epoch": 0.7855942376950781, "percentage": 78.56, "elapsed_time": "1:44:52", "remaining_time": "0:28:37", "throughput": 21297.62, "total_tokens": 134021120} +{"current_steps": 16370, "total_steps": 20825, "loss": 0.9931, "learning_rate": 5.975385911792006e-06, "epoch": 0.7860744297719088, "percentage": 78.61, "elapsed_time": "1:45:40", "remaining_time": "0:28:45", "throughput": 21149.27, "total_tokens": 134103040} +{"current_steps": 16380, "total_steps": 20825, "loss": 1.0476, "learning_rate": 5.9497077788916055e-06, "epoch": 0.7865546218487395, "percentage": 78.66, "elapsed_time": "1:46:28", "remaining_time": "0:28:53", "throughput": 21005.18, "total_tokens": 134184960} +{"current_steps": 16390, "total_steps": 20825, "loss": 0.8325, "learning_rate": 5.924077484199389e-06, "epoch": 0.7870348139255702, "percentage": 78.7, "elapsed_time": "1:47:14", "remaining_time": "0:29:01", "throughput": 20865.49, "total_tokens": 134266880} +{"current_steps": 16400, "total_steps": 20825, "loss": 0.7674, "learning_rate": 5.89849509207695e-06, "epoch": 0.787515006002401, "percentage": 78.75, "elapsed_time": "1:48:01", "remaining_time": "0:29:08", "throughput": 20728.58, "total_tokens": 134348800} +{"current_steps": 16410, "total_steps": 20825, "loss": 0.909, "learning_rate": 5.872960666765618e-06, "epoch": 0.7879951980792317, "percentage": 78.8, "elapsed_time": "1:48:48", "remaining_time": "0:29:16", "throughput": 20591.81, "total_tokens": 134430720} +{"current_steps": 16420, "total_steps": 20825, "loss": 1.5853, "learning_rate": 5.847474272386239e-06, "epoch": 0.7884753901560624, "percentage": 78.85, "elapsed_time": "1:49:41", "remaining_time": "0:29:25", "throughput": 20437.61, "total_tokens": 134512640} +{"current_steps": 16430, "total_steps": 20825, "loss": 0.8213, "learning_rate": 5.822035972939069e-06, "epoch": 0.7889555822328932, "percentage": 78.9, "elapsed_time": "1:50:30", "remaining_time": "0:29:33", "throughput": 20299.81, "total_tokens": 134594560} +{"current_steps": 16440, "total_steps": 20825, "loss": 0.8711, "learning_rate": 5.79664583230359e-06, "epoch": 0.7894357743097239, "percentage": 78.94, "elapsed_time": "1:51:18", "remaining_time": "0:29:41", "throughput": 20166.66, "total_tokens": 134676480} +{"current_steps": 16450, "total_steps": 20825, "loss": 0.7858, "learning_rate": 5.771303914238333e-06, "epoch": 0.7899159663865546, "percentage": 78.99, "elapsed_time": "1:52:05", "remaining_time": "0:29:48", "throughput": 20038.38, "total_tokens": 134758400} +{"current_steps": 16460, "total_steps": 20825, "loss": 0.8857, "learning_rate": 5.746010282380745e-06, "epoch": 0.7903961584633854, "percentage": 79.04, "elapsed_time": "1:52:51", "remaining_time": "0:29:55", "throughput": 19911.76, "total_tokens": 134840320} +{"current_steps": 16470, "total_steps": 20825, "loss": 0.7948, "learning_rate": 5.7207650002470274e-06, "epoch": 0.7908763505402161, "percentage": 79.09, "elapsed_time": "1:53:41", "remaining_time": "0:30:03", "throughput": 19780.26, "total_tokens": 134922240} +{"current_steps": 16480, "total_steps": 20825, "loss": 0.8112, "learning_rate": 5.695568131231949e-06, "epoch": 0.7913565426170468, "percentage": 79.14, "elapsed_time": "1:54:27", "remaining_time": "0:30:10", "throughput": 19657.78, "total_tokens": 135004160} +{"current_steps": 16490, "total_steps": 20825, "loss": 0.7962, "learning_rate": 5.670419738608723e-06, "epoch": 0.7918367346938775, "percentage": 79.18, "elapsed_time": "1:55:16", "remaining_time": "0:30:18", "throughput": 19531.33, "total_tokens": 135086080} +{"current_steps": 16500, "total_steps": 20825, "loss": 0.8665, "learning_rate": 5.645319885528824e-06, "epoch": 0.7923169267707083, "percentage": 79.23, "elapsed_time": "1:56:05", "remaining_time": "0:30:25", "throughput": 19404.85, "total_tokens": 135168000} +{"current_steps": 16510, "total_steps": 20825, "loss": 0.8142, "learning_rate": 5.620268635021825e-06, "epoch": 0.792797118847539, "percentage": 79.28, "elapsed_time": "1:56:53", "remaining_time": "0:30:33", "throughput": 19284.47, "total_tokens": 135249920} +{"current_steps": 16520, "total_steps": 20825, "loss": 0.9578, "learning_rate": 5.595266049995268e-06, "epoch": 0.7932773109243697, "percentage": 79.33, "elapsed_time": "1:57:42", "remaining_time": "0:30:40", "throughput": 19161.04, "total_tokens": 135331840} +{"current_steps": 16530, "total_steps": 20825, "loss": 0.9576, "learning_rate": 5.5703121932344896e-06, "epoch": 0.7937575030012005, "percentage": 79.38, "elapsed_time": "1:58:29", "remaining_time": "0:30:47", "throughput": 19046.79, "total_tokens": 135413760} +{"current_steps": 16540, "total_steps": 20825, "loss": 0.8884, "learning_rate": 5.5454071274024436e-06, "epoch": 0.7942376950780312, "percentage": 79.42, "elapsed_time": "1:59:15", "remaining_time": "0:30:53", "throughput": 18934.58, "total_tokens": 135495680} +{"current_steps": 16550, "total_steps": 20825, "loss": 0.961, "learning_rate": 5.520550915039579e-06, "epoch": 0.7947178871548619, "percentage": 79.47, "elapsed_time": "2:00:01", "remaining_time": "0:31:00", "throughput": 18826.87, "total_tokens": 135577600} +{"current_steps": 16560, "total_steps": 20825, "loss": 0.838, "learning_rate": 5.495743618563668e-06, "epoch": 0.7951980792316927, "percentage": 79.52, "elapsed_time": "2:00:46", "remaining_time": "0:31:06", "throughput": 18720.45, "total_tokens": 135659520} +{"current_steps": 16570, "total_steps": 20825, "loss": 0.8735, "learning_rate": 5.4709853002696236e-06, "epoch": 0.7956782713085234, "percentage": 79.57, "elapsed_time": "2:01:32", "remaining_time": "0:31:12", "throughput": 18613.77, "total_tokens": 135741440} +{"current_steps": 16580, "total_steps": 20825, "loss": 0.8468, "learning_rate": 5.4462760223294e-06, "epoch": 0.7961584633853541, "percentage": 79.62, "elapsed_time": "2:02:19", "remaining_time": "0:31:19", "throughput": 18506.99, "total_tokens": 135823360} +{"current_steps": 16590, "total_steps": 20825, "loss": 0.8294, "learning_rate": 5.42161584679178e-06, "epoch": 0.7966386554621848, "percentage": 79.66, "elapsed_time": "2:03:05", "remaining_time": "0:31:25", "throughput": 18401.4, "total_tokens": 135905280} +{"current_steps": 16600, "total_steps": 20825, "loss": 0.8217, "learning_rate": 5.397004835582242e-06, "epoch": 0.7971188475390156, "percentage": 79.71, "elapsed_time": "2:03:50", "remaining_time": "0:31:31", "throughput": 18300.24, "total_tokens": 135987200} +{"current_steps": 16610, "total_steps": 20825, "loss": 0.8524, "learning_rate": 5.372443050502823e-06, "epoch": 0.7975990396158463, "percentage": 79.76, "elapsed_time": "2:04:36", "remaining_time": "0:31:37", "throughput": 18199.53, "total_tokens": 136069120} +{"current_steps": 16620, "total_steps": 20825, "loss": 0.8883, "learning_rate": 5.347930553231942e-06, "epoch": 0.798079231692677, "percentage": 79.81, "elapsed_time": "2:05:22", "remaining_time": "0:31:43", "throughput": 18098.54, "total_tokens": 136151040} +{"current_steps": 16630, "total_steps": 20825, "loss": 1.0163, "learning_rate": 5.323467405324226e-06, "epoch": 0.7985594237695078, "percentage": 79.86, "elapsed_time": "2:06:08", "remaining_time": "0:31:49", "throughput": 17999.36, "total_tokens": 136232960} +{"current_steps": 16640, "total_steps": 20825, "loss": 1.069, "learning_rate": 5.299053668210402e-06, "epoch": 0.7990396158463385, "percentage": 79.9, "elapsed_time": "2:06:55", "remaining_time": "0:31:55", "throughput": 17900.44, "total_tokens": 136314880} +{"current_steps": 16650, "total_steps": 20825, "loss": 0.7804, "learning_rate": 5.274689403197119e-06, "epoch": 0.7995198079231692, "percentage": 79.95, "elapsed_time": "2:07:41", "remaining_time": "0:32:01", "throughput": 17803.19, "total_tokens": 136396800} +{"current_steps": 16660, "total_steps": 20825, "loss": 0.8694, "learning_rate": 5.250374671466776e-06, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "2:08:27", "remaining_time": "0:32:06", "throughput": 17706.71, "total_tokens": 136478720} +{"current_steps": 16670, "total_steps": 20825, "loss": 1.145, "learning_rate": 5.2261095340774085e-06, "epoch": 0.8004801920768307, "percentage": 80.05, "elapsed_time": "2:09:13", "remaining_time": "0:32:12", "throughput": 17612.67, "total_tokens": 136560640} +{"current_steps": 16680, "total_steps": 20825, "loss": 0.9997, "learning_rate": 5.201894051962486e-06, "epoch": 0.8009603841536614, "percentage": 80.1, "elapsed_time": "2:09:58", "remaining_time": "0:32:18", "throughput": 17520.77, "total_tokens": 136642560} +{"current_steps": 16690, "total_steps": 20825, "loss": 0.8972, "learning_rate": 5.177728285930816e-06, "epoch": 0.8014405762304923, "percentage": 80.14, "elapsed_time": "2:10:43", "remaining_time": "0:32:23", "throughput": 17430.56, "total_tokens": 136724480} +{"current_steps": 16700, "total_steps": 20825, "loss": 0.7987, "learning_rate": 5.153612296666335e-06, "epoch": 0.801920768307323, "percentage": 80.19, "elapsed_time": "2:11:29", "remaining_time": "0:32:28", "throughput": 17341.15, "total_tokens": 136806400} +{"current_steps": 16710, "total_steps": 20825, "loss": 0.9656, "learning_rate": 5.129546144727998e-06, "epoch": 0.8024009603841536, "percentage": 80.24, "elapsed_time": "2:12:14", "remaining_time": "0:32:33", "throughput": 17252.66, "total_tokens": 136888320} +{"current_steps": 16720, "total_steps": 20825, "loss": 0.873, "learning_rate": 5.105529890549618e-06, "epoch": 0.8028811524609843, "percentage": 80.29, "elapsed_time": "2:12:59", "remaining_time": "0:32:39", "throughput": 17165.0, "total_tokens": 136970240} +{"current_steps": 16730, "total_steps": 20825, "loss": 0.7871, "learning_rate": 5.081563594439676e-06, "epoch": 0.8033613445378152, "percentage": 80.34, "elapsed_time": "2:13:44", "remaining_time": "0:32:44", "throughput": 17078.69, "total_tokens": 137052160} +{"current_steps": 16740, "total_steps": 20825, "loss": 1.0537, "learning_rate": 5.057647316581232e-06, "epoch": 0.8038415366146459, "percentage": 80.38, "elapsed_time": "2:14:29", "remaining_time": "0:32:49", "throughput": 16993.45, "total_tokens": 137134080} +{"current_steps": 16750, "total_steps": 20825, "loss": 0.9321, "learning_rate": 5.033781117031738e-06, "epoch": 0.8043217286914766, "percentage": 80.43, "elapsed_time": "2:15:15", "remaining_time": "0:32:54", "throughput": 16908.89, "total_tokens": 137216000} +{"current_steps": 16760, "total_steps": 20825, "loss": 1.0611, "learning_rate": 5.0099650557228785e-06, "epoch": 0.8048019207683074, "percentage": 80.48, "elapsed_time": "2:16:00", "remaining_time": "0:32:59", "throughput": 16825.03, "total_tokens": 137297920} +{"current_steps": 16770, "total_steps": 20825, "loss": 0.8815, "learning_rate": 4.986199192460428e-06, "epoch": 0.8052821128451381, "percentage": 80.53, "elapsed_time": "2:16:45", "remaining_time": "0:33:04", "throughput": 16742.44, "total_tokens": 137379840} +{"current_steps": 16780, "total_steps": 20825, "loss": 0.7744, "learning_rate": 4.962483586924136e-06, "epoch": 0.8057623049219688, "percentage": 80.58, "elapsed_time": "2:17:30", "remaining_time": "0:33:08", "throughput": 16660.42, "total_tokens": 137461760} +{"current_steps": 16790, "total_steps": 20825, "loss": 0.8282, "learning_rate": 4.93881829866751e-06, "epoch": 0.8062424969987996, "percentage": 80.62, "elapsed_time": "2:18:16", "remaining_time": "0:33:13", "throughput": 16578.54, "total_tokens": 137543680} +{"current_steps": 16800, "total_steps": 20825, "loss": 0.9975, "learning_rate": 4.915203387117736e-06, "epoch": 0.8067226890756303, "percentage": 80.67, "elapsed_time": "2:19:01", "remaining_time": "0:33:18", "throughput": 16498.87, "total_tokens": 137625600} +{"current_steps": 16810, "total_steps": 20825, "loss": 0.882, "learning_rate": 4.891638911575483e-06, "epoch": 0.807202881152461, "percentage": 80.72, "elapsed_time": "2:19:46", "remaining_time": "0:33:23", "throughput": 16420.08, "total_tokens": 137707520} +{"current_steps": 16820, "total_steps": 20825, "loss": 0.9084, "learning_rate": 4.868124931214752e-06, "epoch": 0.8076830732292917, "percentage": 80.77, "elapsed_time": "2:20:31", "remaining_time": "0:33:27", "throughput": 16341.95, "total_tokens": 137789440} +{"current_steps": 16830, "total_steps": 20825, "loss": 0.8356, "learning_rate": 4.844661505082768e-06, "epoch": 0.8081632653061225, "percentage": 80.82, "elapsed_time": "2:21:16", "remaining_time": "0:33:32", "throughput": 16264.58, "total_tokens": 137871360} +{"current_steps": 16840, "total_steps": 20825, "loss": 0.7691, "learning_rate": 4.8212486920998005e-06, "epoch": 0.8086434573829532, "percentage": 80.86, "elapsed_time": "2:22:02", "remaining_time": "0:33:36", "throughput": 16187.63, "total_tokens": 137953280} +{"current_steps": 16850, "total_steps": 20825, "loss": 0.915, "learning_rate": 4.797886551059011e-06, "epoch": 0.8091236494597839, "percentage": 80.91, "elapsed_time": "2:22:47", "remaining_time": "0:33:41", "throughput": 16111.75, "total_tokens": 138035200} +{"current_steps": 16860, "total_steps": 20825, "loss": 0.9692, "learning_rate": 4.7745751406263165e-06, "epoch": 0.8096038415366147, "percentage": 80.96, "elapsed_time": "2:23:32", "remaining_time": "0:33:45", "throughput": 16036.79, "total_tokens": 138117120} +{"current_steps": 16870, "total_steps": 20825, "loss": 0.8575, "learning_rate": 4.751314519340258e-06, "epoch": 0.8100840336134454, "percentage": 81.01, "elapsed_time": "2:24:17", "remaining_time": "0:33:49", "throughput": 15962.77, "total_tokens": 138199040} +{"current_steps": 16880, "total_steps": 20825, "loss": 0.8863, "learning_rate": 4.728104745611814e-06, "epoch": 0.8105642256902761, "percentage": 81.06, "elapsed_time": "2:25:03", "remaining_time": "0:33:53", "throughput": 15888.76, "total_tokens": 138280960} +{"current_steps": 16890, "total_steps": 20825, "loss": 1.099, "learning_rate": 4.704945877724295e-06, "epoch": 0.8110444177671069, "percentage": 81.1, "elapsed_time": "2:25:48", "remaining_time": "0:33:58", "throughput": 15815.41, "total_tokens": 138362880} +{"current_steps": 16900, "total_steps": 20825, "loss": 0.9003, "learning_rate": 4.681837973833181e-06, "epoch": 0.8115246098439376, "percentage": 81.15, "elapsed_time": "2:26:34", "remaining_time": "0:34:02", "throughput": 15742.64, "total_tokens": 138444800} +{"current_steps": 16910, "total_steps": 20825, "loss": 0.8087, "learning_rate": 4.658781091965955e-06, "epoch": 0.8120048019207683, "percentage": 81.2, "elapsed_time": "2:27:19", "remaining_time": "0:34:06", "throughput": 15671.31, "total_tokens": 138526720} +{"current_steps": 16920, "total_steps": 20825, "loss": 0.8977, "learning_rate": 4.635775290021988e-06, "epoch": 0.812484993997599, "percentage": 81.25, "elapsed_time": "2:28:04", "remaining_time": "0:34:10", "throughput": 15600.55, "total_tokens": 138608640} +{"current_steps": 16930, "total_steps": 20825, "loss": 0.6357, "learning_rate": 4.612820625772391e-06, "epoch": 0.8129651860744298, "percentage": 81.3, "elapsed_time": "2:28:50", "remaining_time": "0:34:14", "throughput": 15530.73, "total_tokens": 138690560} +{"current_steps": 16940, "total_steps": 20825, "loss": 0.8636, "learning_rate": 4.589917156859838e-06, "epoch": 0.8134453781512605, "percentage": 81.34, "elapsed_time": "2:29:35", "remaining_time": "0:34:18", "throughput": 15461.76, "total_tokens": 138772480} +{"current_steps": 16950, "total_steps": 20825, "loss": 0.8897, "learning_rate": 4.5670649407984625e-06, "epoch": 0.8139255702280912, "percentage": 81.39, "elapsed_time": "2:30:20", "remaining_time": "0:34:22", "throughput": 15393.77, "total_tokens": 138854400} +{"current_steps": 16960, "total_steps": 20825, "loss": 0.7806, "learning_rate": 4.544264034973686e-06, "epoch": 0.814405762304922, "percentage": 81.44, "elapsed_time": "2:31:05", "remaining_time": "0:34:26", "throughput": 15325.06, "total_tokens": 138936320} +{"current_steps": 16970, "total_steps": 20825, "loss": 0.9632, "learning_rate": 4.521514496642074e-06, "epoch": 0.8148859543817527, "percentage": 81.49, "elapsed_time": "2:31:51", "remaining_time": "0:34:29", "throughput": 15258.19, "total_tokens": 139018240} +{"current_steps": 16980, "total_steps": 20825, "loss": 0.9245, "learning_rate": 4.498816382931217e-06, "epoch": 0.8153661464585834, "percentage": 81.54, "elapsed_time": "2:32:36", "remaining_time": "0:34:33", "throughput": 15191.97, "total_tokens": 139100160} +{"current_steps": 16990, "total_steps": 20825, "loss": 1.015, "learning_rate": 4.476169750839571e-06, "epoch": 0.8158463385354142, "percentage": 81.58, "elapsed_time": "2:33:21", "remaining_time": "0:34:36", "throughput": 15125.89, "total_tokens": 139182080} +{"current_steps": 17000, "total_steps": 20825, "loss": 0.8941, "learning_rate": 4.45357465723629e-06, "epoch": 0.8163265306122449, "percentage": 81.63, "elapsed_time": "2:34:06", "remaining_time": "0:34:40", "throughput": 15060.98, "total_tokens": 139264000} +{"current_steps": 17010, "total_steps": 20825, "loss": 0.8841, "learning_rate": 4.4310311588611294e-06, "epoch": 0.8168067226890756, "percentage": 81.68, "elapsed_time": "2:34:54", "remaining_time": "0:34:44", "throughput": 14992.15, "total_tokens": 139345920} +{"current_steps": 17020, "total_steps": 20825, "loss": 0.8452, "learning_rate": 4.408539312324281e-06, "epoch": 0.8172869147659063, "percentage": 81.73, "elapsed_time": "2:35:39", "remaining_time": "0:34:47", "throughput": 14928.48, "total_tokens": 139427840} +{"current_steps": 17030, "total_steps": 20825, "loss": 0.8382, "learning_rate": 4.386099174106212e-06, "epoch": 0.8177671068427371, "percentage": 81.78, "elapsed_time": "2:36:25", "remaining_time": "0:34:51", "throughput": 14864.95, "total_tokens": 139509760} +{"current_steps": 17040, "total_steps": 20825, "loss": 0.9468, "learning_rate": 4.363710800557566e-06, "epoch": 0.8182472989195678, "percentage": 81.82, "elapsed_time": "2:37:10", "remaining_time": "0:34:54", "throughput": 14802.48, "total_tokens": 139591680} +{"current_steps": 17050, "total_steps": 20825, "loss": 0.7798, "learning_rate": 4.341374247898983e-06, "epoch": 0.8187274909963985, "percentage": 81.87, "elapsed_time": "2:37:55", "remaining_time": "0:34:57", "throughput": 14740.64, "total_tokens": 139673600} +{"current_steps": 17060, "total_steps": 20825, "loss": 0.949, "learning_rate": 4.3190895722209635e-06, "epoch": 0.8192076830732293, "percentage": 81.92, "elapsed_time": "2:38:40", "remaining_time": "0:35:01", "throughput": 14679.34, "total_tokens": 139755520} +{"current_steps": 17070, "total_steps": 20825, "loss": 0.8836, "learning_rate": 4.296856829483759e-06, "epoch": 0.81968787515006, "percentage": 81.97, "elapsed_time": "2:39:25", "remaining_time": "0:35:04", "throughput": 14618.45, "total_tokens": 139837440} +{"current_steps": 17080, "total_steps": 20825, "loss": 0.7409, "learning_rate": 4.274676075517206e-06, "epoch": 0.8201680672268907, "percentage": 82.02, "elapsed_time": "2:40:11", "remaining_time": "0:35:07", "throughput": 14558.23, "total_tokens": 139919360} +{"current_steps": 17090, "total_steps": 20825, "loss": 0.8346, "learning_rate": 4.252547366020568e-06, "epoch": 0.8206482593037215, "percentage": 82.06, "elapsed_time": "2:40:56", "remaining_time": "0:35:10", "throughput": 14498.54, "total_tokens": 140001280} +{"current_steps": 17100, "total_steps": 20825, "loss": 0.983, "learning_rate": 4.230470756562438e-06, "epoch": 0.8211284513805522, "percentage": 82.11, "elapsed_time": "2:41:41", "remaining_time": "0:35:13", "throughput": 14439.96, "total_tokens": 140083200} +{"current_steps": 17110, "total_steps": 20825, "loss": 0.7598, "learning_rate": 4.208446302580582e-06, "epoch": 0.8216086434573829, "percentage": 82.16, "elapsed_time": "2:42:26", "remaining_time": "0:35:16", "throughput": 14380.66, "total_tokens": 140165120} +{"current_steps": 17120, "total_steps": 20825, "loss": 0.7198, "learning_rate": 4.186474059381768e-06, "epoch": 0.8220888355342136, "percentage": 82.21, "elapsed_time": "2:43:12", "remaining_time": "0:35:19", "throughput": 14322.61, "total_tokens": 140247040} +{"current_steps": 17130, "total_steps": 20825, "loss": 0.8544, "learning_rate": 4.164554082141683e-06, "epoch": 0.8225690276110444, "percentage": 82.26, "elapsed_time": "2:43:57", "remaining_time": "0:35:21", "throughput": 14265.12, "total_tokens": 140328960} +{"current_steps": 17140, "total_steps": 20825, "loss": 0.8519, "learning_rate": 4.142686425904752e-06, "epoch": 0.8230492196878751, "percentage": 82.3, "elapsed_time": "2:44:42", "remaining_time": "0:35:24", "throughput": 14208.47, "total_tokens": 140410880} +{"current_steps": 17150, "total_steps": 20825, "loss": 0.8076, "learning_rate": 4.12087114558401e-06, "epoch": 0.8235294117647058, "percentage": 82.35, "elapsed_time": "2:45:27", "remaining_time": "0:35:27", "throughput": 14151.94, "total_tokens": 140492800} +{"current_steps": 17160, "total_steps": 20825, "loss": 0.7344, "learning_rate": 4.099108295960977e-06, "epoch": 0.8240096038415367, "percentage": 82.4, "elapsed_time": "2:46:12", "remaining_time": "0:35:29", "throughput": 14095.99, "total_tokens": 140574720} +{"current_steps": 17170, "total_steps": 20825, "loss": 0.8416, "learning_rate": 4.077397931685523e-06, "epoch": 0.8244897959183674, "percentage": 82.45, "elapsed_time": "2:46:58", "remaining_time": "0:35:32", "throughput": 14039.99, "total_tokens": 140656640} +{"current_steps": 17180, "total_steps": 20825, "loss": 1.1131, "learning_rate": 4.055740107275685e-06, "epoch": 0.824969987995198, "percentage": 82.5, "elapsed_time": "2:47:43", "remaining_time": "0:35:35", "throughput": 13984.77, "total_tokens": 140738560} +{"current_steps": 17190, "total_steps": 20825, "loss": 0.9831, "learning_rate": 4.0341348771175955e-06, "epoch": 0.8254501800720289, "percentage": 82.55, "elapsed_time": "2:48:28", "remaining_time": "0:35:37", "throughput": 13930.41, "total_tokens": 140820480} +{"current_steps": 17200, "total_steps": 20825, "loss": 0.8343, "learning_rate": 4.012582295465308e-06, "epoch": 0.8259303721488596, "percentage": 82.59, "elapsed_time": "2:49:14", "remaining_time": "0:35:40", "throughput": 13876.44, "total_tokens": 140902400} +{"current_steps": 17210, "total_steps": 20825, "loss": 0.8526, "learning_rate": 3.991082416440656e-06, "epoch": 0.8264105642256903, "percentage": 82.64, "elapsed_time": "2:49:59", "remaining_time": "0:35:42", "throughput": 13823.25, "total_tokens": 140984320} +{"current_steps": 17220, "total_steps": 20825, "loss": 0.7942, "learning_rate": 3.969635294033144e-06, "epoch": 0.826890756302521, "percentage": 82.69, "elapsed_time": "2:50:44", "remaining_time": "0:35:44", "throughput": 13770.6, "total_tokens": 141066240} +{"current_steps": 17230, "total_steps": 20825, "loss": 0.8681, "learning_rate": 3.9482409820997826e-06, "epoch": 0.8273709483793518, "percentage": 82.74, "elapsed_time": "2:51:29", "remaining_time": "0:35:46", "throughput": 13718.13, "total_tokens": 141148160} +{"current_steps": 17240, "total_steps": 20825, "loss": 0.9081, "learning_rate": 3.926899534364969e-06, "epoch": 0.8278511404561825, "percentage": 82.79, "elapsed_time": "2:52:14", "remaining_time": "0:35:48", "throughput": 13666.14, "total_tokens": 141230080} +{"current_steps": 17250, "total_steps": 20825, "loss": 0.8689, "learning_rate": 3.90561100442036e-06, "epoch": 0.8283313325330132, "percentage": 82.83, "elapsed_time": "2:52:59", "remaining_time": "0:35:51", "throughput": 13614.78, "total_tokens": 141312000} +{"current_steps": 17260, "total_steps": 20825, "loss": 1.0517, "learning_rate": 3.8843754457247275e-06, "epoch": 0.828811524609844, "percentage": 82.88, "elapsed_time": "2:53:44", "remaining_time": "0:35:53", "throughput": 13563.6, "total_tokens": 141393920} +{"current_steps": 17270, "total_steps": 20825, "loss": 0.9196, "learning_rate": 3.863192911603808e-06, "epoch": 0.8292917166866747, "percentage": 82.93, "elapsed_time": "2:54:29", "remaining_time": "0:35:55", "throughput": 13512.97, "total_tokens": 141475840} +{"current_steps": 17280, "total_steps": 20825, "loss": 0.9042, "learning_rate": 3.842063455250203e-06, "epoch": 0.8297719087635054, "percentage": 82.98, "elapsed_time": "2:55:14", "remaining_time": "0:35:57", "throughput": 13462.7, "total_tokens": 141557760} +{"current_steps": 17290, "total_steps": 20825, "loss": 0.867, "learning_rate": 3.820987129723228e-06, "epoch": 0.8302521008403362, "percentage": 83.03, "elapsed_time": "2:56:00", "remaining_time": "0:35:59", "throughput": 13412.84, "total_tokens": 141639680} +{"current_steps": 17300, "total_steps": 20825, "loss": 0.7882, "learning_rate": 3.799963987948757e-06, "epoch": 0.8307322929171669, "percentage": 83.07, "elapsed_time": "2:56:46", "remaining_time": "0:36:01", "throughput": 13362.03, "total_tokens": 141721600} +{"current_steps": 17310, "total_steps": 20825, "loss": 0.8897, "learning_rate": 3.7789940827191395e-06, "epoch": 0.8312124849939976, "percentage": 83.12, "elapsed_time": "2:57:31", "remaining_time": "0:36:02", "throughput": 13312.61, "total_tokens": 141803520} +{"current_steps": 17320, "total_steps": 20825, "loss": 0.8876, "learning_rate": 3.7580774666930134e-06, "epoch": 0.8316926770708283, "percentage": 83.17, "elapsed_time": "2:58:17", "remaining_time": "0:36:04", "throughput": 13263.76, "total_tokens": 141885440} +{"current_steps": 17330, "total_steps": 20825, "loss": 0.8931, "learning_rate": 3.737214192395225e-06, "epoch": 0.8321728691476591, "percentage": 83.22, "elapsed_time": "2:59:04", "remaining_time": "0:36:06", "throughput": 13213.42, "total_tokens": 141967360} +{"current_steps": 17340, "total_steps": 20825, "loss": 1.0343, "learning_rate": 3.7164043122166508e-06, "epoch": 0.8326530612244898, "percentage": 83.27, "elapsed_time": "2:59:49", "remaining_time": "0:36:08", "throughput": 13165.58, "total_tokens": 142049280} +{"current_steps": 17350, "total_steps": 20825, "loss": 1.0005, "learning_rate": 3.6956478784140937e-06, "epoch": 0.8331332533013205, "percentage": 83.31, "elapsed_time": "3:00:34", "remaining_time": "0:36:10", "throughput": 13117.85, "total_tokens": 142131200} +{"current_steps": 17360, "total_steps": 20825, "loss": 0.9079, "learning_rate": 3.674944943110156e-06, "epoch": 0.8336134453781513, "percentage": 83.36, "elapsed_time": "3:01:20", "remaining_time": "0:36:11", "throughput": 13070.78, "total_tokens": 142213120} +{"current_steps": 17370, "total_steps": 20825, "loss": 0.7459, "learning_rate": 3.6542955582930748e-06, "epoch": 0.834093637454982, "percentage": 83.41, "elapsed_time": "3:02:05", "remaining_time": "0:36:13", "throughput": 13024.1, "total_tokens": 142295040} +{"current_steps": 17380, "total_steps": 20825, "loss": 0.9866, "learning_rate": 3.6336997758166263e-06, "epoch": 0.8345738295318127, "percentage": 83.46, "elapsed_time": "3:02:56", "remaining_time": "0:36:15", "throughput": 12971.22, "total_tokens": 142376960} +{"current_steps": 17390, "total_steps": 20825, "loss": 0.775, "learning_rate": 3.6131576473999924e-06, "epoch": 0.8350540216086435, "percentage": 83.51, "elapsed_time": "3:03:47", "remaining_time": "0:36:18", "throughput": 12918.19, "total_tokens": 142458880} +{"current_steps": 17400, "total_steps": 20825, "loss": 0.916, "learning_rate": 3.592669224627601e-06, "epoch": 0.8355342136854742, "percentage": 83.55, "elapsed_time": "3:04:40", "remaining_time": "0:36:20", "throughput": 12864.57, "total_tokens": 142540800} +{"current_steps": 17410, "total_steps": 20825, "loss": 1.046, "learning_rate": 3.5722345589490306e-06, "epoch": 0.8360144057623049, "percentage": 83.6, "elapsed_time": "3:05:30", "remaining_time": "0:36:23", "throughput": 12813.37, "total_tokens": 142622720} +{"current_steps": 17420, "total_steps": 20825, "loss": 1.0183, "learning_rate": 3.5518537016788646e-06, "epoch": 0.8364945978391356, "percentage": 83.65, "elapsed_time": "3:06:17", "remaining_time": "0:36:24", "throughput": 12767.19, "total_tokens": 142704640} +{"current_steps": 17430, "total_steps": 20825, "loss": 0.8231, "learning_rate": 3.531526703996557e-06, "epoch": 0.8369747899159664, "percentage": 83.7, "elapsed_time": "3:07:02", "remaining_time": "0:36:25", "throughput": 12722.71, "total_tokens": 142786560} +{"current_steps": 17440, "total_steps": 20825, "loss": 0.9277, "learning_rate": 3.511253616946325e-06, "epoch": 0.8374549819927971, "percentage": 83.75, "elapsed_time": "3:07:48", "remaining_time": "0:36:27", "throughput": 12678.89, "total_tokens": 142868480} +{"current_steps": 17450, "total_steps": 20825, "loss": 0.8723, "learning_rate": 3.4910344914370093e-06, "epoch": 0.8379351740696278, "percentage": 83.79, "elapsed_time": "3:08:33", "remaining_time": "0:36:28", "throughput": 12635.12, "total_tokens": 142950400} +{"current_steps": 17460, "total_steps": 20825, "loss": 0.8936, "learning_rate": 3.4708693782419225e-06, "epoch": 0.8384153661464586, "percentage": 83.84, "elapsed_time": "3:09:18", "remaining_time": "0:36:29", "throughput": 12592.33, "total_tokens": 143032320} +{"current_steps": 17470, "total_steps": 20825, "loss": 0.8404, "learning_rate": 3.450758327998768e-06, "epoch": 0.8388955582232893, "percentage": 83.89, "elapsed_time": "3:10:03", "remaining_time": "0:36:30", "throughput": 12549.74, "total_tokens": 143114240} +{"current_steps": 17480, "total_steps": 20825, "loss": 0.9405, "learning_rate": 3.4307013912094845e-06, "epoch": 0.83937575030012, "percentage": 83.94, "elapsed_time": "3:10:48", "remaining_time": "0:36:30", "throughput": 12507.52, "total_tokens": 143196160} +{"current_steps": 17490, "total_steps": 20825, "loss": 0.6978, "learning_rate": 3.41069861824011e-06, "epoch": 0.8398559423769508, "percentage": 83.99, "elapsed_time": "3:11:34", "remaining_time": "0:36:31", "throughput": 12465.28, "total_tokens": 143278080} +{"current_steps": 17500, "total_steps": 20825, "loss": 0.9487, "learning_rate": 3.390750059320688e-06, "epoch": 0.8403361344537815, "percentage": 84.03, "elapsed_time": "3:12:19", "remaining_time": "0:36:32", "throughput": 12423.74, "total_tokens": 143360000} +{"current_steps": 17510, "total_steps": 20825, "loss": 0.7978, "learning_rate": 3.3708557645451053e-06, "epoch": 0.8408163265306122, "percentage": 84.08, "elapsed_time": "3:13:04", "remaining_time": "0:36:33", "throughput": 12382.38, "total_tokens": 143441920} +{"current_steps": 17520, "total_steps": 20825, "loss": 0.9229, "learning_rate": 3.3510157838709895e-06, "epoch": 0.8412965186074429, "percentage": 84.13, "elapsed_time": "3:13:49", "remaining_time": "0:36:33", "throughput": 12341.07, "total_tokens": 143523840} +{"current_steps": 17530, "total_steps": 20825, "loss": 1.0837, "learning_rate": 3.3312301671195784e-06, "epoch": 0.8417767106842737, "percentage": 84.18, "elapsed_time": "3:14:34", "remaining_time": "0:36:34", "throughput": 12300.36, "total_tokens": 143605760} +{"current_steps": 17540, "total_steps": 20825, "loss": 0.8367, "learning_rate": 3.3114989639755983e-06, "epoch": 0.8422569027611044, "percentage": 84.23, "elapsed_time": "3:15:20", "remaining_time": "0:36:35", "throughput": 12260.0, "total_tokens": 143687680} +{"current_steps": 17550, "total_steps": 20825, "loss": 0.863, "learning_rate": 3.2918222239871206e-06, "epoch": 0.8427370948379351, "percentage": 84.27, "elapsed_time": "3:16:05", "remaining_time": "0:36:35", "throughput": 12219.76, "total_tokens": 143769600} +{"current_steps": 17560, "total_steps": 20825, "loss": 0.8599, "learning_rate": 3.272199996565464e-06, "epoch": 0.8432172869147659, "percentage": 84.32, "elapsed_time": "3:16:50", "remaining_time": "0:36:35", "throughput": 12179.96, "total_tokens": 143851520} +{"current_steps": 17570, "total_steps": 20825, "loss": 0.8835, "learning_rate": 3.252632330985059e-06, "epoch": 0.8436974789915966, "percentage": 84.37, "elapsed_time": "3:17:35", "remaining_time": "0:36:36", "throughput": 12140.27, "total_tokens": 143933440} +{"current_steps": 17580, "total_steps": 20825, "loss": 0.8098, "learning_rate": 3.233119276383309e-06, "epoch": 0.8441776710684273, "percentage": 84.42, "elapsed_time": "3:18:21", "remaining_time": "0:36:36", "throughput": 12100.92, "total_tokens": 144015360} +{"current_steps": 17590, "total_steps": 20825, "loss": 0.8136, "learning_rate": 3.2136608817604998e-06, "epoch": 0.8446578631452581, "percentage": 84.47, "elapsed_time": "3:19:06", "remaining_time": "0:36:37", "throughput": 12062.05, "total_tokens": 144097280} +{"current_steps": 17600, "total_steps": 20825, "loss": 0.9242, "learning_rate": 3.1942571959796414e-06, "epoch": 0.8451380552220888, "percentage": 84.51, "elapsed_time": "3:19:51", "remaining_time": "0:36:37", "throughput": 12023.51, "total_tokens": 144179200} +{"current_steps": 17610, "total_steps": 20825, "loss": 0.9447, "learning_rate": 3.1749082677663606e-06, "epoch": 0.8456182472989195, "percentage": 84.56, "elapsed_time": "3:20:36", "remaining_time": "0:36:37", "throughput": 11985.33, "total_tokens": 144261120} +{"current_steps": 17620, "total_steps": 20825, "loss": 1.0145, "learning_rate": 3.1556141457087932e-06, "epoch": 0.8460984393757504, "percentage": 84.61, "elapsed_time": "3:21:21", "remaining_time": "0:36:37", "throughput": 11947.36, "total_tokens": 144343040} +{"current_steps": 17630, "total_steps": 20825, "loss": 0.8731, "learning_rate": 3.1363748782574475e-06, "epoch": 0.846578631452581, "percentage": 84.66, "elapsed_time": "3:22:06", "remaining_time": "0:36:37", "throughput": 11909.55, "total_tokens": 144424960} +{"current_steps": 17640, "total_steps": 20825, "loss": 0.8883, "learning_rate": 3.1171905137250655e-06, "epoch": 0.8470588235294118, "percentage": 84.71, "elapsed_time": "3:22:51", "remaining_time": "0:36:37", "throughput": 11872.14, "total_tokens": 144506880} +{"current_steps": 17650, "total_steps": 20825, "loss": 0.8102, "learning_rate": 3.098061100286537e-06, "epoch": 0.8475390156062425, "percentage": 84.75, "elapsed_time": "3:23:37", "remaining_time": "0:36:37", "throughput": 11834.47, "total_tokens": 144588800} +{"current_steps": 17660, "total_steps": 20825, "loss": 1.0013, "learning_rate": 3.078986685978763e-06, "epoch": 0.8480192076830733, "percentage": 84.8, "elapsed_time": "3:24:22", "remaining_time": "0:36:37", "throughput": 11797.64, "total_tokens": 144670720} +{"current_steps": 17670, "total_steps": 20825, "loss": 0.7933, "learning_rate": 3.059967318700513e-06, "epoch": 0.848499399759904, "percentage": 84.85, "elapsed_time": "3:25:08", "remaining_time": "0:36:37", "throughput": 11760.72, "total_tokens": 144752640} +{"current_steps": 17680, "total_steps": 20825, "loss": 0.8733, "learning_rate": 3.0410030462123486e-06, "epoch": 0.8489795918367347, "percentage": 84.9, "elapsed_time": "3:25:53", "remaining_time": "0:36:37", "throughput": 11724.26, "total_tokens": 144834560} +{"current_steps": 17690, "total_steps": 20825, "loss": 1.1693, "learning_rate": 3.022093916136465e-06, "epoch": 0.8494597839135655, "percentage": 84.95, "elapsed_time": "3:26:38", "remaining_time": "0:36:37", "throughput": 11688.0, "total_tokens": 144916480} +{"current_steps": 17700, "total_steps": 20825, "loss": 0.8838, "learning_rate": 3.0032399759565845e-06, "epoch": 0.8499399759903962, "percentage": 84.99, "elapsed_time": "3:27:23", "remaining_time": "0:36:37", "throughput": 11652.18, "total_tokens": 144998400} +{"current_steps": 17710, "total_steps": 20825, "loss": 0.93, "learning_rate": 2.9844412730178515e-06, "epoch": 0.8504201680672269, "percentage": 85.04, "elapsed_time": "3:28:08", "remaining_time": "0:36:36", "throughput": 11616.84, "total_tokens": 145080320} +{"current_steps": 17720, "total_steps": 20825, "loss": 0.9282, "learning_rate": 2.9656978545267002e-06, "epoch": 0.8509003601440577, "percentage": 85.09, "elapsed_time": "3:28:53", "remaining_time": "0:36:36", "throughput": 11581.7, "total_tokens": 145162240} +{"current_steps": 17730, "total_steps": 20825, "loss": 0.9096, "learning_rate": 2.947009767550718e-06, "epoch": 0.8513805522208884, "percentage": 85.14, "elapsed_time": "3:29:38", "remaining_time": "0:36:35", "throughput": 11546.67, "total_tokens": 145244160} +{"current_steps": 17740, "total_steps": 20825, "loss": 1.0297, "learning_rate": 2.9283770590185696e-06, "epoch": 0.8518607442977191, "percentage": 85.19, "elapsed_time": "3:30:24", "remaining_time": "0:36:35", "throughput": 11511.8, "total_tokens": 145326080} +{"current_steps": 17750, "total_steps": 20825, "loss": 1.1381, "learning_rate": 2.9097997757198516e-06, "epoch": 0.8523409363745498, "percentage": 85.23, "elapsed_time": "3:31:09", "remaining_time": "0:36:34", "throughput": 11477.2, "total_tokens": 145408000} +{"current_steps": 17760, "total_steps": 20825, "loss": 0.8219, "learning_rate": 2.891277964304959e-06, "epoch": 0.8528211284513806, "percentage": 85.28, "elapsed_time": "3:31:54", "remaining_time": "0:36:34", "throughput": 11442.73, "total_tokens": 145489920} +{"current_steps": 17770, "total_steps": 20825, "loss": 0.8588, "learning_rate": 2.8728116712850193e-06, "epoch": 0.8533013205282113, "percentage": 85.33, "elapsed_time": "3:32:39", "remaining_time": "0:36:33", "throughput": 11408.66, "total_tokens": 145571840} +{"current_steps": 17780, "total_steps": 20825, "loss": 0.9943, "learning_rate": 2.8544009430317153e-06, "epoch": 0.853781512605042, "percentage": 85.38, "elapsed_time": "3:33:24", "remaining_time": "0:36:32", "throughput": 11375.05, "total_tokens": 145653760} +{"current_steps": 17790, "total_steps": 20825, "loss": 0.9051, "learning_rate": 2.8360458257772228e-06, "epoch": 0.8542617046818728, "percentage": 85.43, "elapsed_time": "3:34:10", "remaining_time": "0:36:32", "throughput": 11341.04, "total_tokens": 145735680} +{"current_steps": 17800, "total_steps": 20825, "loss": 0.8999, "learning_rate": 2.817746365614049e-06, "epoch": 0.8547418967587035, "percentage": 85.47, "elapsed_time": "3:34:55", "remaining_time": "0:36:31", "throughput": 11307.67, "total_tokens": 145817600} +{"current_steps": 17810, "total_steps": 20825, "loss": 0.9312, "learning_rate": 2.7995026084949584e-06, "epoch": 0.8552220888355342, "percentage": 85.52, "elapsed_time": "3:35:40", "remaining_time": "0:36:30", "throughput": 11274.6, "total_tokens": 145899520} +{"current_steps": 17820, "total_steps": 20825, "loss": 1.0525, "learning_rate": 2.781314600232815e-06, "epoch": 0.855702280912365, "percentage": 85.57, "elapsed_time": "3:36:25", "remaining_time": "0:36:29", "throughput": 11241.64, "total_tokens": 145981440} +{"current_steps": 17830, "total_steps": 20825, "loss": 0.8697, "learning_rate": 2.763182386500504e-06, "epoch": 0.8561824729891957, "percentage": 85.62, "elapsed_time": "3:37:11", "remaining_time": "0:36:28", "throughput": 11208.69, "total_tokens": 146063360} +{"current_steps": 17840, "total_steps": 20825, "loss": 0.9403, "learning_rate": 2.745106012830806e-06, "epoch": 0.8566626650660264, "percentage": 85.67, "elapsed_time": "3:37:56", "remaining_time": "0:36:27", "throughput": 11176.36, "total_tokens": 146145280} +{"current_steps": 17850, "total_steps": 20825, "loss": 1.0035, "learning_rate": 2.7270855246162547e-06, "epoch": 0.8571428571428571, "percentage": 85.71, "elapsed_time": "3:38:41", "remaining_time": "0:36:26", "throughput": 11144.25, "total_tokens": 146227200} +{"current_steps": 17860, "total_steps": 20825, "loss": 0.9146, "learning_rate": 2.7091209671090715e-06, "epoch": 0.8576230492196879, "percentage": 85.76, "elapsed_time": "3:39:26", "remaining_time": "0:36:25", "throughput": 11112.29, "total_tokens": 146309120} +{"current_steps": 17870, "total_steps": 20825, "loss": 0.8785, "learning_rate": 2.6912123854210212e-06, "epoch": 0.8581032412965186, "percentage": 85.81, "elapsed_time": "3:40:11", "remaining_time": "0:36:24", "throughput": 11080.6, "total_tokens": 146391040} +{"current_steps": 17880, "total_steps": 20825, "loss": 0.9372, "learning_rate": 2.673359824523297e-06, "epoch": 0.8585834333733493, "percentage": 85.86, "elapsed_time": "3:40:56", "remaining_time": "0:36:23", "throughput": 11049.17, "total_tokens": 146472960} +{"current_steps": 17890, "total_steps": 20825, "loss": 0.9457, "learning_rate": 2.655563329246413e-06, "epoch": 0.8590636254501801, "percentage": 85.91, "elapsed_time": "3:41:41", "remaining_time": "0:36:22", "throughput": 11017.8, "total_tokens": 146554880} +{"current_steps": 17900, "total_steps": 20825, "loss": 0.8075, "learning_rate": 2.637822944280116e-06, "epoch": 0.8595438175270108, "percentage": 85.95, "elapsed_time": "3:42:26", "remaining_time": "0:36:20", "throughput": 10986.65, "total_tokens": 146636800} +{"current_steps": 17910, "total_steps": 20825, "loss": 0.9612, "learning_rate": 2.6201387141732205e-06, "epoch": 0.8600240096038415, "percentage": 86.0, "elapsed_time": "3:43:11", "remaining_time": "0:36:19", "throughput": 10955.98, "total_tokens": 146718720} +{"current_steps": 17920, "total_steps": 20825, "loss": 1.0508, "learning_rate": 2.6025106833335505e-06, "epoch": 0.8605042016806723, "percentage": 86.05, "elapsed_time": "3:43:56", "remaining_time": "0:36:18", "throughput": 10925.21, "total_tokens": 146800640} +{"current_steps": 17930, "total_steps": 20825, "loss": 0.7723, "learning_rate": 2.5849388960277997e-06, "epoch": 0.860984393757503, "percentage": 86.1, "elapsed_time": "3:44:42", "remaining_time": "0:36:16", "throughput": 10894.13, "total_tokens": 146882560} +{"current_steps": 17940, "total_steps": 20825, "loss": 0.783, "learning_rate": 2.567423396381419e-06, "epoch": 0.8614645858343337, "percentage": 86.15, "elapsed_time": "3:45:27", "remaining_time": "0:36:15", "throughput": 10863.85, "total_tokens": 146964480} +{"current_steps": 17950, "total_steps": 20825, "loss": 0.7405, "learning_rate": 2.549964228378518e-06, "epoch": 0.8619447779111644, "percentage": 86.19, "elapsed_time": "3:46:13", "remaining_time": "0:36:13", "throughput": 10833.74, "total_tokens": 147046400} +{"current_steps": 17960, "total_steps": 20825, "loss": 0.9065, "learning_rate": 2.532561435861755e-06, "epoch": 0.8624249699879952, "percentage": 86.24, "elapsed_time": "3:46:58", "remaining_time": "0:36:12", "throughput": 10803.92, "total_tokens": 147128320} +{"current_steps": 17970, "total_steps": 20825, "loss": 0.8906, "learning_rate": 2.515215062532206e-06, "epoch": 0.8629051620648259, "percentage": 86.29, "elapsed_time": "3:47:43", "remaining_time": "0:36:10", "throughput": 10774.0, "total_tokens": 147210240} +{"current_steps": 17980, "total_steps": 20825, "loss": 0.9354, "learning_rate": 2.497925151949271e-06, "epoch": 0.8633853541416566, "percentage": 86.34, "elapsed_time": "3:48:28", "remaining_time": "0:36:09", "throughput": 10744.45, "total_tokens": 147292160} +{"current_steps": 17990, "total_steps": 20825, "loss": 0.985, "learning_rate": 2.4806917475305806e-06, "epoch": 0.8638655462184874, "percentage": 86.39, "elapsed_time": "3:49:13", "remaining_time": "0:36:07", "throughput": 10715.27, "total_tokens": 147374080} +{"current_steps": 18000, "total_steps": 20825, "loss": 0.8599, "learning_rate": 2.4635148925518577e-06, "epoch": 0.8643457382953181, "percentage": 86.43, "elapsed_time": "3:49:58", "remaining_time": "0:36:05", "throughput": 10686.14, "total_tokens": 147456000} +{"current_steps": 18010, "total_steps": 20825, "loss": 0.8387, "learning_rate": 2.4463946301468143e-06, "epoch": 0.8648259303721488, "percentage": 86.48, "elapsed_time": "3:50:48", "remaining_time": "0:36:04", "throughput": 10654.09, "total_tokens": 147537920} +{"current_steps": 18020, "total_steps": 20825, "loss": 0.9122, "learning_rate": 2.4293310033070614e-06, "epoch": 0.8653061224489796, "percentage": 86.53, "elapsed_time": "3:51:33", "remaining_time": "0:36:02", "throughput": 10625.42, "total_tokens": 147619840} +{"current_steps": 18030, "total_steps": 20825, "loss": 0.9507, "learning_rate": 2.4123240548819955e-06, "epoch": 0.8657863145258103, "percentage": 86.58, "elapsed_time": "3:52:18", "remaining_time": "0:36:00", "throughput": 10596.79, "total_tokens": 147701760} +{"current_steps": 18040, "total_steps": 20825, "loss": 0.7972, "learning_rate": 2.3953738275786565e-06, "epoch": 0.866266506602641, "percentage": 86.63, "elapsed_time": "3:53:03", "remaining_time": "0:35:58", "throughput": 10568.51, "total_tokens": 147783680} +{"current_steps": 18050, "total_steps": 20825, "loss": 0.8777, "learning_rate": 2.3784803639616854e-06, "epoch": 0.8667466986794717, "percentage": 86.67, "elapsed_time": "3:53:48", "remaining_time": "0:35:56", "throughput": 10540.33, "total_tokens": 147865600} +{"current_steps": 18060, "total_steps": 20825, "loss": 0.8028, "learning_rate": 2.361643706453151e-06, "epoch": 0.8672268907563025, "percentage": 86.72, "elapsed_time": "3:54:33", "remaining_time": "0:35:54", "throughput": 10512.3, "total_tokens": 147947520} +{"current_steps": 18070, "total_steps": 20825, "loss": 0.872, "learning_rate": 2.3448638973324833e-06, "epoch": 0.8677070828331332, "percentage": 86.77, "elapsed_time": "3:55:18", "remaining_time": "0:35:52", "throughput": 10484.5, "total_tokens": 148029440} +{"current_steps": 18080, "total_steps": 20825, "loss": 1.2244, "learning_rate": 2.328140978736365e-06, "epoch": 0.868187274909964, "percentage": 86.82, "elapsed_time": "3:56:04", "remaining_time": "0:35:50", "throughput": 10456.8, "total_tokens": 148111360} +{"current_steps": 18090, "total_steps": 20825, "loss": 0.8573, "learning_rate": 2.311474992658613e-06, "epoch": 0.8686674669867948, "percentage": 86.87, "elapsed_time": "3:56:49", "remaining_time": "0:35:48", "throughput": 10429.12, "total_tokens": 148193280} +{"current_steps": 18100, "total_steps": 20825, "loss": 0.7746, "learning_rate": 2.29486598095007e-06, "epoch": 0.8691476590636255, "percentage": 86.91, "elapsed_time": "3:57:34", "remaining_time": "0:35:46", "throughput": 10401.7, "total_tokens": 148275200} +{"current_steps": 18110, "total_steps": 20825, "loss": 0.9389, "learning_rate": 2.278313985318517e-06, "epoch": 0.8696278511404562, "percentage": 86.96, "elapsed_time": "3:58:20", "remaining_time": "0:35:43", "throughput": 10374.58, "total_tokens": 148357120} +{"current_steps": 18120, "total_steps": 20825, "loss": 0.8541, "learning_rate": 2.261819047328562e-06, "epoch": 0.870108043217287, "percentage": 87.01, "elapsed_time": "3:59:05", "remaining_time": "0:35:41", "throughput": 10347.33, "total_tokens": 148439040} +{"current_steps": 18130, "total_steps": 20825, "loss": 0.9053, "learning_rate": 2.2453812084015175e-06, "epoch": 0.8705882352941177, "percentage": 87.06, "elapsed_time": "3:59:50", "remaining_time": "0:35:39", "throughput": 10320.59, "total_tokens": 148520960} +{"current_steps": 18140, "total_steps": 20825, "loss": 1.2452, "learning_rate": 2.2290005098153296e-06, "epoch": 0.8710684273709484, "percentage": 87.11, "elapsed_time": "4:00:36", "remaining_time": "0:35:36", "throughput": 10293.87, "total_tokens": 148602880} +{"current_steps": 18150, "total_steps": 20825, "loss": 0.9268, "learning_rate": 2.212676992704435e-06, "epoch": 0.8715486194477791, "percentage": 87.15, "elapsed_time": "4:01:21", "remaining_time": "0:35:34", "throughput": 10267.46, "total_tokens": 148684800} +{"current_steps": 18160, "total_steps": 20825, "loss": 0.6561, "learning_rate": 2.1964106980597034e-06, "epoch": 0.8720288115246099, "percentage": 87.2, "elapsed_time": "4:02:06", "remaining_time": "0:35:31", "throughput": 10241.17, "total_tokens": 148766720} +{"current_steps": 18170, "total_steps": 20825, "loss": 0.8747, "learning_rate": 2.1802016667282847e-06, "epoch": 0.8725090036014406, "percentage": 87.25, "elapsed_time": "4:02:51", "remaining_time": "0:35:29", "throughput": 10214.92, "total_tokens": 148848640} +{"current_steps": 18180, "total_steps": 20825, "loss": 0.8711, "learning_rate": 2.1640499394135595e-06, "epoch": 0.8729891956782713, "percentage": 87.3, "elapsed_time": "4:03:36", "remaining_time": "0:35:26", "throughput": 10189.0, "total_tokens": 148930560} +{"current_steps": 18190, "total_steps": 20825, "loss": 0.9279, "learning_rate": 2.1479555566749825e-06, "epoch": 0.8734693877551021, "percentage": 87.35, "elapsed_time": "4:04:22", "remaining_time": "0:35:23", "throughput": 10162.97, "total_tokens": 149012480} +{"current_steps": 18200, "total_steps": 20825, "loss": 0.9047, "learning_rate": 2.131918558928023e-06, "epoch": 0.8739495798319328, "percentage": 87.39, "elapsed_time": "4:05:07", "remaining_time": "0:35:21", "throughput": 10137.23, "total_tokens": 149094400} +{"current_steps": 18210, "total_steps": 20825, "loss": 0.8876, "learning_rate": 2.1159389864440495e-06, "epoch": 0.8744297719087635, "percentage": 87.44, "elapsed_time": "4:05:52", "remaining_time": "0:35:18", "throughput": 10111.82, "total_tokens": 149176320} +{"current_steps": 18220, "total_steps": 20825, "loss": 0.7592, "learning_rate": 2.100016879350214e-06, "epoch": 0.8749099639855943, "percentage": 87.49, "elapsed_time": "4:06:38", "remaining_time": "0:35:15", "throughput": 10086.38, "total_tokens": 149258240} +{"current_steps": 18230, "total_steps": 20825, "loss": 0.8473, "learning_rate": 2.0841522776293725e-06, "epoch": 0.875390156062425, "percentage": 87.54, "elapsed_time": "4:07:23", "remaining_time": "0:35:12", "throughput": 10061.0, "total_tokens": 149340160} +{"current_steps": 18240, "total_steps": 20825, "loss": 1.1182, "learning_rate": 2.0683452211199854e-06, "epoch": 0.8758703481392557, "percentage": 87.59, "elapsed_time": "4:08:08", "remaining_time": "0:35:10", "throughput": 10035.92, "total_tokens": 149422080} +{"current_steps": 18250, "total_steps": 20825, "loss": 0.8305, "learning_rate": 2.052595749515987e-06, "epoch": 0.8763505402160864, "percentage": 87.64, "elapsed_time": "4:08:53", "remaining_time": "0:35:07", "throughput": 10011.07, "total_tokens": 149504000} +{"current_steps": 18260, "total_steps": 20825, "loss": 0.9346, "learning_rate": 2.0369039023667215e-06, "epoch": 0.8768307322929172, "percentage": 87.68, "elapsed_time": "4:09:39", "remaining_time": "0:35:04", "throughput": 9986.36, "total_tokens": 149585920} +{"current_steps": 18270, "total_steps": 20825, "loss": 0.9082, "learning_rate": 2.0212697190768263e-06, "epoch": 0.8773109243697479, "percentage": 87.73, "elapsed_time": "4:10:24", "remaining_time": "0:35:01", "throughput": 9961.65, "total_tokens": 149667840} +{"current_steps": 18280, "total_steps": 20825, "loss": 0.8169, "learning_rate": 2.0056932389061338e-06, "epoch": 0.8777911164465786, "percentage": 87.78, "elapsed_time": "4:11:09", "remaining_time": "0:34:58", "throughput": 9937.19, "total_tokens": 149749760} +{"current_steps": 18290, "total_steps": 20825, "loss": 0.9433, "learning_rate": 1.9901745009695773e-06, "epoch": 0.8782713085234094, "percentage": 87.83, "elapsed_time": "4:11:54", "remaining_time": "0:34:54", "throughput": 9912.97, "total_tokens": 149831680} +{"current_steps": 18300, "total_steps": 20825, "loss": 0.8976, "learning_rate": 1.9747135442370946e-06, "epoch": 0.8787515006002401, "percentage": 87.88, "elapsed_time": "4:12:39", "remaining_time": "0:34:51", "throughput": 9888.88, "total_tokens": 149913600} +{"current_steps": 18310, "total_steps": 20825, "loss": 0.7622, "learning_rate": 1.9593104075335158e-06, "epoch": 0.8792316926770708, "percentage": 87.92, "elapsed_time": "4:13:25", "remaining_time": "0:34:48", "throughput": 9864.85, "total_tokens": 149995520} +{"current_steps": 18320, "total_steps": 20825, "loss": 0.8789, "learning_rate": 1.943965129538483e-06, "epoch": 0.8797118847539016, "percentage": 87.97, "elapsed_time": "4:14:10", "remaining_time": "0:34:45", "throughput": 9840.94, "total_tokens": 150077440} +{"current_steps": 18330, "total_steps": 20825, "loss": 0.8331, "learning_rate": 1.9286777487863477e-06, "epoch": 0.8801920768307323, "percentage": 88.02, "elapsed_time": "4:14:55", "remaining_time": "0:34:41", "throughput": 9817.36, "total_tokens": 150159360} +{"current_steps": 18340, "total_steps": 20825, "loss": 0.9994, "learning_rate": 1.913448303666071e-06, "epoch": 0.880672268907563, "percentage": 88.07, "elapsed_time": "4:15:40", "remaining_time": "0:34:38", "throughput": 9793.66, "total_tokens": 150241280} +{"current_steps": 18350, "total_steps": 20825, "loss": 0.9293, "learning_rate": 1.8982768324211197e-06, "epoch": 0.8811524609843937, "percentage": 88.12, "elapsed_time": "4:16:25", "remaining_time": "0:34:35", "throughput": 9770.45, "total_tokens": 150323200} +{"current_steps": 18360, "total_steps": 20825, "loss": 0.9782, "learning_rate": 1.8831633731493963e-06, "epoch": 0.8816326530612245, "percentage": 88.16, "elapsed_time": "4:17:10", "remaining_time": "0:34:31", "throughput": 9747.27, "total_tokens": 150405120} +{"current_steps": 18370, "total_steps": 20825, "loss": 0.8177, "learning_rate": 1.8681079638031062e-06, "epoch": 0.8821128451380552, "percentage": 88.21, "elapsed_time": "4:17:55", "remaining_time": "0:34:28", "throughput": 9724.08, "total_tokens": 150487040} +{"current_steps": 18380, "total_steps": 20825, "loss": 0.8863, "learning_rate": 1.8531106421887017e-06, "epoch": 0.8825930372148859, "percentage": 88.26, "elapsed_time": "4:18:40", "remaining_time": "0:34:24", "throughput": 9701.12, "total_tokens": 150568960} +{"current_steps": 18390, "total_steps": 20825, "loss": 0.7228, "learning_rate": 1.8381714459667603e-06, "epoch": 0.8830732292917167, "percentage": 88.31, "elapsed_time": "4:19:26", "remaining_time": "0:34:21", "throughput": 9678.01, "total_tokens": 150650880} +{"current_steps": 18400, "total_steps": 20825, "loss": 1.0011, "learning_rate": 1.823290412651893e-06, "epoch": 0.8835534213685474, "percentage": 88.36, "elapsed_time": "4:20:11", "remaining_time": "0:34:17", "throughput": 9655.27, "total_tokens": 150732800} +{"current_steps": 18410, "total_steps": 20825, "loss": 1.1894, "learning_rate": 1.8084675796126576e-06, "epoch": 0.8840336134453781, "percentage": 88.4, "elapsed_time": "4:20:56", "remaining_time": "0:34:13", "throughput": 9632.43, "total_tokens": 150814720} +{"current_steps": 18420, "total_steps": 20825, "loss": 1.0122, "learning_rate": 1.7937029840714715e-06, "epoch": 0.8845138055222089, "percentage": 88.45, "elapsed_time": "4:21:42", "remaining_time": "0:34:10", "throughput": 9609.45, "total_tokens": 150896640} +{"current_steps": 18430, "total_steps": 20825, "loss": 0.836, "learning_rate": 1.778996663104493e-06, "epoch": 0.8849939975990396, "percentage": 88.5, "elapsed_time": "4:22:27", "remaining_time": "0:34:06", "throughput": 9587.19, "total_tokens": 150978560} +{"current_steps": 18440, "total_steps": 20825, "loss": 0.9355, "learning_rate": 1.7643486536415537e-06, "epoch": 0.8854741896758703, "percentage": 88.55, "elapsed_time": "4:23:13", "remaining_time": "0:34:02", "throughput": 9564.94, "total_tokens": 151060480} +{"current_steps": 18450, "total_steps": 20825, "loss": 0.8795, "learning_rate": 1.7497589924660552e-06, "epoch": 0.885954381752701, "percentage": 88.6, "elapsed_time": "4:23:58", "remaining_time": "0:33:58", "throughput": 9542.69, "total_tokens": 151142400} +{"current_steps": 18460, "total_steps": 20825, "loss": 0.814, "learning_rate": 1.7352277162148712e-06, "epoch": 0.8864345738295318, "percentage": 88.64, "elapsed_time": "4:24:43", "remaining_time": "0:33:54", "throughput": 9520.55, "total_tokens": 151224320} +{"current_steps": 18470, "total_steps": 20825, "loss": 0.8757, "learning_rate": 1.7207548613782709e-06, "epoch": 0.8869147659063625, "percentage": 88.69, "elapsed_time": "4:25:29", "remaining_time": "0:33:51", "throughput": 9498.73, "total_tokens": 151306240} +{"current_steps": 18480, "total_steps": 20825, "loss": 1.0152, "learning_rate": 1.7063404642998186e-06, "epoch": 0.8873949579831932, "percentage": 88.74, "elapsed_time": "4:26:14", "remaining_time": "0:33:47", "throughput": 9477.05, "total_tokens": 151388160} +{"current_steps": 18490, "total_steps": 20825, "loss": 0.9454, "learning_rate": 1.6919845611762714e-06, "epoch": 0.887875150060024, "percentage": 88.79, "elapsed_time": "4:26:59", "remaining_time": "0:33:43", "throughput": 9455.31, "total_tokens": 151470080} +{"current_steps": 18500, "total_steps": 20825, "loss": 1.0313, "learning_rate": 1.6776871880575084e-06, "epoch": 0.8883553421368547, "percentage": 88.84, "elapsed_time": "4:27:44", "remaining_time": "0:33:38", "throughput": 9433.85, "total_tokens": 151552000} +{"current_steps": 18510, "total_steps": 20825, "loss": 0.8417, "learning_rate": 1.663448380846433e-06, "epoch": 0.8888355342136854, "percentage": 88.88, "elapsed_time": "4:28:29", "remaining_time": "0:33:34", "throughput": 9412.57, "total_tokens": 151633920} +{"current_steps": 18520, "total_steps": 20825, "loss": 0.8187, "learning_rate": 1.649268175298868e-06, "epoch": 0.8893157262905163, "percentage": 88.93, "elapsed_time": "4:29:15", "remaining_time": "0:33:30", "throughput": 9391.25, "total_tokens": 151715840} +{"current_steps": 18530, "total_steps": 20825, "loss": 1.1659, "learning_rate": 1.6351466070234882e-06, "epoch": 0.889795918367347, "percentage": 88.98, "elapsed_time": "4:30:00", "remaining_time": "0:33:26", "throughput": 9370.01, "total_tokens": 151797760} +{"current_steps": 18540, "total_steps": 20825, "loss": 0.8884, "learning_rate": 1.6210837114817272e-06, "epoch": 0.8902761104441776, "percentage": 89.03, "elapsed_time": "4:30:45", "remaining_time": "0:33:22", "throughput": 9349.01, "total_tokens": 151879680} +{"current_steps": 18550, "total_steps": 20825, "loss": 0.7856, "learning_rate": 1.6070795239876618e-06, "epoch": 0.8907563025210085, "percentage": 89.08, "elapsed_time": "4:31:30", "remaining_time": "0:33:17", "throughput": 9328.09, "total_tokens": 151961600} +{"current_steps": 18560, "total_steps": 20825, "loss": 0.7931, "learning_rate": 1.5931340797079613e-06, "epoch": 0.8912364945978392, "percentage": 89.12, "elapsed_time": "4:32:15", "remaining_time": "0:33:13", "throughput": 9307.32, "total_tokens": 152043520} +{"current_steps": 18570, "total_steps": 20825, "loss": 0.8341, "learning_rate": 1.5792474136617858e-06, "epoch": 0.8917166866746699, "percentage": 89.17, "elapsed_time": "4:33:00", "remaining_time": "0:33:09", "throughput": 9286.74, "total_tokens": 152125440} +{"current_steps": 18580, "total_steps": 20825, "loss": 0.8317, "learning_rate": 1.5654195607206712e-06, "epoch": 0.8921968787515006, "percentage": 89.22, "elapsed_time": "4:33:46", "remaining_time": "0:33:04", "throughput": 9266.18, "total_tokens": 152207360} +{"current_steps": 18590, "total_steps": 20825, "loss": 0.859, "learning_rate": 1.5516505556084888e-06, "epoch": 0.8926770708283314, "percentage": 89.27, "elapsed_time": "4:34:31", "remaining_time": "0:33:00", "throughput": 9245.61, "total_tokens": 152289280} +{"current_steps": 18600, "total_steps": 20825, "loss": 1.0143, "learning_rate": 1.5379404329013246e-06, "epoch": 0.8931572629051621, "percentage": 89.32, "elapsed_time": "4:35:16", "remaining_time": "0:32:55", "throughput": 9225.26, "total_tokens": 152371200} +{"current_steps": 18610, "total_steps": 20825, "loss": 0.8301, "learning_rate": 1.5242892270273951e-06, "epoch": 0.8936374549819928, "percentage": 89.36, "elapsed_time": "4:36:01", "remaining_time": "0:32:51", "throughput": 9205.16, "total_tokens": 152453120} +{"current_steps": 18620, "total_steps": 20825, "loss": 0.9141, "learning_rate": 1.5106969722669812e-06, "epoch": 0.8941176470588236, "percentage": 89.41, "elapsed_time": "4:36:47", "remaining_time": "0:32:46", "throughput": 9184.95, "total_tokens": 152535040} +{"current_steps": 18630, "total_steps": 20825, "loss": 1.1308, "learning_rate": 1.4971637027523106e-06, "epoch": 0.8945978391356543, "percentage": 89.46, "elapsed_time": "4:37:32", "remaining_time": "0:32:41", "throughput": 9164.99, "total_tokens": 152616960} +{"current_steps": 18640, "total_steps": 20825, "loss": 0.9492, "learning_rate": 1.4836894524675126e-06, "epoch": 0.895078031212485, "percentage": 89.51, "elapsed_time": "4:38:17", "remaining_time": "0:32:37", "throughput": 9145.18, "total_tokens": 152698880} +{"current_steps": 18650, "total_steps": 20825, "loss": 1.1131, "learning_rate": 1.4702742552484884e-06, "epoch": 0.8955582232893158, "percentage": 89.56, "elapsed_time": "4:39:02", "remaining_time": "0:32:32", "throughput": 9125.16, "total_tokens": 152780800} +{"current_steps": 18660, "total_steps": 20825, "loss": 0.8355, "learning_rate": 1.4569181447828623e-06, "epoch": 0.8960384153661465, "percentage": 89.6, "elapsed_time": "4:39:48", "remaining_time": "0:32:27", "throughput": 9105.44, "total_tokens": 152862720} +{"current_steps": 18670, "total_steps": 20825, "loss": 1.055, "learning_rate": 1.4436211546098782e-06, "epoch": 0.8965186074429772, "percentage": 89.65, "elapsed_time": "4:40:33", "remaining_time": "0:32:23", "throughput": 9085.72, "total_tokens": 152944640} +{"current_steps": 18680, "total_steps": 20825, "loss": 0.9159, "learning_rate": 1.430383318120318e-06, "epoch": 0.8969987995198079, "percentage": 89.7, "elapsed_time": "4:41:18", "remaining_time": "0:32:18", "throughput": 9066.29, "total_tokens": 153026560} +{"current_steps": 18690, "total_steps": 20825, "loss": 0.8634, "learning_rate": 1.4172046685564212e-06, "epoch": 0.8974789915966387, "percentage": 89.75, "elapsed_time": "4:42:03", "remaining_time": "0:32:13", "throughput": 9047.01, "total_tokens": 153108480} +{"current_steps": 18700, "total_steps": 20825, "loss": 0.9027, "learning_rate": 1.4040852390118042e-06, "epoch": 0.8979591836734694, "percentage": 89.8, "elapsed_time": "4:42:48", "remaining_time": "0:32:08", "throughput": 9027.73, "total_tokens": 153190400} +{"current_steps": 18710, "total_steps": 20825, "loss": 1.0014, "learning_rate": 1.3910250624313642e-06, "epoch": 0.8984393757503001, "percentage": 89.84, "elapsed_time": "4:43:34", "remaining_time": "0:32:03", "throughput": 9008.37, "total_tokens": 153272320} +{"current_steps": 18720, "total_steps": 20825, "loss": 0.8953, "learning_rate": 1.3780241716112057e-06, "epoch": 0.8989195678271309, "percentage": 89.89, "elapsed_time": "4:44:19", "remaining_time": "0:31:58", "throughput": 8989.29, "total_tokens": 153354240} +{"current_steps": 18730, "total_steps": 20825, "loss": 0.8398, "learning_rate": 1.3650825991985722e-06, "epoch": 0.8993997599039616, "percentage": 89.94, "elapsed_time": "4:45:05", "remaining_time": "0:31:53", "throughput": 8970.18, "total_tokens": 153436160} +{"current_steps": 18740, "total_steps": 20825, "loss": 0.7956, "learning_rate": 1.3522003776917285e-06, "epoch": 0.8998799519807923, "percentage": 89.99, "elapsed_time": "4:45:50", "remaining_time": "0:31:48", "throughput": 8951.43, "total_tokens": 153518080} +{"current_steps": 18750, "total_steps": 20825, "loss": 0.8044, "learning_rate": 1.3393775394399123e-06, "epoch": 0.9003601440576231, "percentage": 90.04, "elapsed_time": "4:46:35", "remaining_time": "0:31:42", "throughput": 8932.73, "total_tokens": 153600000} +{"current_steps": 18760, "total_steps": 20825, "loss": 0.7121, "learning_rate": 1.326614116643246e-06, "epoch": 0.9008403361344538, "percentage": 90.08, "elapsed_time": "4:47:20", "remaining_time": "0:31:37", "throughput": 8914.13, "total_tokens": 153681920} +{"current_steps": 18770, "total_steps": 20825, "loss": 0.8775, "learning_rate": 1.3139101413526339e-06, "epoch": 0.9013205282112845, "percentage": 90.13, "elapsed_time": "4:48:05", "remaining_time": "0:31:32", "throughput": 8895.61, "total_tokens": 153763840} +{"current_steps": 18780, "total_steps": 20825, "loss": 1.0345, "learning_rate": 1.3012656454697125e-06, "epoch": 0.9018007202881152, "percentage": 90.18, "elapsed_time": "4:48:50", "remaining_time": "0:31:27", "throughput": 8877.0, "total_tokens": 153845760} +{"current_steps": 18790, "total_steps": 20825, "loss": 0.9592, "learning_rate": 1.2886806607467578e-06, "epoch": 0.902280912364946, "percentage": 90.23, "elapsed_time": "4:49:35", "remaining_time": "0:31:21", "throughput": 8858.68, "total_tokens": 153927680} +{"current_steps": 18800, "total_steps": 20825, "loss": 0.927, "learning_rate": 1.2761552187865899e-06, "epoch": 0.9027611044417767, "percentage": 90.28, "elapsed_time": "4:50:21", "remaining_time": "0:31:16", "throughput": 8840.46, "total_tokens": 154009600} +{"current_steps": 18810, "total_steps": 20825, "loss": 0.8942, "learning_rate": 1.2636893510425186e-06, "epoch": 0.9032412965186074, "percentage": 90.32, "elapsed_time": "4:51:05", "remaining_time": "0:31:11", "throughput": 8822.39, "total_tokens": 154091520} +{"current_steps": 18820, "total_steps": 20825, "loss": 0.97, "learning_rate": 1.2512830888182531e-06, "epoch": 0.9037214885954382, "percentage": 90.37, "elapsed_time": "4:51:51", "remaining_time": "0:31:05", "throughput": 8804.15, "total_tokens": 154173440} +{"current_steps": 18830, "total_steps": 20825, "loss": 0.9964, "learning_rate": 1.23893646326782e-06, "epoch": 0.9042016806722689, "percentage": 90.42, "elapsed_time": "4:52:36", "remaining_time": "0:31:00", "throughput": 8786.07, "total_tokens": 154255360} +{"current_steps": 18840, "total_steps": 20825, "loss": 0.7055, "learning_rate": 1.2266495053954913e-06, "epoch": 0.9046818727490996, "percentage": 90.47, "elapsed_time": "4:53:22", "remaining_time": "0:30:54", "throughput": 8768.07, "total_tokens": 154337280} +{"current_steps": 18850, "total_steps": 20825, "loss": 0.8709, "learning_rate": 1.2144222460557074e-06, "epoch": 0.9051620648259304, "percentage": 90.52, "elapsed_time": "4:54:07", "remaining_time": "0:30:48", "throughput": 8750.32, "total_tokens": 154419200} +{"current_steps": 18860, "total_steps": 20825, "loss": 1.0051, "learning_rate": 1.2022547159529911e-06, "epoch": 0.9056422569027611, "percentage": 90.56, "elapsed_time": "4:54:52", "remaining_time": "0:30:43", "throughput": 8732.63, "total_tokens": 154501120} +{"current_steps": 18870, "total_steps": 20825, "loss": 0.8824, "learning_rate": 1.190146945641879e-06, "epoch": 0.9061224489795918, "percentage": 90.61, "elapsed_time": "4:55:37", "remaining_time": "0:30:37", "throughput": 8715.06, "total_tokens": 154583040} +{"current_steps": 18880, "total_steps": 20825, "loss": 0.997, "learning_rate": 1.1780989655268415e-06, "epoch": 0.9066026410564225, "percentage": 90.66, "elapsed_time": "4:56:22", "remaining_time": "0:30:31", "throughput": 8697.53, "total_tokens": 154664960} +{"current_steps": 18890, "total_steps": 20825, "loss": 0.824, "learning_rate": 1.1661108058622082e-06, "epoch": 0.9070828331332533, "percentage": 90.71, "elapsed_time": "4:57:08", "remaining_time": "0:30:26", "throughput": 8679.99, "total_tokens": 154746880} +{"current_steps": 18900, "total_steps": 20825, "loss": 0.7726, "learning_rate": 1.154182496752082e-06, "epoch": 0.907563025210084, "percentage": 90.76, "elapsed_time": "4:57:53", "remaining_time": "0:30:20", "throughput": 8662.6, "total_tokens": 154828800} +{"current_steps": 18910, "total_steps": 20825, "loss": 1.003, "learning_rate": 1.142314068150288e-06, "epoch": 0.9080432172869147, "percentage": 90.8, "elapsed_time": "4:58:38", "remaining_time": "0:30:14", "throughput": 8645.29, "total_tokens": 154910720} +{"current_steps": 18920, "total_steps": 20825, "loss": 0.8584, "learning_rate": 1.1305055498602584e-06, "epoch": 0.9085234093637455, "percentage": 90.85, "elapsed_time": "4:59:23", "remaining_time": "0:30:08", "throughput": 8628.11, "total_tokens": 154992640} +{"current_steps": 18930, "total_steps": 20825, "loss": 0.8205, "learning_rate": 1.1187569715350066e-06, "epoch": 0.9090036014405762, "percentage": 90.9, "elapsed_time": "5:00:09", "remaining_time": "0:30:02", "throughput": 8610.9, "total_tokens": 155074560} +{"current_steps": 18940, "total_steps": 20825, "loss": 0.7995, "learning_rate": 1.1070683626770162e-06, "epoch": 0.9094837935174069, "percentage": 90.95, "elapsed_time": "5:00:54", "remaining_time": "0:29:56", "throughput": 8593.94, "total_tokens": 155156480} +{"current_steps": 18950, "total_steps": 20825, "loss": 0.8801, "learning_rate": 1.0954397526381694e-06, "epoch": 0.9099639855942377, "percentage": 91.0, "elapsed_time": "5:01:39", "remaining_time": "0:29:50", "throughput": 8577.06, "total_tokens": 155238400} +{"current_steps": 18960, "total_steps": 20825, "loss": 0.9004, "learning_rate": 1.0838711706196992e-06, "epoch": 0.9104441776710684, "percentage": 91.04, "elapsed_time": "5:02:24", "remaining_time": "0:29:44", "throughput": 8560.19, "total_tokens": 155320320} +{"current_steps": 18970, "total_steps": 20825, "loss": 0.9954, "learning_rate": 1.0723626456720925e-06, "epoch": 0.9109243697478991, "percentage": 91.09, "elapsed_time": "5:03:10", "remaining_time": "0:29:38", "throughput": 8543.26, "total_tokens": 155402240} +{"current_steps": 18980, "total_steps": 20825, "loss": 1.032, "learning_rate": 1.0609142066950157e-06, "epoch": 0.9114045618247298, "percentage": 91.14, "elapsed_time": "5:03:55", "remaining_time": "0:29:32", "throughput": 8526.43, "total_tokens": 155484160} +{"current_steps": 18990, "total_steps": 20825, "loss": 0.8363, "learning_rate": 1.0495258824372578e-06, "epoch": 0.9118847539015607, "percentage": 91.19, "elapsed_time": "5:04:41", "remaining_time": "0:29:26", "throughput": 8509.66, "total_tokens": 155566080} +{"current_steps": 19000, "total_steps": 20825, "loss": 0.7728, "learning_rate": 1.0381977014966543e-06, "epoch": 0.9123649459783914, "percentage": 91.24, "elapsed_time": "5:05:26", "remaining_time": "0:29:20", "throughput": 8492.94, "total_tokens": 155648000} +{"current_steps": 19010, "total_steps": 20825, "loss": 1.018, "learning_rate": 1.0269296923199972e-06, "epoch": 0.912845138055222, "percentage": 91.28, "elapsed_time": "5:06:15", "remaining_time": "0:29:14", "throughput": 8474.68, "total_tokens": 155729920} +{"current_steps": 19020, "total_steps": 20825, "loss": 1.0119, "learning_rate": 1.0157218832029969e-06, "epoch": 0.9133253301320529, "percentage": 91.33, "elapsed_time": "5:07:01", "remaining_time": "0:29:08", "throughput": 8458.33, "total_tokens": 155811840} +{"current_steps": 19030, "total_steps": 20825, "loss": 1.0094, "learning_rate": 1.0045743022901787e-06, "epoch": 0.9138055222088836, "percentage": 91.38, "elapsed_time": "5:07:46", "remaining_time": "0:29:01", "throughput": 8442.1, "total_tokens": 155893760} +{"current_steps": 19040, "total_steps": 20825, "loss": 0.7286, "learning_rate": 9.934869775748258e-07, "epoch": 0.9142857142857143, "percentage": 91.43, "elapsed_time": "5:08:31", "remaining_time": "0:28:55", "throughput": 8425.93, "total_tokens": 155975680} +{"current_steps": 19050, "total_steps": 20825, "loss": 0.8924, "learning_rate": 9.824599368989163e-07, "epoch": 0.9147659063625451, "percentage": 91.48, "elapsed_time": "5:09:16", "remaining_time": "0:28:49", "throughput": 8409.93, "total_tokens": 156057600} +{"current_steps": 19060, "total_steps": 20825, "loss": 0.814, "learning_rate": 9.714932079530476e-07, "epoch": 0.9152460984393758, "percentage": 91.52, "elapsed_time": "5:10:01", "remaining_time": "0:28:42", "throughput": 8393.79, "total_tokens": 156139520} +{"current_steps": 19070, "total_steps": 20825, "loss": 0.7436, "learning_rate": 9.60586818276349e-07, "epoch": 0.9157262905162065, "percentage": 91.57, "elapsed_time": "5:10:47", "remaining_time": "0:28:36", "throughput": 8377.75, "total_tokens": 156221440} +{"current_steps": 19080, "total_steps": 20825, "loss": 0.7512, "learning_rate": 9.497407952564485e-07, "epoch": 0.9162064825930372, "percentage": 91.62, "elapsed_time": "5:11:32", "remaining_time": "0:28:29", "throughput": 8361.7, "total_tokens": 156303360} +{"current_steps": 19090, "total_steps": 20825, "loss": 0.9225, "learning_rate": 9.389551661293683e-07, "epoch": 0.916686674669868, "percentage": 91.67, "elapsed_time": "5:12:18", "remaining_time": "0:28:23", "throughput": 8345.67, "total_tokens": 156385280} +{"current_steps": 19100, "total_steps": 20825, "loss": 0.8426, "learning_rate": 9.282299579794789e-07, "epoch": 0.9171668667466987, "percentage": 91.72, "elapsed_time": "5:13:03", "remaining_time": "0:28:16", "throughput": 8329.97, "total_tokens": 156467200} +{"current_steps": 19110, "total_steps": 20825, "loss": 0.867, "learning_rate": 9.175651977394284e-07, "epoch": 0.9176470588235294, "percentage": 91.76, "elapsed_time": "5:13:48", "remaining_time": "0:28:09", "throughput": 8314.31, "total_tokens": 156549120} +{"current_steps": 19120, "total_steps": 20825, "loss": 0.8332, "learning_rate": 9.069609121900663e-07, "epoch": 0.9181272509003602, "percentage": 91.81, "elapsed_time": "5:14:34", "remaining_time": "0:28:03", "throughput": 8298.7, "total_tokens": 156631040} +{"current_steps": 19130, "total_steps": 20825, "loss": 0.7689, "learning_rate": 8.964171279603778e-07, "epoch": 0.9186074429771909, "percentage": 91.86, "elapsed_time": "5:15:19", "remaining_time": "0:27:56", "throughput": 8283.24, "total_tokens": 156712960} +{"current_steps": 19140, "total_steps": 20825, "loss": 0.7697, "learning_rate": 8.859338715274279e-07, "epoch": 0.9190876350540216, "percentage": 91.91, "elapsed_time": "5:16:04", "remaining_time": "0:27:49", "throughput": 8267.89, "total_tokens": 156794880} +{"current_steps": 19150, "total_steps": 20825, "loss": 0.9131, "learning_rate": 8.755111692162837e-07, "epoch": 0.9195678271308524, "percentage": 91.96, "elapsed_time": "5:16:50", "remaining_time": "0:27:42", "throughput": 8252.2, "total_tokens": 156876800} +{"current_steps": 19160, "total_steps": 20825, "loss": 0.9745, "learning_rate": 8.651490471999424e-07, "epoch": 0.9200480192076831, "percentage": 92.0, "elapsed_time": "5:17:35", "remaining_time": "0:27:35", "throughput": 8236.77, "total_tokens": 156958720} +{"current_steps": 19170, "total_steps": 20825, "loss": 0.9774, "learning_rate": 8.548475314992949e-07, "epoch": 0.9205282112845138, "percentage": 92.05, "elapsed_time": "5:18:21", "remaining_time": "0:27:29", "throughput": 8221.27, "total_tokens": 157040640} +{"current_steps": 19180, "total_steps": 20825, "loss": 0.9048, "learning_rate": 8.446066479830206e-07, "epoch": 0.9210084033613445, "percentage": 92.1, "elapsed_time": "5:19:06", "remaining_time": "0:27:22", "throughput": 8206.14, "total_tokens": 157122560} +{"current_steps": 19190, "total_steps": 20825, "loss": 0.8926, "learning_rate": 8.344264223675485e-07, "epoch": 0.9214885954381753, "percentage": 92.15, "elapsed_time": "5:19:52", "remaining_time": "0:27:15", "throughput": 8191.04, "total_tokens": 157204480} +{"current_steps": 19200, "total_steps": 20825, "loss": 0.8408, "learning_rate": 8.243068802169906e-07, "epoch": 0.921968787515006, "percentage": 92.2, "elapsed_time": "5:20:37", "remaining_time": "0:27:08", "throughput": 8176.04, "total_tokens": 157286400} +{"current_steps": 19210, "total_steps": 20825, "loss": 0.9799, "learning_rate": 8.14248046943078e-07, "epoch": 0.9224489795918367, "percentage": 92.24, "elapsed_time": "5:21:22", "remaining_time": "0:27:01", "throughput": 8161.18, "total_tokens": 157368320} +{"current_steps": 19220, "total_steps": 20825, "loss": 0.7224, "learning_rate": 8.042499478050719e-07, "epoch": 0.9229291716686675, "percentage": 92.29, "elapsed_time": "5:22:07", "remaining_time": "0:26:54", "throughput": 8146.29, "total_tokens": 157450240} +{"current_steps": 19230, "total_steps": 20825, "loss": 0.8495, "learning_rate": 7.943126079097418e-07, "epoch": 0.9234093637454982, "percentage": 92.34, "elapsed_time": "5:22:52", "remaining_time": "0:26:46", "throughput": 8131.57, "total_tokens": 157532160} +{"current_steps": 19240, "total_steps": 20825, "loss": 0.9701, "learning_rate": 7.844360522112737e-07, "epoch": 0.9238895558223289, "percentage": 92.39, "elapsed_time": "5:23:37", "remaining_time": "0:26:39", "throughput": 8116.93, "total_tokens": 157614080} +{"current_steps": 19250, "total_steps": 20825, "loss": 0.8682, "learning_rate": 7.746203055112145e-07, "epoch": 0.9243697478991597, "percentage": 92.44, "elapsed_time": "5:24:23", "remaining_time": "0:26:32", "throughput": 8102.33, "total_tokens": 157696000} +{"current_steps": 19260, "total_steps": 20825, "loss": 0.9395, "learning_rate": 7.648653924584137e-07, "epoch": 0.9248499399759904, "percentage": 92.48, "elapsed_time": "5:25:08", "remaining_time": "0:26:25", "throughput": 8087.78, "total_tokens": 157777920} +{"current_steps": 19270, "total_steps": 20825, "loss": 0.84, "learning_rate": 7.55171337548946e-07, "epoch": 0.9253301320528211, "percentage": 92.53, "elapsed_time": "5:25:53", "remaining_time": "0:26:17", "throughput": 8073.31, "total_tokens": 157859840} +{"current_steps": 19280, "total_steps": 20825, "loss": 0.7814, "learning_rate": 7.455381651260807e-07, "epoch": 0.9258103241296518, "percentage": 92.58, "elapsed_time": "5:26:38", "remaining_time": "0:26:10", "throughput": 8058.9, "total_tokens": 157941760} +{"current_steps": 19290, "total_steps": 20825, "loss": 0.9542, "learning_rate": 7.359658993801894e-07, "epoch": 0.9262905162064826, "percentage": 92.63, "elapsed_time": "5:27:23", "remaining_time": "0:26:03", "throughput": 8044.59, "total_tokens": 158023680} +{"current_steps": 19300, "total_steps": 20825, "loss": 0.9109, "learning_rate": 7.264545643486997e-07, "epoch": 0.9267707082833133, "percentage": 92.68, "elapsed_time": "5:28:08", "remaining_time": "0:25:55", "throughput": 8030.3, "total_tokens": 158105600} +{"current_steps": 19310, "total_steps": 20825, "loss": 0.9783, "learning_rate": 7.170041839160368e-07, "epoch": 0.927250900360144, "percentage": 92.73, "elapsed_time": "5:28:53", "remaining_time": "0:25:48", "throughput": 8016.16, "total_tokens": 158187520} +{"current_steps": 19320, "total_steps": 20825, "loss": 0.8147, "learning_rate": 7.076147818135537e-07, "epoch": 0.9277310924369748, "percentage": 92.77, "elapsed_time": "5:29:38", "remaining_time": "0:25:40", "throughput": 8002.04, "total_tokens": 158269440} +{"current_steps": 19330, "total_steps": 20825, "loss": 0.7043, "learning_rate": 6.982863816194812e-07, "epoch": 0.9282112845138055, "percentage": 92.82, "elapsed_time": "5:30:23", "remaining_time": "0:25:33", "throughput": 7987.87, "total_tokens": 158351360} +{"current_steps": 19340, "total_steps": 20825, "loss": 0.8402, "learning_rate": 6.890190067588648e-07, "epoch": 0.9286914765906362, "percentage": 92.87, "elapsed_time": "5:31:09", "remaining_time": "0:25:25", "throughput": 7973.87, "total_tokens": 158433280} +{"current_steps": 19350, "total_steps": 20825, "loss": 0.9634, "learning_rate": 6.798126805035082e-07, "epoch": 0.929171668667467, "percentage": 92.92, "elapsed_time": "5:31:54", "remaining_time": "0:25:18", "throughput": 7959.92, "total_tokens": 158515200} +{"current_steps": 19360, "total_steps": 20825, "loss": 0.9554, "learning_rate": 6.706674259719048e-07, "epoch": 0.9296518607442977, "percentage": 92.97, "elapsed_time": "5:32:39", "remaining_time": "0:25:10", "throughput": 7945.85, "total_tokens": 158597120} +{"current_steps": 19370, "total_steps": 20825, "loss": 0.8942, "learning_rate": 6.615832661291954e-07, "epoch": 0.9301320528211284, "percentage": 93.01, "elapsed_time": "5:33:24", "remaining_time": "0:25:02", "throughput": 7932.09, "total_tokens": 158679040} +{"current_steps": 19380, "total_steps": 20825, "loss": 0.7503, "learning_rate": 6.525602237870993e-07, "epoch": 0.9306122448979591, "percentage": 93.06, "elapsed_time": "5:34:09", "remaining_time": "0:24:54", "throughput": 7918.31, "total_tokens": 158760960} +{"current_steps": 19390, "total_steps": 20825, "loss": 0.6928, "learning_rate": 6.435983216038583e-07, "epoch": 0.9310924369747899, "percentage": 93.11, "elapsed_time": "5:34:55", "remaining_time": "0:24:47", "throughput": 7904.53, "total_tokens": 158842880} +{"current_steps": 19400, "total_steps": 20825, "loss": 0.8504, "learning_rate": 6.346975820841927e-07, "epoch": 0.9315726290516206, "percentage": 93.16, "elapsed_time": "5:35:40", "remaining_time": "0:24:39", "throughput": 7890.91, "total_tokens": 158924800} +{"current_steps": 19410, "total_steps": 20825, "loss": 0.9175, "learning_rate": 6.258580275792153e-07, "epoch": 0.9320528211284513, "percentage": 93.21, "elapsed_time": "5:36:25", "remaining_time": "0:24:31", "throughput": 7877.35, "total_tokens": 159006720} +{"current_steps": 19420, "total_steps": 20825, "loss": 0.7601, "learning_rate": 6.170796802864115e-07, "epoch": 0.9325330132052821, "percentage": 93.25, "elapsed_time": "5:37:10", "remaining_time": "0:24:23", "throughput": 7863.86, "total_tokens": 159088640} +{"current_steps": 19430, "total_steps": 20825, "loss": 0.8923, "learning_rate": 6.083625622495565e-07, "epoch": 0.9330132052821128, "percentage": 93.3, "elapsed_time": "5:37:55", "remaining_time": "0:24:15", "throughput": 7850.42, "total_tokens": 159170560} +{"current_steps": 19440, "total_steps": 20825, "loss": 0.8514, "learning_rate": 5.997066953586761e-07, "epoch": 0.9334933973589435, "percentage": 93.35, "elapsed_time": "5:38:40", "remaining_time": "0:24:07", "throughput": 7836.97, "total_tokens": 159252480} +{"current_steps": 19450, "total_steps": 20825, "loss": 0.8006, "learning_rate": 5.911121013499721e-07, "epoch": 0.9339735894357744, "percentage": 93.4, "elapsed_time": "5:39:25", "remaining_time": "0:23:59", "throughput": 7823.64, "total_tokens": 159334400} +{"current_steps": 19460, "total_steps": 20825, "loss": 0.8361, "learning_rate": 5.825788018057971e-07, "epoch": 0.934453781512605, "percentage": 93.45, "elapsed_time": "5:40:10", "remaining_time": "0:23:51", "throughput": 7810.33, "total_tokens": 159416320} +{"current_steps": 19470, "total_steps": 20825, "loss": 1.0557, "learning_rate": 5.741068181545684e-07, "epoch": 0.9349339735894358, "percentage": 93.49, "elapsed_time": "5:40:56", "remaining_time": "0:23:43", "throughput": 7797.12, "total_tokens": 159498240} +{"current_steps": 19480, "total_steps": 20825, "loss": 1.1845, "learning_rate": 5.656961716707459e-07, "epoch": 0.9354141656662666, "percentage": 93.54, "elapsed_time": "5:41:41", "remaining_time": "0:23:35", "throughput": 7783.87, "total_tokens": 159580160} +{"current_steps": 19490, "total_steps": 20825, "loss": 0.818, "learning_rate": 5.57346883474752e-07, "epoch": 0.9358943577430973, "percentage": 93.59, "elapsed_time": "5:42:26", "remaining_time": "0:23:27", "throughput": 7770.78, "total_tokens": 159662080} +{"current_steps": 19500, "total_steps": 20825, "loss": 0.9216, "learning_rate": 5.490589745329261e-07, "epoch": 0.936374549819928, "percentage": 93.64, "elapsed_time": "5:43:11", "remaining_time": "0:23:19", "throughput": 7757.67, "total_tokens": 159744000} +{"current_steps": 19510, "total_steps": 20825, "loss": 1.0933, "learning_rate": 5.408324656574842e-07, "epoch": 0.9368547418967587, "percentage": 93.69, "elapsed_time": "5:43:56", "remaining_time": "0:23:10", "throughput": 7744.68, "total_tokens": 159825920} +{"current_steps": 19520, "total_steps": 20825, "loss": 0.9709, "learning_rate": 5.326673775064545e-07, "epoch": 0.9373349339735895, "percentage": 93.73, "elapsed_time": "5:44:42", "remaining_time": "0:23:02", "throughput": 7731.6, "total_tokens": 159907840} +{"current_steps": 19530, "total_steps": 20825, "loss": 0.8722, "learning_rate": 5.245637305836243e-07, "epoch": 0.9378151260504202, "percentage": 93.78, "elapsed_time": "5:45:27", "remaining_time": "0:22:54", "throughput": 7718.74, "total_tokens": 159989760} +{"current_steps": 19540, "total_steps": 20825, "loss": 0.8854, "learning_rate": 5.165215452384936e-07, "epoch": 0.9382953181272509, "percentage": 93.83, "elapsed_time": "5:46:12", "remaining_time": "0:22:46", "throughput": 7705.88, "total_tokens": 160071680} +{"current_steps": 19550, "total_steps": 20825, "loss": 0.8518, "learning_rate": 5.085408416662274e-07, "epoch": 0.9387755102040817, "percentage": 93.88, "elapsed_time": "5:46:57", "remaining_time": "0:22:37", "throughput": 7693.05, "total_tokens": 160153600} +{"current_steps": 19560, "total_steps": 20825, "loss": 0.9801, "learning_rate": 5.006216399075947e-07, "epoch": 0.9392557022809124, "percentage": 93.93, "elapsed_time": "5:47:43", "remaining_time": "0:22:29", "throughput": 7680.23, "total_tokens": 160235520} +{"current_steps": 19570, "total_steps": 20825, "loss": 0.8329, "learning_rate": 4.92763959848927e-07, "epoch": 0.9397358943577431, "percentage": 93.97, "elapsed_time": "5:48:28", "remaining_time": "0:22:20", "throughput": 7667.64, "total_tokens": 160317440} +{"current_steps": 19580, "total_steps": 20825, "loss": 0.9552, "learning_rate": 4.849678212220682e-07, "epoch": 0.9402160864345739, "percentage": 94.02, "elapsed_time": "5:49:13", "remaining_time": "0:22:12", "throughput": 7654.96, "total_tokens": 160399360} +{"current_steps": 19590, "total_steps": 20825, "loss": 0.7305, "learning_rate": 4.772332436043165e-07, "epoch": 0.9406962785114046, "percentage": 94.07, "elapsed_time": "5:49:59", "remaining_time": "0:22:03", "throughput": 7642.24, "total_tokens": 160481280} +{"current_steps": 19600, "total_steps": 20825, "loss": 0.9516, "learning_rate": 4.6956024641838237e-07, "epoch": 0.9411764705882353, "percentage": 94.12, "elapsed_time": "5:50:44", "remaining_time": "0:21:55", "throughput": 7629.72, "total_tokens": 160563200} +{"current_steps": 19610, "total_steps": 20825, "loss": 0.9362, "learning_rate": 4.619488489323448e-07, "epoch": 0.941656662665066, "percentage": 94.17, "elapsed_time": "5:51:29", "remaining_time": "0:21:46", "throughput": 7617.3, "total_tokens": 160645120} +{"current_steps": 19620, "total_steps": 20825, "loss": 1.006, "learning_rate": 4.5439907025958405e-07, "epoch": 0.9421368547418968, "percentage": 94.21, "elapsed_time": "5:52:14", "remaining_time": "0:21:38", "throughput": 7604.88, "total_tokens": 160727040} +{"current_steps": 19630, "total_steps": 20825, "loss": 0.9851, "learning_rate": 4.4691092935876256e-07, "epoch": 0.9426170468187275, "percentage": 94.26, "elapsed_time": "5:52:59", "remaining_time": "0:21:29", "throughput": 7592.55, "total_tokens": 160808960} +{"current_steps": 19640, "total_steps": 20825, "loss": 1.1214, "learning_rate": 4.394844450337443e-07, "epoch": 0.9430972388955582, "percentage": 94.31, "elapsed_time": "5:53:45", "remaining_time": "0:21:20", "throughput": 7580.24, "total_tokens": 160890880} +{"current_steps": 19650, "total_steps": 20825, "loss": 1.0098, "learning_rate": 4.3211963593357275e-07, "epoch": 0.943577430972389, "percentage": 94.36, "elapsed_time": "5:54:30", "remaining_time": "0:21:11", "throughput": 7568.02, "total_tokens": 160972800} +{"current_steps": 19660, "total_steps": 20825, "loss": 0.8139, "learning_rate": 4.248165205524152e-07, "epoch": 0.9440576230492197, "percentage": 94.41, "elapsed_time": "5:55:15", "remaining_time": "0:21:03", "throughput": 7555.78, "total_tokens": 161054720} +{"current_steps": 19670, "total_steps": 20825, "loss": 0.9041, "learning_rate": 4.175751172295156e-07, "epoch": 0.9445378151260504, "percentage": 94.45, "elapsed_time": "5:56:00", "remaining_time": "0:20:54", "throughput": 7543.63, "total_tokens": 161136640} +{"current_steps": 19680, "total_steps": 20825, "loss": 0.8617, "learning_rate": 4.1039544414914753e-07, "epoch": 0.9450180072028812, "percentage": 94.5, "elapsed_time": "5:56:45", "remaining_time": "0:20:45", "throughput": 7531.58, "total_tokens": 161218560} +{"current_steps": 19690, "total_steps": 20825, "loss": 0.8918, "learning_rate": 4.032775193405752e-07, "epoch": 0.9454981992797119, "percentage": 94.55, "elapsed_time": "5:57:30", "remaining_time": "0:20:36", "throughput": 7519.58, "total_tokens": 161300480} +{"current_steps": 19700, "total_steps": 20825, "loss": 0.8151, "learning_rate": 3.96221360677998e-07, "epoch": 0.9459783913565426, "percentage": 94.6, "elapsed_time": "5:58:15", "remaining_time": "0:20:27", "throughput": 7507.59, "total_tokens": 161382400} +{"current_steps": 19710, "total_steps": 20825, "loss": 0.9074, "learning_rate": 3.892269858805142e-07, "epoch": 0.9464585834333733, "percentage": 94.65, "elapsed_time": "5:59:01", "remaining_time": "0:20:18", "throughput": 7495.67, "total_tokens": 161464320} +{"current_steps": 19720, "total_steps": 20825, "loss": 0.8005, "learning_rate": 3.82294412512077e-07, "epoch": 0.9469387755102041, "percentage": 94.69, "elapsed_time": "5:59:46", "remaining_time": "0:20:09", "throughput": 7483.82, "total_tokens": 161546240} +{"current_steps": 19730, "total_steps": 20825, "loss": 0.8381, "learning_rate": 3.7542365798143573e-07, "epoch": 0.9474189675870348, "percentage": 94.74, "elapsed_time": "6:00:31", "remaining_time": "0:20:00", "throughput": 7472.04, "total_tokens": 161628160} +{"current_steps": 19740, "total_steps": 20825, "loss": 1.0417, "learning_rate": 3.6861473954210855e-07, "epoch": 0.9478991596638655, "percentage": 94.79, "elapsed_time": "6:01:16", "remaining_time": "0:19:51", "throughput": 7460.26, "total_tokens": 161710080} +{"current_steps": 19750, "total_steps": 20825, "loss": 0.7395, "learning_rate": 3.6186767429234323e-07, "epoch": 0.9483793517406963, "percentage": 94.84, "elapsed_time": "6:02:01", "remaining_time": "0:19:42", "throughput": 7448.51, "total_tokens": 161792000} +{"current_steps": 19760, "total_steps": 20825, "loss": 0.8611, "learning_rate": 3.5518247917505077e-07, "epoch": 0.948859543817527, "percentage": 94.89, "elapsed_time": "6:02:46", "remaining_time": "0:19:33", "throughput": 7436.81, "total_tokens": 161873920} +{"current_steps": 19770, "total_steps": 20825, "loss": 1.0409, "learning_rate": 3.485591709777802e-07, "epoch": 0.9493397358943577, "percentage": 94.93, "elapsed_time": "6:03:31", "remaining_time": "0:19:23", "throughput": 7425.21, "total_tokens": 161955840} +{"current_steps": 19780, "total_steps": 20825, "loss": 0.8133, "learning_rate": 3.419977663326801e-07, "epoch": 0.9498199279711885, "percentage": 94.98, "elapsed_time": "6:04:16", "remaining_time": "0:19:14", "throughput": 7413.59, "total_tokens": 162037760} +{"current_steps": 19790, "total_steps": 20825, "loss": 1.2694, "learning_rate": 3.3549828171644537e-07, "epoch": 0.9503001200480192, "percentage": 95.03, "elapsed_time": "6:05:01", "remaining_time": "0:19:05", "throughput": 7402.06, "total_tokens": 162119680} +{"current_steps": 19800, "total_steps": 20825, "loss": 0.8892, "learning_rate": 3.29060733450276e-07, "epoch": 0.9507803121248499, "percentage": 95.08, "elapsed_time": "6:05:47", "remaining_time": "0:18:56", "throughput": 7390.58, "total_tokens": 162201600} +{"current_steps": 19810, "total_steps": 20825, "loss": 1.028, "learning_rate": 3.2268513769984634e-07, "epoch": 0.9512605042016806, "percentage": 95.13, "elapsed_time": "6:06:32", "remaining_time": "0:18:46", "throughput": 7379.12, "total_tokens": 162283520} +{"current_steps": 19820, "total_steps": 20825, "loss": 0.9548, "learning_rate": 3.163715104752524e-07, "epoch": 0.9517406962785114, "percentage": 95.17, "elapsed_time": "6:07:17", "remaining_time": "0:18:37", "throughput": 7367.61, "total_tokens": 162365440} +{"current_steps": 19830, "total_steps": 20825, "loss": 0.9059, "learning_rate": 3.101198676309841e-07, "epoch": 0.9522208883553421, "percentage": 95.22, "elapsed_time": "6:08:03", "remaining_time": "0:18:28", "throughput": 7356.14, "total_tokens": 162447360} +{"current_steps": 19840, "total_steps": 20825, "loss": 0.9254, "learning_rate": 3.039302248658754e-07, "epoch": 0.9527010804321728, "percentage": 95.27, "elapsed_time": "6:08:48", "remaining_time": "0:18:18", "throughput": 7344.85, "total_tokens": 162529280} +{"current_steps": 19850, "total_steps": 20825, "loss": 1.0085, "learning_rate": 2.978025977230736e-07, "epoch": 0.9531812725090036, "percentage": 95.32, "elapsed_time": "6:09:33", "remaining_time": "0:18:09", "throughput": 7333.53, "total_tokens": 162611200} +{"current_steps": 19860, "total_steps": 20825, "loss": 0.9163, "learning_rate": 2.91737001589984e-07, "epoch": 0.9536614645858343, "percentage": 95.37, "elapsed_time": "6:10:19", "remaining_time": "0:17:59", "throughput": 7322.23, "total_tokens": 162693120} +{"current_steps": 19870, "total_steps": 20825, "loss": 0.9455, "learning_rate": 2.8573345169825296e-07, "epoch": 0.954141656662665, "percentage": 95.41, "elapsed_time": "6:11:04", "remaining_time": "0:17:50", "throughput": 7310.96, "total_tokens": 162775040} +{"current_steps": 19880, "total_steps": 20825, "loss": 0.774, "learning_rate": 2.797919631237156e-07, "epoch": 0.9546218487394958, "percentage": 95.46, "elapsed_time": "6:11:50", "remaining_time": "0:17:40", "throughput": 7299.66, "total_tokens": 162856960} +{"current_steps": 19890, "total_steps": 20825, "loss": 0.935, "learning_rate": 2.739125507863649e-07, "epoch": 0.9551020408163265, "percentage": 95.51, "elapsed_time": "6:12:35", "remaining_time": "0:17:30", "throughput": 7288.58, "total_tokens": 162938880} +{"current_steps": 19900, "total_steps": 20825, "loss": 0.9552, "learning_rate": 2.680952294503075e-07, "epoch": 0.9555822328931572, "percentage": 95.56, "elapsed_time": "6:13:20", "remaining_time": "0:17:21", "throughput": 7277.58, "total_tokens": 163020800} +{"current_steps": 19910, "total_steps": 20825, "loss": 0.9321, "learning_rate": 2.6234001372372194e-07, "epoch": 0.956062424969988, "percentage": 95.61, "elapsed_time": "6:14:05", "remaining_time": "0:17:11", "throughput": 7266.57, "total_tokens": 163102720} +{"current_steps": 19920, "total_steps": 20825, "loss": 0.9948, "learning_rate": 2.5664691805884767e-07, "epoch": 0.9565426170468188, "percentage": 95.65, "elapsed_time": "6:14:50", "remaining_time": "0:17:01", "throughput": 7255.57, "total_tokens": 163184640} +{"current_steps": 19930, "total_steps": 20825, "loss": 0.9796, "learning_rate": 2.5101595675191827e-07, "epoch": 0.9570228091236495, "percentage": 95.7, "elapsed_time": "6:15:36", "remaining_time": "0:16:52", "throughput": 7244.63, "total_tokens": 163266560} +{"current_steps": 19940, "total_steps": 20825, "loss": 0.9892, "learning_rate": 2.4544714394314215e-07, "epoch": 0.9575030012004802, "percentage": 95.75, "elapsed_time": "6:16:21", "remaining_time": "0:16:42", "throughput": 7233.79, "total_tokens": 163348480} +{"current_steps": 19950, "total_steps": 20825, "loss": 1.1706, "learning_rate": 2.399404936166638e-07, "epoch": 0.957983193277311, "percentage": 95.8, "elapsed_time": "6:17:07", "remaining_time": "0:16:32", "throughput": 7222.75, "total_tokens": 163430400} +{"current_steps": 19960, "total_steps": 20825, "loss": 0.7551, "learning_rate": 2.3449601960052746e-07, "epoch": 0.9584633853541417, "percentage": 95.85, "elapsed_time": "6:17:52", "remaining_time": "0:16:22", "throughput": 7212.04, "total_tokens": 163512320} +{"current_steps": 19970, "total_steps": 20825, "loss": 0.7976, "learning_rate": 2.2911373556664118e-07, "epoch": 0.9589435774309724, "percentage": 95.89, "elapsed_time": "6:18:42", "remaining_time": "0:16:12", "throughput": 7199.68, "total_tokens": 163594240} +{"current_steps": 19980, "total_steps": 20825, "loss": 0.8963, "learning_rate": 2.23793655030749e-07, "epoch": 0.9594237695078032, "percentage": 95.94, "elapsed_time": "6:19:30", "remaining_time": "0:16:03", "throughput": 7188.14, "total_tokens": 163676160} +{"current_steps": 19990, "total_steps": 20825, "loss": 0.9375, "learning_rate": 2.1853579135238667e-07, "epoch": 0.9599039615846339, "percentage": 95.99, "elapsed_time": "6:20:16", "remaining_time": "0:15:53", "throughput": 7177.02, "total_tokens": 163758080} +{"current_steps": 20000, "total_steps": 20825, "loss": 1.0805, "learning_rate": 2.1334015773486203e-07, "epoch": 0.9603841536614646, "percentage": 96.04, "elapsed_time": "6:21:09", "remaining_time": "0:15:43", "throughput": 7164.23, "total_tokens": 163840000} +{"current_steps": 20010, "total_steps": 20825, "loss": 0.7723, "learning_rate": 2.0820676722520526e-07, "epoch": 0.9608643457382953, "percentage": 96.09, "elapsed_time": "6:22:05", "remaining_time": "0:15:33", "throughput": 7150.25, "total_tokens": 163921920} +{"current_steps": 20020, "total_steps": 20825, "loss": 0.8981, "learning_rate": 2.0313563271414927e-07, "epoch": 0.9613445378151261, "percentage": 96.13, "elapsed_time": "6:22:54", "remaining_time": "0:15:23", "throughput": 7138.44, "total_tokens": 164003840} +{"current_steps": 20030, "total_steps": 20825, "loss": 0.7376, "learning_rate": 1.9812676693608812e-07, "epoch": 0.9618247298919568, "percentage": 96.18, "elapsed_time": "6:23:41", "remaining_time": "0:15:13", "throughput": 7127.49, "total_tokens": 164085760} +{"current_steps": 20040, "total_steps": 20825, "loss": 0.8382, "learning_rate": 1.9318018246905488e-07, "epoch": 0.9623049219687875, "percentage": 96.23, "elapsed_time": "6:24:29", "remaining_time": "0:15:03", "throughput": 7116.15, "total_tokens": 164167680} +{"current_steps": 20050, "total_steps": 20825, "loss": 0.8877, "learning_rate": 1.8829589173468552e-07, "epoch": 0.9627851140456183, "percentage": 96.28, "elapsed_time": "6:25:17", "remaining_time": "0:14:53", "throughput": 7104.92, "total_tokens": 164249600} +{"current_steps": 20060, "total_steps": 20825, "loss": 0.7448, "learning_rate": 1.8347390699817724e-07, "epoch": 0.963265306122449, "percentage": 96.33, "elapsed_time": "6:26:06", "remaining_time": "0:14:43", "throughput": 7093.55, "total_tokens": 164331520} +{"current_steps": 20070, "total_steps": 20825, "loss": 0.9267, "learning_rate": 1.7871424036828288e-07, "epoch": 0.9637454981992797, "percentage": 96.37, "elapsed_time": "6:26:52", "remaining_time": "0:14:33", "throughput": 7082.92, "total_tokens": 164413440} +{"current_steps": 20080, "total_steps": 20825, "loss": 0.9753, "learning_rate": 1.7401690379724722e-07, "epoch": 0.9642256902761105, "percentage": 96.42, "elapsed_time": "6:27:38", "remaining_time": "0:14:22", "throughput": 7072.54, "total_tokens": 164495360} +{"current_steps": 20090, "total_steps": 20825, "loss": 0.8417, "learning_rate": 1.6938190908080688e-07, "epoch": 0.9647058823529412, "percentage": 96.47, "elapsed_time": "6:28:24", "remaining_time": "0:14:12", "throughput": 7062.14, "total_tokens": 164577280} +{"current_steps": 20100, "total_steps": 20825, "loss": 0.7834, "learning_rate": 1.6480926785814866e-07, "epoch": 0.9651860744297719, "percentage": 96.52, "elapsed_time": "6:29:09", "remaining_time": "0:14:02", "throughput": 7051.79, "total_tokens": 164659200} +{"current_steps": 20110, "total_steps": 20825, "loss": 1.0118, "learning_rate": 1.6029899161187079e-07, "epoch": 0.9656662665066026, "percentage": 96.57, "elapsed_time": "6:29:56", "remaining_time": "0:13:51", "throughput": 7041.42, "total_tokens": 164741120} +{"current_steps": 20120, "total_steps": 20825, "loss": 0.7969, "learning_rate": 1.5585109166796896e-07, "epoch": 0.9661464585834334, "percentage": 96.61, "elapsed_time": "6:30:42", "remaining_time": "0:13:41", "throughput": 7030.92, "total_tokens": 164823040} +{"current_steps": 20130, "total_steps": 20825, "loss": 0.9373, "learning_rate": 1.5146557919581138e-07, "epoch": 0.9666266506602641, "percentage": 96.66, "elapsed_time": "6:31:29", "remaining_time": "0:13:30", "throughput": 7020.47, "total_tokens": 164904960} +{"current_steps": 20140, "total_steps": 20825, "loss": 0.717, "learning_rate": 1.4714246520808328e-07, "epoch": 0.9671068427370948, "percentage": 96.71, "elapsed_time": "6:32:17", "remaining_time": "0:13:20", "throughput": 7009.56, "total_tokens": 164986880} +{"current_steps": 20150, "total_steps": 20825, "loss": 0.8529, "learning_rate": 1.4288176056079238e-07, "epoch": 0.9675870348139256, "percentage": 96.76, "elapsed_time": "6:33:05", "remaining_time": "0:13:10", "throughput": 6998.87, "total_tokens": 165068800} +{"current_steps": 20160, "total_steps": 20825, "loss": 0.8958, "learning_rate": 1.3868347595322184e-07, "epoch": 0.9680672268907563, "percentage": 96.81, "elapsed_time": "6:33:55", "remaining_time": "0:12:59", "throughput": 6987.47, "total_tokens": 165150720} +{"current_steps": 20170, "total_steps": 20825, "loss": 1.1627, "learning_rate": 1.3454762192790794e-07, "epoch": 0.968547418967587, "percentage": 96.85, "elapsed_time": "6:34:43", "remaining_time": "0:12:49", "throughput": 6976.74, "total_tokens": 165232640} +{"current_steps": 20180, "total_steps": 20825, "loss": 1.0033, "learning_rate": 1.3047420887061513e-07, "epoch": 0.9690276110444178, "percentage": 96.9, "elapsed_time": "6:35:30", "remaining_time": "0:12:38", "throughput": 6966.24, "total_tokens": 165314560} +{"current_steps": 20190, "total_steps": 20825, "loss": 0.8922, "learning_rate": 1.264632470103111e-07, "epoch": 0.9695078031212485, "percentage": 96.95, "elapsed_time": "6:36:16", "remaining_time": "0:12:27", "throughput": 6956.35, "total_tokens": 165396480} +{"current_steps": 20200, "total_steps": 20825, "loss": 0.9253, "learning_rate": 1.225147464191334e-07, "epoch": 0.9699879951980792, "percentage": 97.0, "elapsed_time": "6:37:01", "remaining_time": "0:12:17", "throughput": 6946.51, "total_tokens": 165478400} +{"current_steps": 20210, "total_steps": 20825, "loss": 0.7544, "learning_rate": 1.1862871701237288e-07, "epoch": 0.9704681872749099, "percentage": 97.05, "elapsed_time": "6:37:47", "remaining_time": "0:12:06", "throughput": 6936.67, "total_tokens": 165560320} +{"current_steps": 20220, "total_steps": 20825, "loss": 0.7983, "learning_rate": 1.1480516854844858e-07, "epoch": 0.9709483793517407, "percentage": 97.09, "elapsed_time": "6:38:33", "remaining_time": "0:11:55", "throughput": 6926.87, "total_tokens": 165642240} +{"current_steps": 20230, "total_steps": 20825, "loss": 0.7969, "learning_rate": 1.1104411062887732e-07, "epoch": 0.9714285714285714, "percentage": 97.14, "elapsed_time": "6:39:18", "remaining_time": "0:11:44", "throughput": 6917.14, "total_tokens": 165724160} +{"current_steps": 20240, "total_steps": 20825, "loss": 0.7713, "learning_rate": 1.0734555269825141e-07, "epoch": 0.9719087635054021, "percentage": 97.19, "elapsed_time": "6:40:04", "remaining_time": "0:11:33", "throughput": 6907.21, "total_tokens": 165806080} +{"current_steps": 20250, "total_steps": 20825, "loss": 0.7452, "learning_rate": 1.0370950404421931e-07, "epoch": 0.9723889555822329, "percentage": 97.24, "elapsed_time": "6:40:53", "remaining_time": "0:11:22", "throughput": 6896.71, "total_tokens": 165888000} +{"current_steps": 20260, "total_steps": 20825, "loss": 0.8992, "learning_rate": 1.0013597379745776e-07, "epoch": 0.9728691476590636, "percentage": 97.29, "elapsed_time": "6:41:43", "remaining_time": "0:11:12", "throughput": 6885.8, "total_tokens": 165969920} +{"current_steps": 20270, "total_steps": 20825, "loss": 0.7645, "learning_rate": 9.662497093164691e-08, "epoch": 0.9733493397358943, "percentage": 97.33, "elapsed_time": "6:42:33", "remaining_time": "0:11:01", "throughput": 6874.8, "total_tokens": 166051840} +{"current_steps": 20280, "total_steps": 20825, "loss": 0.9752, "learning_rate": 9.317650426345637e-08, "epoch": 0.9738295318127251, "percentage": 97.38, "elapsed_time": "6:43:23", "remaining_time": "0:10:50", "throughput": 6864.02, "total_tokens": 166133760} +{"current_steps": 20290, "total_steps": 20825, "loss": 0.8634, "learning_rate": 8.979058245251193e-08, "epoch": 0.9743097238895558, "percentage": 97.43, "elapsed_time": "6:44:09", "remaining_time": "0:10:39", "throughput": 6854.29, "total_tokens": 166215680} +{"current_steps": 20300, "total_steps": 20825, "loss": 1.0172, "learning_rate": 8.646721400138724e-08, "epoch": 0.9747899159663865, "percentage": 97.48, "elapsed_time": "6:44:55", "remaining_time": "0:10:28", "throughput": 6844.82, "total_tokens": 166297600} +{"current_steps": 20310, "total_steps": 20825, "loss": 0.9079, "learning_rate": 8.320640725556773e-08, "epoch": 0.9752701080432172, "percentage": 97.53, "elapsed_time": "6:45:41", "remaining_time": "0:10:17", "throughput": 6835.28, "total_tokens": 166379520} +{"current_steps": 20320, "total_steps": 20825, "loss": 0.9436, "learning_rate": 8.000817040344222e-08, "epoch": 0.975750300120048, "percentage": 97.58, "elapsed_time": "6:46:27", "remaining_time": "0:10:06", "throughput": 6825.72, "total_tokens": 166461440} +{"current_steps": 20330, "total_steps": 20825, "loss": 0.8307, "learning_rate": 7.687251147627251e-08, "epoch": 0.9762304921968787, "percentage": 97.62, "elapsed_time": "6:47:13", "remaining_time": "0:09:54", "throughput": 6816.32, "total_tokens": 166543360} +{"current_steps": 20340, "total_steps": 20825, "loss": 0.7941, "learning_rate": 7.379943834818214e-08, "epoch": 0.9767106842737094, "percentage": 97.67, "elapsed_time": "6:47:59", "remaining_time": "0:09:43", "throughput": 6806.75, "total_tokens": 166625280} +{"current_steps": 20350, "total_steps": 20825, "loss": 0.6886, "learning_rate": 7.0788958736126e-08, "epoch": 0.9771908763505402, "percentage": 97.72, "elapsed_time": "6:48:48", "remaining_time": "0:09:32", "throughput": 6796.37, "total_tokens": 166707200} +{"current_steps": 20360, "total_steps": 20825, "loss": 0.8575, "learning_rate": 6.784108019988189e-08, "epoch": 0.977671068427371, "percentage": 97.77, "elapsed_time": "6:49:38", "remaining_time": "0:09:21", "throughput": 6785.91, "total_tokens": 166789120} +{"current_steps": 20370, "total_steps": 20825, "loss": 0.7712, "learning_rate": 6.495581014202556e-08, "epoch": 0.9781512605042016, "percentage": 97.82, "elapsed_time": "6:50:28", "remaining_time": "0:09:10", "throughput": 6775.53, "total_tokens": 166871040} +{"current_steps": 20380, "total_steps": 20825, "loss": 0.9243, "learning_rate": 6.213315580791135e-08, "epoch": 0.9786314525810325, "percentage": 97.86, "elapsed_time": "6:51:18", "remaining_time": "0:08:58", "throughput": 6765.03, "total_tokens": 166952960} +{"current_steps": 20390, "total_steps": 20825, "loss": 0.8171, "learning_rate": 5.9373124285661e-08, "epoch": 0.9791116446578632, "percentage": 97.91, "elapsed_time": "6:52:08", "remaining_time": "0:08:47", "throughput": 6754.84, "total_tokens": 167034880} +{"current_steps": 20400, "total_steps": 20825, "loss": 0.86, "learning_rate": 5.6675722506135956e-08, "epoch": 0.9795918367346939, "percentage": 97.96, "elapsed_time": "6:52:58", "remaining_time": "0:08:36", "throughput": 6744.4, "total_tokens": 167116800} +{"current_steps": 20410, "total_steps": 20825, "loss": 0.9734, "learning_rate": 5.404095724292346e-08, "epoch": 0.9800720288115247, "percentage": 98.01, "elapsed_time": "6:53:47", "remaining_time": "0:08:24", "throughput": 6734.3, "total_tokens": 167198720} +{"current_steps": 20420, "total_steps": 20825, "loss": 0.9059, "learning_rate": 5.146883511232825e-08, "epoch": 0.9805522208883554, "percentage": 98.06, "elapsed_time": "6:54:35", "remaining_time": "0:08:13", "throughput": 6724.8, "total_tokens": 167280640} +{"current_steps": 20430, "total_steps": 20825, "loss": 0.8805, "learning_rate": 4.8959362573341995e-08, "epoch": 0.9810324129651861, "percentage": 98.1, "elapsed_time": "6:55:22", "remaining_time": "0:08:01", "throughput": 6715.37, "total_tokens": 167362560} +{"current_steps": 20440, "total_steps": 20825, "loss": 0.8186, "learning_rate": 4.6512545927632213e-08, "epoch": 0.9815126050420168, "percentage": 98.15, "elapsed_time": "6:56:09", "remaining_time": "0:07:50", "throughput": 6706.09, "total_tokens": 167444480} +{"current_steps": 20450, "total_steps": 20825, "loss": 0.9007, "learning_rate": 4.412839131953395e-08, "epoch": 0.9819927971188476, "percentage": 98.2, "elapsed_time": "6:56:56", "remaining_time": "0:07:38", "throughput": 6696.67, "total_tokens": 167526400} +{"current_steps": 20460, "total_steps": 20825, "loss": 1.0011, "learning_rate": 4.180690473602755e-08, "epoch": 0.9824729891956783, "percentage": 98.25, "elapsed_time": "6:57:43", "remaining_time": "0:07:27", "throughput": 6687.35, "total_tokens": 167608320} +{"current_steps": 20470, "total_steps": 20825, "loss": 0.7579, "learning_rate": 3.9548092006719275e-08, "epoch": 0.982953181272509, "percentage": 98.3, "elapsed_time": "6:58:29", "remaining_time": "0:07:15", "throughput": 6678.32, "total_tokens": 167690240} +{"current_steps": 20480, "total_steps": 20825, "loss": 1.0422, "learning_rate": 3.7351958803835685e-08, "epoch": 0.9834333733493398, "percentage": 98.34, "elapsed_time": "6:59:16", "remaining_time": "0:07:03", "throughput": 6669.08, "total_tokens": 167772160} +{"current_steps": 20490, "total_steps": 20825, "loss": 1.1318, "learning_rate": 3.5218510642201496e-08, "epoch": 0.9839135654261705, "percentage": 98.39, "elapsed_time": "7:00:04", "remaining_time": "0:06:52", "throughput": 6659.74, "total_tokens": 167854080} +{"current_steps": 20500, "total_steps": 20825, "loss": 1.0579, "learning_rate": 3.314775287923677e-08, "epoch": 0.9843937575030012, "percentage": 98.44, "elapsed_time": "7:00:52", "remaining_time": "0:06:40", "throughput": 6650.15, "total_tokens": 167936000} +{"current_steps": 20510, "total_steps": 20825, "loss": 0.9065, "learning_rate": 3.1139690714931945e-08, "epoch": 0.984873949579832, "percentage": 98.49, "elapsed_time": "7:01:42", "remaining_time": "0:06:28", "throughput": 6640.43, "total_tokens": 168017920} +{"current_steps": 20520, "total_steps": 20825, "loss": 0.7413, "learning_rate": 2.919432919183396e-08, "epoch": 0.9853541416566627, "percentage": 98.54, "elapsed_time": "7:02:27", "remaining_time": "0:06:16", "throughput": 6631.77, "total_tokens": 168099840} +{"current_steps": 20530, "total_steps": 20825, "loss": 0.7307, "learning_rate": 2.731167319505179e-08, "epoch": 0.9858343337334934, "percentage": 98.58, "elapsed_time": "7:03:14", "remaining_time": "0:06:04", "throughput": 6622.88, "total_tokens": 168181760} +{"current_steps": 20540, "total_steps": 20825, "loss": 0.7627, "learning_rate": 2.5491727452217616e-08, "epoch": 0.9863145258103241, "percentage": 98.63, "elapsed_time": "7:04:01", "remaining_time": "0:05:53", "throughput": 6613.81, "total_tokens": 168263680} +{"current_steps": 20550, "total_steps": 20825, "loss": 0.9042, "learning_rate": 2.3734496533497907e-08, "epoch": 0.9867947178871549, "percentage": 98.68, "elapsed_time": "7:04:48", "remaining_time": "0:05:41", "throughput": 6604.81, "total_tokens": 168345600} +{"current_steps": 20560, "total_steps": 20825, "loss": 0.9611, "learning_rate": 2.203998485156844e-08, "epoch": 0.9872749099639856, "percentage": 98.73, "elapsed_time": "7:05:37", "remaining_time": "0:05:29", "throughput": 6595.34, "total_tokens": 168427520} +{"current_steps": 20570, "total_steps": 20825, "loss": 1.0542, "learning_rate": 2.040819666160876e-08, "epoch": 0.9877551020408163, "percentage": 98.78, "elapsed_time": "7:06:25", "remaining_time": "0:05:17", "throughput": 6586.07, "total_tokens": 168509440} +{"current_steps": 20580, "total_steps": 20825, "loss": 1.0403, "learning_rate": 1.8839136061288288e-08, "epoch": 0.9882352941176471, "percentage": 98.82, "elapsed_time": "7:07:13", "remaining_time": "0:05:05", "throughput": 6576.92, "total_tokens": 168591360} +{"current_steps": 20590, "total_steps": 20825, "loss": 1.1069, "learning_rate": 1.7332806990758012e-08, "epoch": 0.9887154861944778, "percentage": 98.87, "elapsed_time": "7:08:04", "remaining_time": "0:04:53", "throughput": 6567.05, "total_tokens": 168673280} +{"current_steps": 20600, "total_steps": 20825, "loss": 0.8757, "learning_rate": 1.5889213232644917e-08, "epoch": 0.9891956782713085, "percentage": 98.92, "elapsed_time": "7:08:51", "remaining_time": "0:04:41", "throughput": 6558.3, "total_tokens": 168755200} +{"current_steps": 20610, "total_steps": 20825, "loss": 1.2612, "learning_rate": 1.4508358412032575e-08, "epoch": 0.9896758703481393, "percentage": 98.97, "elapsed_time": "7:09:38", "remaining_time": "0:04:28", "throughput": 6549.53, "total_tokens": 168837120} +{"current_steps": 20620, "total_steps": 20825, "loss": 0.9593, "learning_rate": 1.319024599645835e-08, "epoch": 0.99015606242497, "percentage": 99.02, "elapsed_time": "7:10:25", "remaining_time": "0:04:16", "throughput": 6540.73, "total_tokens": 168919040} +{"current_steps": 20630, "total_steps": 20825, "loss": 0.7466, "learning_rate": 1.1934879295905089e-08, "epoch": 0.9906362545018007, "percentage": 99.06, "elapsed_time": "7:11:12", "remaining_time": "0:04:04", "throughput": 6532.18, "total_tokens": 169000960} +{"current_steps": 20640, "total_steps": 20825, "loss": 1.0652, "learning_rate": 1.074226146279278e-08, "epoch": 0.9911164465786314, "percentage": 99.11, "elapsed_time": "7:11:58", "remaining_time": "0:03:52", "throughput": 6523.61, "total_tokens": 169082880} +{"current_steps": 20650, "total_steps": 20825, "loss": 1.0358, "learning_rate": 9.612395491970239e-09, "epoch": 0.9915966386554622, "percentage": 99.16, "elapsed_time": "7:12:45", "remaining_time": "0:03:40", "throughput": 6514.98, "total_tokens": 169164800} +{"current_steps": 20660, "total_steps": 20825, "loss": 0.8794, "learning_rate": 8.545284220698446e-09, "epoch": 0.9920768307322929, "percentage": 99.21, "elapsed_time": "7:13:31", "remaining_time": "0:03:27", "throughput": 6506.57, "total_tokens": 169246720} +{"current_steps": 20670, "total_steps": 20825, "loss": 0.8482, "learning_rate": 7.540930328658879e-09, "epoch": 0.9925570228091236, "percentage": 99.26, "elapsed_time": "7:14:17", "remaining_time": "0:03:15", "throughput": 6498.31, "total_tokens": 169328640} +{"current_steps": 20680, "total_steps": 20825, "loss": 1.0116, "learning_rate": 6.599336337942408e-09, "epoch": 0.9930372148859544, "percentage": 99.3, "elapsed_time": "7:15:03", "remaining_time": "0:03:03", "throughput": 6490.03, "total_tokens": 169410560} +{"current_steps": 20690, "total_steps": 20825, "loss": 0.7456, "learning_rate": 5.720504613035416e-09, "epoch": 0.9935174069627851, "percentage": 99.35, "elapsed_time": "7:15:49", "remaining_time": "0:02:50", "throughput": 6481.65, "total_tokens": 169492480} +{"current_steps": 20700, "total_steps": 20825, "loss": 0.8412, "learning_rate": 4.904437360814252e-09, "epoch": 0.9939975990396158, "percentage": 99.4, "elapsed_time": "7:16:36", "remaining_time": "0:02:38", "throughput": 6473.12, "total_tokens": 169574400} +{"current_steps": 20710, "total_steps": 20825, "loss": 1.024, "learning_rate": 4.151136630553554e-09, "epoch": 0.9944777911164466, "percentage": 99.45, "elapsed_time": "7:17:25", "remaining_time": "0:02:25", "throughput": 6464.23, "total_tokens": 169656320} +{"current_steps": 20720, "total_steps": 20825, "loss": 1.1113, "learning_rate": 3.4606043139068234e-09, "epoch": 0.9949579831932773, "percentage": 99.5, "elapsed_time": "7:18:13", "remaining_time": "0:02:13", "throughput": 6455.63, "total_tokens": 169738240} +{"current_steps": 20730, "total_steps": 20825, "loss": 0.9721, "learning_rate": 2.832842144903647e-09, "epoch": 0.995438175270108, "percentage": 99.54, "elapsed_time": "7:19:01", "remaining_time": "0:02:00", "throughput": 6446.84, "total_tokens": 169820160} +{"current_steps": 20740, "total_steps": 20825, "loss": 0.7684, "learning_rate": 2.2678516999552478e-09, "epoch": 0.9959183673469387, "percentage": 99.59, "elapsed_time": "7:19:49", "remaining_time": "0:01:48", "throughput": 6438.29, "total_tokens": 169902080} +{"current_steps": 20750, "total_steps": 20825, "loss": 0.9727, "learning_rate": 1.7656343978378342e-09, "epoch": 0.9963985594237695, "percentage": 99.64, "elapsed_time": "7:20:37", "remaining_time": "0:01:35", "throughput": 6429.72, "total_tokens": 169984000} +{"current_steps": 20760, "total_steps": 20825, "loss": 1.121, "learning_rate": 1.3261914996953728e-09, "epoch": 0.9968787515006002, "percentage": 99.69, "elapsed_time": "7:21:24", "remaining_time": "0:01:22", "throughput": 6421.3, "total_tokens": 170065920} +{"current_steps": 20770, "total_steps": 20825, "loss": 0.9879, "learning_rate": 9.49524109034039e-10, "epoch": 0.9973589435774309, "percentage": 99.74, "elapsed_time": "7:22:14", "remaining_time": "0:01:10", "throughput": 6412.43, "total_tokens": 170147840} +{"current_steps": 20780, "total_steps": 20825, "loss": 0.8828, "learning_rate": 6.356331717305431e-10, "epoch": 0.9978391356542617, "percentage": 99.78, "elapsed_time": "7:23:02", "remaining_time": "0:00:57", "throughput": 6403.76, "total_tokens": 170229760} +{"current_steps": 20790, "total_steps": 20825, "loss": 0.9171, "learning_rate": 3.8451947600437466e-10, "epoch": 0.9983193277310924, "percentage": 99.83, "elapsed_time": "7:23:51", "remaining_time": "0:00:44", "throughput": 6395.15, "total_tokens": 170311680} +{"current_steps": 20800, "total_steps": 20825, "loss": 0.803, "learning_rate": 1.9618365244833404e-10, "epoch": 0.9987995198079231, "percentage": 99.88, "elapsed_time": "7:24:40", "remaining_time": "0:00:32", "throughput": 6386.41, "total_tokens": 170393600} +{"current_steps": 20810, "total_steps": 20825, "loss": 0.9032, "learning_rate": 7.062617399800075e-11, "epoch": 0.999279711884754, "percentage": 99.93, "elapsed_time": "7:25:28", "remaining_time": "0:00:19", "throughput": 6378.12, "total_tokens": 170475520} +{"current_steps": 20820, "total_steps": 20825, "loss": 0.9376, "learning_rate": 7.847355951162705e-12, "epoch": 0.9997599039615847, "percentage": 99.98, "elapsed_time": "7:26:16", "remaining_time": "0:00:06", "throughput": 6369.63, "total_tokens": 170557440} +{"current_steps": 20825, "total_steps": 20825, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "7:26:45", "remaining_time": "0:00:00", "throughput": 6364.37, "total_tokens": 170598400}