{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9945838423368396, "eval_steps": 500, "global_step": 92000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 7.204610951008646e-08, "loss": 40.7934, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.4409221902017293e-07, "loss": 41.0886, "step": 20 }, { "epoch": 0.0, "learning_rate": 2.161383285302594e-07, "loss": 41.8685, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.8818443804034586e-07, "loss": 41.0512, "step": 40 }, { "epoch": 0.0, "learning_rate": 3.602305475504323e-07, "loss": 41.2927, "step": 50 }, { "epoch": 0.0, "learning_rate": 4.322766570605188e-07, "loss": 41.1536, "step": 60 }, { "epoch": 0.0, "learning_rate": 5.043227665706053e-07, "loss": 40.2115, "step": 70 }, { "epoch": 0.0, "learning_rate": 5.763688760806917e-07, "loss": 40.967, "step": 80 }, { "epoch": 0.0, "learning_rate": 6.484149855907781e-07, "loss": 39.5403, "step": 90 }, { "epoch": 0.0, "learning_rate": 7.204610951008646e-07, "loss": 40.4143, "step": 100 }, { "epoch": 0.0, "learning_rate": 7.925072046109511e-07, "loss": 40.5635, "step": 110 }, { "epoch": 0.0, "learning_rate": 8.645533141210376e-07, "loss": 40.3297, "step": 120 }, { "epoch": 0.0, "learning_rate": 9.36599423631124e-07, "loss": 38.3564, "step": 130 }, { "epoch": 0.0, "learning_rate": 1.0086455331412106e-06, "loss": 39.4037, "step": 140 }, { "epoch": 0.0, "learning_rate": 1.0806916426512968e-06, "loss": 38.8617, "step": 150 }, { "epoch": 0.0, "learning_rate": 1.1527377521613834e-06, "loss": 39.2414, "step": 160 }, { "epoch": 0.0, "learning_rate": 1.2247838616714698e-06, "loss": 37.3156, "step": 170 }, { "epoch": 0.0, "learning_rate": 1.2968299711815562e-06, "loss": 38.5521, "step": 180 }, { "epoch": 0.0, "learning_rate": 1.3688760806916426e-06, "loss": 37.5909, "step": 190 }, { "epoch": 0.0, "learning_rate": 1.4409221902017292e-06, "loss": 37.2313, "step": 200 }, { "epoch": 0.0, "learning_rate": 1.5129682997118156e-06, "loss": 37.6566, "step": 210 }, { "epoch": 0.0, "learning_rate": 1.5850144092219022e-06, "loss": 35.8199, "step": 220 }, { "epoch": 0.0, "learning_rate": 1.6570605187319886e-06, "loss": 37.0948, "step": 230 }, { "epoch": 0.0, "learning_rate": 1.7291066282420752e-06, "loss": 35.7497, "step": 240 }, { "epoch": 0.0, "learning_rate": 1.8011527377521614e-06, "loss": 34.7709, "step": 250 }, { "epoch": 0.0, "learning_rate": 1.873198847262248e-06, "loss": 34.1054, "step": 260 }, { "epoch": 0.0, "learning_rate": 1.9452449567723344e-06, "loss": 31.4402, "step": 270 }, { "epoch": 0.0, "learning_rate": 2.0172910662824213e-06, "loss": 31.3028, "step": 280 }, { "epoch": 0.0, "learning_rate": 2.0893371757925072e-06, "loss": 31.2182, "step": 290 }, { "epoch": 0.0, "learning_rate": 2.1613832853025936e-06, "loss": 30.2191, "step": 300 }, { "epoch": 0.0, "learning_rate": 2.2334293948126804e-06, "loss": 30.3314, "step": 310 }, { "epoch": 0.0, "learning_rate": 2.305475504322767e-06, "loss": 29.9731, "step": 320 }, { "epoch": 0.0, "learning_rate": 2.3775216138328532e-06, "loss": 29.1036, "step": 330 }, { "epoch": 0.0, "learning_rate": 2.4495677233429396e-06, "loss": 28.6919, "step": 340 }, { "epoch": 0.0, "learning_rate": 2.521613832853026e-06, "loss": 28.3299, "step": 350 }, { "epoch": 0.0, "learning_rate": 2.5936599423631124e-06, "loss": 28.5708, "step": 360 }, { "epoch": 0.0, "learning_rate": 2.6657060518731993e-06, "loss": 28.4714, "step": 370 }, { "epoch": 0.0, "learning_rate": 2.7377521613832852e-06, "loss": 28.7939, "step": 380 }, { "epoch": 0.0, "learning_rate": 2.809798270893372e-06, "loss": 27.8217, "step": 390 }, { "epoch": 0.0, "learning_rate": 2.8818443804034585e-06, "loss": 27.9538, "step": 400 }, { "epoch": 0.0, "learning_rate": 2.9538904899135453e-06, "loss": 27.6477, "step": 410 }, { "epoch": 0.0, "learning_rate": 3.0259365994236312e-06, "loss": 28.4057, "step": 420 }, { "epoch": 0.0, "learning_rate": 3.0979827089337176e-06, "loss": 28.0097, "step": 430 }, { "epoch": 0.0, "learning_rate": 3.1700288184438045e-06, "loss": 27.9475, "step": 440 }, { "epoch": 0.0, "learning_rate": 3.242074927953891e-06, "loss": 27.4961, "step": 450 }, { "epoch": 0.0, "learning_rate": 3.3141210374639773e-06, "loss": 28.3134, "step": 460 }, { "epoch": 0.01, "learning_rate": 3.3861671469740637e-06, "loss": 27.8873, "step": 470 }, { "epoch": 0.01, "learning_rate": 3.4582132564841505e-06, "loss": 27.2717, "step": 480 }, { "epoch": 0.01, "learning_rate": 3.5302593659942365e-06, "loss": 27.4766, "step": 490 }, { "epoch": 0.01, "learning_rate": 3.602305475504323e-06, "loss": 26.5888, "step": 500 }, { "epoch": 0.01, "learning_rate": 3.6743515850144097e-06, "loss": 27.3916, "step": 510 }, { "epoch": 0.01, "learning_rate": 3.746397694524496e-06, "loss": 26.5531, "step": 520 }, { "epoch": 0.01, "learning_rate": 3.8184438040345825e-06, "loss": 27.0254, "step": 530 }, { "epoch": 0.01, "learning_rate": 3.890489913544669e-06, "loss": 26.8229, "step": 540 }, { "epoch": 0.01, "learning_rate": 3.962536023054755e-06, "loss": 27.0594, "step": 550 }, { "epoch": 0.01, "learning_rate": 4.0345821325648425e-06, "loss": 26.4456, "step": 560 }, { "epoch": 0.01, "learning_rate": 4.106628242074928e-06, "loss": 26.9111, "step": 570 }, { "epoch": 0.01, "learning_rate": 4.1786743515850145e-06, "loss": 25.9854, "step": 580 }, { "epoch": 0.01, "learning_rate": 4.250720461095102e-06, "loss": 26.2041, "step": 590 }, { "epoch": 0.01, "learning_rate": 4.322766570605187e-06, "loss": 26.3374, "step": 600 }, { "epoch": 0.01, "learning_rate": 4.394812680115274e-06, "loss": 26.101, "step": 610 }, { "epoch": 0.01, "learning_rate": 4.466858789625361e-06, "loss": 25.7367, "step": 620 }, { "epoch": 0.01, "learning_rate": 4.538904899135447e-06, "loss": 25.5494, "step": 630 }, { "epoch": 0.01, "learning_rate": 4.610951008645534e-06, "loss": 27.2019, "step": 640 }, { "epoch": 0.01, "learning_rate": 4.68299711815562e-06, "loss": 26.8521, "step": 650 }, { "epoch": 0.01, "learning_rate": 4.7550432276657065e-06, "loss": 26.0675, "step": 660 }, { "epoch": 0.01, "learning_rate": 4.827089337175793e-06, "loss": 25.2451, "step": 670 }, { "epoch": 0.01, "learning_rate": 4.899135446685879e-06, "loss": 25.8683, "step": 680 }, { "epoch": 0.01, "learning_rate": 4.971181556195966e-06, "loss": 25.3715, "step": 690 }, { "epoch": 0.01, "learning_rate": 5.043227665706052e-06, "loss": 26.3587, "step": 700 }, { "epoch": 0.01, "learning_rate": 5.1152737752161385e-06, "loss": 26.8675, "step": 710 }, { "epoch": 0.01, "learning_rate": 5.187319884726225e-06, "loss": 25.66, "step": 720 }, { "epoch": 0.01, "learning_rate": 5.259365994236312e-06, "loss": 25.7181, "step": 730 }, { "epoch": 0.01, "learning_rate": 5.3314121037463985e-06, "loss": 26.5402, "step": 740 }, { "epoch": 0.01, "learning_rate": 5.403458213256485e-06, "loss": 26.038, "step": 750 }, { "epoch": 0.01, "learning_rate": 5.4755043227665705e-06, "loss": 26.2257, "step": 760 }, { "epoch": 0.01, "learning_rate": 5.547550432276657e-06, "loss": 26.0365, "step": 770 }, { "epoch": 0.01, "learning_rate": 5.619596541786744e-06, "loss": 25.544, "step": 780 }, { "epoch": 0.01, "learning_rate": 5.6916426512968305e-06, "loss": 25.4091, "step": 790 }, { "epoch": 0.01, "learning_rate": 5.763688760806917e-06, "loss": 25.4503, "step": 800 }, { "epoch": 0.01, "learning_rate": 5.835734870317003e-06, "loss": 25.2717, "step": 810 }, { "epoch": 0.01, "learning_rate": 5.9077809798270905e-06, "loss": 25.3723, "step": 820 }, { "epoch": 0.01, "learning_rate": 5.979827089337177e-06, "loss": 25.0774, "step": 830 }, { "epoch": 0.01, "learning_rate": 6.0518731988472625e-06, "loss": 26.0952, "step": 840 }, { "epoch": 0.01, "learning_rate": 6.123919308357349e-06, "loss": 25.7269, "step": 850 }, { "epoch": 0.01, "learning_rate": 6.195965417867435e-06, "loss": 25.1514, "step": 860 }, { "epoch": 0.01, "learning_rate": 6.2680115273775225e-06, "loss": 25.7952, "step": 870 }, { "epoch": 0.01, "learning_rate": 6.340057636887609e-06, "loss": 25.5564, "step": 880 }, { "epoch": 0.01, "learning_rate": 6.412103746397695e-06, "loss": 25.1046, "step": 890 }, { "epoch": 0.01, "learning_rate": 6.484149855907782e-06, "loss": 24.5227, "step": 900 }, { "epoch": 0.01, "learning_rate": 6.556195965417867e-06, "loss": 25.8436, "step": 910 }, { "epoch": 0.01, "learning_rate": 6.6282420749279545e-06, "loss": 25.1957, "step": 920 }, { "epoch": 0.01, "learning_rate": 6.700288184438041e-06, "loss": 25.2908, "step": 930 }, { "epoch": 0.01, "learning_rate": 6.772334293948127e-06, "loss": 24.8572, "step": 940 }, { "epoch": 0.01, "learning_rate": 6.844380403458214e-06, "loss": 25.1435, "step": 950 }, { "epoch": 0.01, "learning_rate": 6.916426512968301e-06, "loss": 25.9543, "step": 960 }, { "epoch": 0.01, "learning_rate": 6.988472622478387e-06, "loss": 24.8998, "step": 970 }, { "epoch": 0.01, "learning_rate": 7.060518731988473e-06, "loss": 25.1284, "step": 980 }, { "epoch": 0.01, "learning_rate": 7.132564841498559e-06, "loss": 25.4522, "step": 990 }, { "epoch": 0.01, "learning_rate": 7.204610951008646e-06, "loss": 25.0667, "step": 1000 }, { "epoch": 0.01, "learning_rate": 7.276657060518733e-06, "loss": 25.3568, "step": 1010 }, { "epoch": 0.01, "learning_rate": 7.348703170028819e-06, "loss": 25.0221, "step": 1020 }, { "epoch": 0.01, "learning_rate": 7.420749279538906e-06, "loss": 25.1098, "step": 1030 }, { "epoch": 0.01, "learning_rate": 7.492795389048992e-06, "loss": 25.2133, "step": 1040 }, { "epoch": 0.01, "learning_rate": 7.564841498559078e-06, "loss": 24.9687, "step": 1050 }, { "epoch": 0.01, "learning_rate": 7.636887608069165e-06, "loss": 25.0376, "step": 1060 }, { "epoch": 0.01, "learning_rate": 7.70893371757925e-06, "loss": 25.7512, "step": 1070 }, { "epoch": 0.01, "learning_rate": 7.780979827089338e-06, "loss": 25.2528, "step": 1080 }, { "epoch": 0.01, "learning_rate": 7.853025936599425e-06, "loss": 25.5825, "step": 1090 }, { "epoch": 0.01, "learning_rate": 7.92507204610951e-06, "loss": 25.2662, "step": 1100 }, { "epoch": 0.01, "learning_rate": 7.997118155619598e-06, "loss": 25.0687, "step": 1110 }, { "epoch": 0.01, "learning_rate": 8.069164265129685e-06, "loss": 24.891, "step": 1120 }, { "epoch": 0.01, "learning_rate": 8.141210374639769e-06, "loss": 25.0254, "step": 1130 }, { "epoch": 0.01, "learning_rate": 8.213256484149856e-06, "loss": 25.4397, "step": 1140 }, { "epoch": 0.01, "learning_rate": 8.285302593659943e-06, "loss": 25.0585, "step": 1150 }, { "epoch": 0.01, "learning_rate": 8.357348703170029e-06, "loss": 24.7829, "step": 1160 }, { "epoch": 0.01, "learning_rate": 8.429394812680116e-06, "loss": 25.7702, "step": 1170 }, { "epoch": 0.01, "learning_rate": 8.501440922190203e-06, "loss": 24.5915, "step": 1180 }, { "epoch": 0.01, "learning_rate": 8.573487031700289e-06, "loss": 25.071, "step": 1190 }, { "epoch": 0.01, "learning_rate": 8.645533141210375e-06, "loss": 24.988, "step": 1200 }, { "epoch": 0.01, "learning_rate": 8.717579250720462e-06, "loss": 26.0045, "step": 1210 }, { "epoch": 0.01, "learning_rate": 8.789625360230547e-06, "loss": 25.0847, "step": 1220 }, { "epoch": 0.01, "learning_rate": 8.861671469740635e-06, "loss": 24.2152, "step": 1230 }, { "epoch": 0.01, "learning_rate": 8.933717579250722e-06, "loss": 24.6915, "step": 1240 }, { "epoch": 0.01, "learning_rate": 9.005763688760807e-06, "loss": 24.8996, "step": 1250 }, { "epoch": 0.01, "learning_rate": 9.077809798270895e-06, "loss": 24.0085, "step": 1260 }, { "epoch": 0.01, "learning_rate": 9.14985590778098e-06, "loss": 24.9859, "step": 1270 }, { "epoch": 0.01, "learning_rate": 9.221902017291067e-06, "loss": 25.5182, "step": 1280 }, { "epoch": 0.01, "learning_rate": 9.293948126801153e-06, "loss": 24.6764, "step": 1290 }, { "epoch": 0.01, "learning_rate": 9.36599423631124e-06, "loss": 24.1223, "step": 1300 }, { "epoch": 0.01, "learning_rate": 9.438040345821326e-06, "loss": 25.0583, "step": 1310 }, { "epoch": 0.01, "learning_rate": 9.510086455331413e-06, "loss": 24.8809, "step": 1320 }, { "epoch": 0.01, "learning_rate": 9.5821325648415e-06, "loss": 24.6698, "step": 1330 }, { "epoch": 0.01, "learning_rate": 9.654178674351586e-06, "loss": 25.1736, "step": 1340 }, { "epoch": 0.01, "learning_rate": 9.726224783861671e-06, "loss": 24.0949, "step": 1350 }, { "epoch": 0.01, "learning_rate": 9.798270893371759e-06, "loss": 25.406, "step": 1360 }, { "epoch": 0.01, "learning_rate": 9.870317002881846e-06, "loss": 23.9296, "step": 1370 }, { "epoch": 0.01, "learning_rate": 9.942363112391931e-06, "loss": 24.4972, "step": 1380 }, { "epoch": 0.02, "learning_rate": 1.0014409221902017e-05, "loss": 24.4295, "step": 1390 }, { "epoch": 0.02, "learning_rate": 1.0086455331412104e-05, "loss": 24.6469, "step": 1400 }, { "epoch": 0.02, "learning_rate": 1.015850144092219e-05, "loss": 24.0605, "step": 1410 }, { "epoch": 0.02, "learning_rate": 1.0230547550432277e-05, "loss": 23.8814, "step": 1420 }, { "epoch": 0.02, "learning_rate": 1.0302593659942364e-05, "loss": 24.5173, "step": 1430 }, { "epoch": 0.02, "learning_rate": 1.037463976945245e-05, "loss": 25.0064, "step": 1440 }, { "epoch": 0.02, "learning_rate": 1.0446685878962537e-05, "loss": 24.8376, "step": 1450 }, { "epoch": 0.02, "learning_rate": 1.0518731988472624e-05, "loss": 24.5235, "step": 1460 }, { "epoch": 0.02, "learning_rate": 1.059077809798271e-05, "loss": 24.0377, "step": 1470 }, { "epoch": 0.02, "learning_rate": 1.0662824207492797e-05, "loss": 24.1052, "step": 1480 }, { "epoch": 0.02, "learning_rate": 1.0734870317002883e-05, "loss": 24.0113, "step": 1490 }, { "epoch": 0.02, "learning_rate": 1.080691642651297e-05, "loss": 24.9926, "step": 1500 }, { "epoch": 0.02, "learning_rate": 1.0878962536023057e-05, "loss": 24.5731, "step": 1510 }, { "epoch": 0.02, "learning_rate": 1.0951008645533141e-05, "loss": 24.1713, "step": 1520 }, { "epoch": 0.02, "learning_rate": 1.1023054755043228e-05, "loss": 24.1355, "step": 1530 }, { "epoch": 0.02, "learning_rate": 1.1095100864553314e-05, "loss": 24.2953, "step": 1540 }, { "epoch": 0.02, "learning_rate": 1.1167146974063401e-05, "loss": 24.7342, "step": 1550 }, { "epoch": 0.02, "learning_rate": 1.1239193083573488e-05, "loss": 24.169, "step": 1560 }, { "epoch": 0.02, "learning_rate": 1.1311239193083574e-05, "loss": 24.0786, "step": 1570 }, { "epoch": 0.02, "learning_rate": 1.1383285302593661e-05, "loss": 24.6816, "step": 1580 }, { "epoch": 0.02, "learning_rate": 1.1455331412103747e-05, "loss": 24.1285, "step": 1590 }, { "epoch": 0.02, "learning_rate": 1.1527377521613834e-05, "loss": 24.4567, "step": 1600 }, { "epoch": 0.02, "learning_rate": 1.1599423631123921e-05, "loss": 24.3644, "step": 1610 }, { "epoch": 0.02, "learning_rate": 1.1671469740634007e-05, "loss": 24.4427, "step": 1620 }, { "epoch": 0.02, "learning_rate": 1.1743515850144094e-05, "loss": 24.6232, "step": 1630 }, { "epoch": 0.02, "learning_rate": 1.1815561959654181e-05, "loss": 24.2558, "step": 1640 }, { "epoch": 0.02, "learning_rate": 1.1887608069164267e-05, "loss": 24.2927, "step": 1650 }, { "epoch": 0.02, "learning_rate": 1.1959654178674354e-05, "loss": 24.1733, "step": 1660 }, { "epoch": 0.02, "learning_rate": 1.2031700288184438e-05, "loss": 24.6859, "step": 1670 }, { "epoch": 0.02, "learning_rate": 1.2103746397694525e-05, "loss": 24.8219, "step": 1680 }, { "epoch": 0.02, "learning_rate": 1.217579250720461e-05, "loss": 24.3416, "step": 1690 }, { "epoch": 0.02, "learning_rate": 1.2247838616714698e-05, "loss": 23.8413, "step": 1700 }, { "epoch": 0.02, "learning_rate": 1.2319884726224785e-05, "loss": 24.7674, "step": 1710 }, { "epoch": 0.02, "learning_rate": 1.239193083573487e-05, "loss": 24.1939, "step": 1720 }, { "epoch": 0.02, "learning_rate": 1.2463976945244958e-05, "loss": 24.1799, "step": 1730 }, { "epoch": 0.02, "learning_rate": 1.2536023054755045e-05, "loss": 24.4055, "step": 1740 }, { "epoch": 0.02, "learning_rate": 1.260806916426513e-05, "loss": 23.1332, "step": 1750 }, { "epoch": 0.02, "learning_rate": 1.2680115273775218e-05, "loss": 23.8954, "step": 1760 }, { "epoch": 0.02, "learning_rate": 1.2752161383285303e-05, "loss": 23.8778, "step": 1770 }, { "epoch": 0.02, "learning_rate": 1.282420749279539e-05, "loss": 24.2986, "step": 1780 }, { "epoch": 0.02, "learning_rate": 1.2896253602305478e-05, "loss": 23.9736, "step": 1790 }, { "epoch": 0.02, "learning_rate": 1.2968299711815563e-05, "loss": 24.3441, "step": 1800 }, { "epoch": 0.02, "learning_rate": 1.3040345821325649e-05, "loss": 24.1234, "step": 1810 }, { "epoch": 0.02, "learning_rate": 1.3112391930835735e-05, "loss": 24.8563, "step": 1820 }, { "epoch": 0.02, "learning_rate": 1.3184438040345822e-05, "loss": 23.4756, "step": 1830 }, { "epoch": 0.02, "learning_rate": 1.3256484149855909e-05, "loss": 23.8359, "step": 1840 }, { "epoch": 0.02, "learning_rate": 1.3328530259365995e-05, "loss": 23.3531, "step": 1850 }, { "epoch": 0.02, "learning_rate": 1.3400576368876082e-05, "loss": 23.6364, "step": 1860 }, { "epoch": 0.02, "learning_rate": 1.3472622478386167e-05, "loss": 24.3837, "step": 1870 }, { "epoch": 0.02, "learning_rate": 1.3544668587896255e-05, "loss": 23.8666, "step": 1880 }, { "epoch": 0.02, "learning_rate": 1.3616714697406342e-05, "loss": 24.3507, "step": 1890 }, { "epoch": 0.02, "learning_rate": 1.3688760806916427e-05, "loss": 23.8538, "step": 1900 }, { "epoch": 0.02, "learning_rate": 1.3760806916426515e-05, "loss": 23.6057, "step": 1910 }, { "epoch": 0.02, "learning_rate": 1.3832853025936602e-05, "loss": 24.0122, "step": 1920 }, { "epoch": 0.02, "learning_rate": 1.3904899135446687e-05, "loss": 23.402, "step": 1930 }, { "epoch": 0.02, "learning_rate": 1.3976945244956775e-05, "loss": 22.7755, "step": 1940 }, { "epoch": 0.02, "learning_rate": 1.404899135446686e-05, "loss": 24.2195, "step": 1950 }, { "epoch": 0.02, "learning_rate": 1.4121037463976946e-05, "loss": 24.4893, "step": 1960 }, { "epoch": 0.02, "learning_rate": 1.4193083573487031e-05, "loss": 24.4069, "step": 1970 }, { "epoch": 0.02, "learning_rate": 1.4265129682997119e-05, "loss": 23.5268, "step": 1980 }, { "epoch": 0.02, "learning_rate": 1.4337175792507206e-05, "loss": 23.8058, "step": 1990 }, { "epoch": 0.02, "learning_rate": 1.4409221902017291e-05, "loss": 23.1635, "step": 2000 }, { "epoch": 0.02, "learning_rate": 1.4481268011527379e-05, "loss": 23.9204, "step": 2010 }, { "epoch": 0.02, "learning_rate": 1.4553314121037466e-05, "loss": 24.2166, "step": 2020 }, { "epoch": 0.02, "learning_rate": 1.4625360230547551e-05, "loss": 24.3209, "step": 2030 }, { "epoch": 0.02, "learning_rate": 1.4697406340057639e-05, "loss": 23.0454, "step": 2040 }, { "epoch": 0.02, "learning_rate": 1.4769452449567724e-05, "loss": 23.9805, "step": 2050 }, { "epoch": 0.02, "learning_rate": 1.4841498559077811e-05, "loss": 23.5839, "step": 2060 }, { "epoch": 0.02, "learning_rate": 1.4913544668587899e-05, "loss": 23.7281, "step": 2070 }, { "epoch": 0.02, "learning_rate": 1.4985590778097984e-05, "loss": 24.0283, "step": 2080 }, { "epoch": 0.02, "learning_rate": 1.5057636887608072e-05, "loss": 23.9452, "step": 2090 }, { "epoch": 0.02, "learning_rate": 1.5129682997118155e-05, "loss": 23.7523, "step": 2100 }, { "epoch": 0.02, "learning_rate": 1.5201729106628243e-05, "loss": 24.3393, "step": 2110 }, { "epoch": 0.02, "learning_rate": 1.527377521613833e-05, "loss": 24.0495, "step": 2120 }, { "epoch": 0.02, "learning_rate": 1.5345821325648415e-05, "loss": 24.4389, "step": 2130 }, { "epoch": 0.02, "learning_rate": 1.54178674351585e-05, "loss": 24.2428, "step": 2140 }, { "epoch": 0.02, "learning_rate": 1.548991354466859e-05, "loss": 23.4263, "step": 2150 }, { "epoch": 0.02, "learning_rate": 1.5561959654178675e-05, "loss": 23.499, "step": 2160 }, { "epoch": 0.02, "learning_rate": 1.563400576368876e-05, "loss": 23.7408, "step": 2170 }, { "epoch": 0.02, "learning_rate": 1.570605187319885e-05, "loss": 24.158, "step": 2180 }, { "epoch": 0.02, "learning_rate": 1.5778097982708936e-05, "loss": 23.8987, "step": 2190 }, { "epoch": 0.02, "learning_rate": 1.585014409221902e-05, "loss": 24.3963, "step": 2200 }, { "epoch": 0.02, "learning_rate": 1.592219020172911e-05, "loss": 23.8468, "step": 2210 }, { "epoch": 0.02, "learning_rate": 1.5994236311239196e-05, "loss": 24.5168, "step": 2220 }, { "epoch": 0.02, "learning_rate": 1.606628242074928e-05, "loss": 24.2562, "step": 2230 }, { "epoch": 0.02, "learning_rate": 1.613832853025937e-05, "loss": 23.8724, "step": 2240 }, { "epoch": 0.02, "learning_rate": 1.6210374639769452e-05, "loss": 23.7856, "step": 2250 }, { "epoch": 0.02, "learning_rate": 1.6282420749279538e-05, "loss": 23.9331, "step": 2260 }, { "epoch": 0.02, "learning_rate": 1.6354466858789627e-05, "loss": 23.9456, "step": 2270 }, { "epoch": 0.02, "learning_rate": 1.6426512968299712e-05, "loss": 23.6608, "step": 2280 }, { "epoch": 0.02, "learning_rate": 1.6498559077809798e-05, "loss": 24.0208, "step": 2290 }, { "epoch": 0.02, "learning_rate": 1.6570605187319887e-05, "loss": 23.0318, "step": 2300 }, { "epoch": 0.02, "learning_rate": 1.6642651296829972e-05, "loss": 23.6424, "step": 2310 }, { "epoch": 0.03, "learning_rate": 1.6714697406340058e-05, "loss": 24.5698, "step": 2320 }, { "epoch": 0.03, "learning_rate": 1.6786743515850147e-05, "loss": 23.8851, "step": 2330 }, { "epoch": 0.03, "learning_rate": 1.6858789625360232e-05, "loss": 23.8498, "step": 2340 }, { "epoch": 0.03, "learning_rate": 1.6930835734870318e-05, "loss": 23.4063, "step": 2350 }, { "epoch": 0.03, "learning_rate": 1.7002881844380407e-05, "loss": 23.724, "step": 2360 }, { "epoch": 0.03, "learning_rate": 1.7074927953890492e-05, "loss": 23.4106, "step": 2370 }, { "epoch": 0.03, "learning_rate": 1.7146974063400578e-05, "loss": 24.2054, "step": 2380 }, { "epoch": 0.03, "learning_rate": 1.7219020172910663e-05, "loss": 23.1836, "step": 2390 }, { "epoch": 0.03, "learning_rate": 1.729106628242075e-05, "loss": 23.7821, "step": 2400 }, { "epoch": 0.03, "learning_rate": 1.7363112391930838e-05, "loss": 24.0888, "step": 2410 }, { "epoch": 0.03, "learning_rate": 1.7435158501440924e-05, "loss": 23.4072, "step": 2420 }, { "epoch": 0.03, "learning_rate": 1.750720461095101e-05, "loss": 23.5795, "step": 2430 }, { "epoch": 0.03, "learning_rate": 1.7579250720461095e-05, "loss": 23.2243, "step": 2440 }, { "epoch": 0.03, "learning_rate": 1.7651296829971184e-05, "loss": 23.008, "step": 2450 }, { "epoch": 0.03, "learning_rate": 1.772334293948127e-05, "loss": 23.6165, "step": 2460 }, { "epoch": 0.03, "learning_rate": 1.7795389048991355e-05, "loss": 23.6785, "step": 2470 }, { "epoch": 0.03, "learning_rate": 1.7867435158501444e-05, "loss": 23.4426, "step": 2480 }, { "epoch": 0.03, "learning_rate": 1.793948126801153e-05, "loss": 23.0971, "step": 2490 }, { "epoch": 0.03, "learning_rate": 1.8011527377521615e-05, "loss": 23.6063, "step": 2500 }, { "epoch": 0.03, "learning_rate": 1.8083573487031704e-05, "loss": 23.9692, "step": 2510 }, { "epoch": 0.03, "learning_rate": 1.815561959654179e-05, "loss": 24.1209, "step": 2520 }, { "epoch": 0.03, "learning_rate": 1.8227665706051875e-05, "loss": 23.6899, "step": 2530 }, { "epoch": 0.03, "learning_rate": 1.829971181556196e-05, "loss": 23.6814, "step": 2540 }, { "epoch": 0.03, "learning_rate": 1.8371757925072046e-05, "loss": 23.1915, "step": 2550 }, { "epoch": 0.03, "learning_rate": 1.8443804034582135e-05, "loss": 23.3122, "step": 2560 }, { "epoch": 0.03, "learning_rate": 1.851585014409222e-05, "loss": 23.4673, "step": 2570 }, { "epoch": 0.03, "learning_rate": 1.8587896253602306e-05, "loss": 23.2601, "step": 2580 }, { "epoch": 0.03, "learning_rate": 1.8659942363112395e-05, "loss": 23.3742, "step": 2590 }, { "epoch": 0.03, "learning_rate": 1.873198847262248e-05, "loss": 24.074, "step": 2600 }, { "epoch": 0.03, "learning_rate": 1.8804034582132566e-05, "loss": 23.2797, "step": 2610 }, { "epoch": 0.03, "learning_rate": 1.887608069164265e-05, "loss": 24.7054, "step": 2620 }, { "epoch": 0.03, "learning_rate": 1.894812680115274e-05, "loss": 23.6886, "step": 2630 }, { "epoch": 0.03, "learning_rate": 1.9020172910662826e-05, "loss": 23.4811, "step": 2640 }, { "epoch": 0.03, "learning_rate": 1.909221902017291e-05, "loss": 23.3659, "step": 2650 }, { "epoch": 0.03, "learning_rate": 1.9164265129683e-05, "loss": 23.2814, "step": 2660 }, { "epoch": 0.03, "learning_rate": 1.9236311239193086e-05, "loss": 23.0724, "step": 2670 }, { "epoch": 0.03, "learning_rate": 1.930835734870317e-05, "loss": 23.4088, "step": 2680 }, { "epoch": 0.03, "learning_rate": 1.9380403458213257e-05, "loss": 23.6146, "step": 2690 }, { "epoch": 0.03, "learning_rate": 1.9452449567723343e-05, "loss": 23.4213, "step": 2700 }, { "epoch": 0.03, "learning_rate": 1.952449567723343e-05, "loss": 22.5163, "step": 2710 }, { "epoch": 0.03, "learning_rate": 1.9596541786743517e-05, "loss": 23.9956, "step": 2720 }, { "epoch": 0.03, "learning_rate": 1.9668587896253603e-05, "loss": 23.5393, "step": 2730 }, { "epoch": 0.03, "learning_rate": 1.974063400576369e-05, "loss": 23.5978, "step": 2740 }, { "epoch": 0.03, "learning_rate": 1.9812680115273777e-05, "loss": 24.1504, "step": 2750 }, { "epoch": 0.03, "learning_rate": 1.9884726224783863e-05, "loss": 23.1519, "step": 2760 }, { "epoch": 0.03, "learning_rate": 1.995677233429395e-05, "loss": 22.8054, "step": 2770 }, { "epoch": 0.03, "learning_rate": 1.999999990192399e-05, "loss": 24.1455, "step": 2780 }, { "epoch": 0.03, "learning_rate": 1.999999879856888e-05, "loss": 23.7068, "step": 2790 }, { "epoch": 0.03, "learning_rate": 1.9999996469263775e-05, "loss": 22.9734, "step": 2800 }, { "epoch": 0.03, "learning_rate": 1.9999992914008967e-05, "loss": 23.3376, "step": 2810 }, { "epoch": 0.03, "learning_rate": 1.9999988132804892e-05, "loss": 23.6753, "step": 2820 }, { "epoch": 0.03, "learning_rate": 1.999998212565213e-05, "loss": 23.4004, "step": 2830 }, { "epoch": 0.03, "learning_rate": 1.999997489255142e-05, "loss": 23.7849, "step": 2840 }, { "epoch": 0.03, "learning_rate": 1.999996643350365e-05, "loss": 23.0225, "step": 2850 }, { "epoch": 0.03, "learning_rate": 1.999995674850986e-05, "loss": 23.7763, "step": 2860 }, { "epoch": 0.03, "learning_rate": 1.9999945837571235e-05, "loss": 23.4875, "step": 2870 }, { "epoch": 0.03, "learning_rate": 1.999993370068911e-05, "loss": 23.3275, "step": 2880 }, { "epoch": 0.03, "learning_rate": 1.9999920337864976e-05, "loss": 23.8817, "step": 2890 }, { "epoch": 0.03, "learning_rate": 1.9999905749100467e-05, "loss": 23.6653, "step": 2900 }, { "epoch": 0.03, "learning_rate": 1.9999889934397373e-05, "loss": 23.1983, "step": 2910 }, { "epoch": 0.03, "learning_rate": 1.999987289375764e-05, "loss": 23.6002, "step": 2920 }, { "epoch": 0.03, "learning_rate": 1.999985462718335e-05, "loss": 23.0934, "step": 2930 }, { "epoch": 0.03, "learning_rate": 1.999983513467674e-05, "loss": 23.4912, "step": 2940 }, { "epoch": 0.03, "learning_rate": 1.9999814416240206e-05, "loss": 23.4084, "step": 2950 }, { "epoch": 0.03, "learning_rate": 1.9999792471876284e-05, "loss": 23.2838, "step": 2960 }, { "epoch": 0.03, "learning_rate": 1.999976930158767e-05, "loss": 23.8423, "step": 2970 }, { "epoch": 0.03, "learning_rate": 1.9999744905377195e-05, "loss": 23.6738, "step": 2980 }, { "epoch": 0.03, "learning_rate": 1.9999719283247858e-05, "loss": 23.6689, "step": 2990 }, { "epoch": 0.03, "learning_rate": 1.9999692435202797e-05, "loss": 23.3334, "step": 3000 }, { "epoch": 0.03, "learning_rate": 1.99996643612453e-05, "loss": 22.9461, "step": 3010 }, { "epoch": 0.03, "learning_rate": 1.9999635061378816e-05, "loss": 22.4148, "step": 3020 }, { "epoch": 0.03, "learning_rate": 1.9999604535606934e-05, "loss": 23.7635, "step": 3030 }, { "epoch": 0.03, "learning_rate": 1.9999572783933398e-05, "loss": 23.0397, "step": 3040 }, { "epoch": 0.03, "learning_rate": 1.9999539806362095e-05, "loss": 24.0576, "step": 3050 }, { "epoch": 0.03, "learning_rate": 1.999950560289707e-05, "loss": 23.8885, "step": 3060 }, { "epoch": 0.03, "learning_rate": 1.9999470173542518e-05, "loss": 23.7561, "step": 3070 }, { "epoch": 0.03, "learning_rate": 1.999943351830278e-05, "loss": 23.5078, "step": 3080 }, { "epoch": 0.03, "learning_rate": 1.9999395637182357e-05, "loss": 22.983, "step": 3090 }, { "epoch": 0.03, "learning_rate": 1.9999356530185884e-05, "loss": 23.3123, "step": 3100 }, { "epoch": 0.03, "learning_rate": 1.999931619731816e-05, "loss": 24.043, "step": 3110 }, { "epoch": 0.03, "learning_rate": 1.9999274638584128e-05, "loss": 23.4319, "step": 3120 }, { "epoch": 0.03, "learning_rate": 1.9999231853988885e-05, "loss": 23.4853, "step": 3130 }, { "epoch": 0.03, "learning_rate": 1.9999187843537674e-05, "loss": 23.0404, "step": 3140 }, { "epoch": 0.03, "learning_rate": 1.999914260723589e-05, "loss": 24.0672, "step": 3150 }, { "epoch": 0.03, "learning_rate": 1.9999096145089082e-05, "loss": 23.7692, "step": 3160 }, { "epoch": 0.03, "learning_rate": 1.999904845710294e-05, "loss": 22.9394, "step": 3170 }, { "epoch": 0.03, "learning_rate": 1.9998999543283317e-05, "loss": 23.4395, "step": 3180 }, { "epoch": 0.03, "learning_rate": 1.9998949403636207e-05, "loss": 23.0396, "step": 3190 }, { "epoch": 0.03, "learning_rate": 1.9998898038167756e-05, "loss": 24.0323, "step": 3200 }, { "epoch": 0.03, "learning_rate": 1.999884544688426e-05, "loss": 23.8503, "step": 3210 }, { "epoch": 0.03, "learning_rate": 1.9998791629792172e-05, "loss": 23.4083, "step": 3220 }, { "epoch": 0.03, "learning_rate": 1.999873658689808e-05, "loss": 23.436, "step": 3230 }, { "epoch": 0.04, "learning_rate": 1.9998680318208744e-05, "loss": 22.5681, "step": 3240 }, { "epoch": 0.04, "learning_rate": 1.9998622823731056e-05, "loss": 23.8742, "step": 3250 }, { "epoch": 0.04, "learning_rate": 1.999856410347206e-05, "loss": 24.3248, "step": 3260 }, { "epoch": 0.04, "learning_rate": 1.9998504157438962e-05, "loss": 23.3768, "step": 3270 }, { "epoch": 0.04, "learning_rate": 1.999844298563911e-05, "loss": 22.5053, "step": 3280 }, { "epoch": 0.04, "learning_rate": 1.9998380588080003e-05, "loss": 23.9692, "step": 3290 }, { "epoch": 0.04, "learning_rate": 1.9998316964769285e-05, "loss": 22.581, "step": 3300 }, { "epoch": 0.04, "learning_rate": 1.9998252115714763e-05, "loss": 23.1311, "step": 3310 }, { "epoch": 0.04, "learning_rate": 1.9998186040924386e-05, "loss": 23.0084, "step": 3320 }, { "epoch": 0.04, "learning_rate": 1.999811874040625e-05, "loss": 23.8092, "step": 3330 }, { "epoch": 0.04, "learning_rate": 1.9998050214168612e-05, "loss": 24.9683, "step": 3340 }, { "epoch": 0.04, "learning_rate": 1.9997980462219868e-05, "loss": 22.7675, "step": 3350 }, { "epoch": 0.04, "learning_rate": 1.999790948456857e-05, "loss": 23.3315, "step": 3360 }, { "epoch": 0.04, "learning_rate": 1.9997837281223424e-05, "loss": 23.2976, "step": 3370 }, { "epoch": 0.04, "learning_rate": 1.9997763852193274e-05, "loss": 22.7865, "step": 3380 }, { "epoch": 0.04, "learning_rate": 1.9997689197487127e-05, "loss": 22.6399, "step": 3390 }, { "epoch": 0.04, "learning_rate": 1.9997613317114138e-05, "loss": 23.3145, "step": 3400 }, { "epoch": 0.04, "learning_rate": 1.9997536211083607e-05, "loss": 23.2507, "step": 3410 }, { "epoch": 0.04, "learning_rate": 1.9997457879404983e-05, "loss": 23.4962, "step": 3420 }, { "epoch": 0.04, "learning_rate": 1.9997378322087872e-05, "loss": 23.5404, "step": 3430 }, { "epoch": 0.04, "learning_rate": 1.9997297539142025e-05, "loss": 23.1175, "step": 3440 }, { "epoch": 0.04, "learning_rate": 1.9997215530577355e-05, "loss": 23.1048, "step": 3450 }, { "epoch": 0.04, "learning_rate": 1.9997132296403902e-05, "loss": 23.4079, "step": 3460 }, { "epoch": 0.04, "learning_rate": 1.999704783663188e-05, "loss": 22.6693, "step": 3470 }, { "epoch": 0.04, "learning_rate": 1.9996962151271642e-05, "loss": 23.1111, "step": 3480 }, { "epoch": 0.04, "learning_rate": 1.999687524033369e-05, "loss": 23.0769, "step": 3490 }, { "epoch": 0.04, "learning_rate": 1.9996787103828678e-05, "loss": 22.7996, "step": 3500 }, { "epoch": 0.04, "learning_rate": 1.9996697741767412e-05, "loss": 23.4002, "step": 3510 }, { "epoch": 0.04, "learning_rate": 1.999660715416085e-05, "loss": 22.7146, "step": 3520 }, { "epoch": 0.04, "learning_rate": 1.9996515341020095e-05, "loss": 22.9093, "step": 3530 }, { "epoch": 0.04, "learning_rate": 1.9996422302356404e-05, "loss": 23.1059, "step": 3540 }, { "epoch": 0.04, "learning_rate": 1.9996328038181183e-05, "loss": 23.4788, "step": 3550 }, { "epoch": 0.04, "learning_rate": 1.9996232548505988e-05, "loss": 23.2708, "step": 3560 }, { "epoch": 0.04, "learning_rate": 1.9996135833342525e-05, "loss": 23.0164, "step": 3570 }, { "epoch": 0.04, "learning_rate": 1.999603789270265e-05, "loss": 23.7824, "step": 3580 }, { "epoch": 0.04, "learning_rate": 1.9995938726598374e-05, "loss": 23.2301, "step": 3590 }, { "epoch": 0.04, "learning_rate": 1.999583833504185e-05, "loss": 22.4213, "step": 3600 }, { "epoch": 0.04, "learning_rate": 1.999573671804539e-05, "loss": 23.216, "step": 3610 }, { "epoch": 0.04, "learning_rate": 1.9995633875621447e-05, "loss": 23.2294, "step": 3620 }, { "epoch": 0.04, "learning_rate": 1.9995529807782628e-05, "loss": 22.6359, "step": 3630 }, { "epoch": 0.04, "learning_rate": 1.9995424514541698e-05, "loss": 23.3712, "step": 3640 }, { "epoch": 0.04, "learning_rate": 1.999531799591156e-05, "loss": 23.6198, "step": 3650 }, { "epoch": 0.04, "learning_rate": 1.9995210251905273e-05, "loss": 23.1176, "step": 3660 }, { "epoch": 0.04, "learning_rate": 1.9995101282536046e-05, "loss": 23.3428, "step": 3670 }, { "epoch": 0.04, "learning_rate": 1.9994991087817245e-05, "loss": 23.0174, "step": 3680 }, { "epoch": 0.04, "learning_rate": 1.9994879667762368e-05, "loss": 23.1881, "step": 3690 }, { "epoch": 0.04, "learning_rate": 1.9994767022385082e-05, "loss": 22.6289, "step": 3700 }, { "epoch": 0.04, "learning_rate": 1.9994653151699195e-05, "loss": 22.7081, "step": 3710 }, { "epoch": 0.04, "learning_rate": 1.9994538055718668e-05, "loss": 23.28, "step": 3720 }, { "epoch": 0.04, "learning_rate": 1.9994421734457607e-05, "loss": 23.5222, "step": 3730 }, { "epoch": 0.04, "learning_rate": 1.9994304187930272e-05, "loss": 23.8568, "step": 3740 }, { "epoch": 0.04, "learning_rate": 1.9994185416151083e-05, "loss": 24.071, "step": 3750 }, { "epoch": 0.04, "learning_rate": 1.9994065419134592e-05, "loss": 23.5641, "step": 3760 }, { "epoch": 0.04, "learning_rate": 1.9993944196895514e-05, "loss": 23.4622, "step": 3770 }, { "epoch": 0.04, "learning_rate": 1.999382174944871e-05, "loss": 22.8073, "step": 3780 }, { "epoch": 0.04, "learning_rate": 1.999369807680919e-05, "loss": 22.6733, "step": 3790 }, { "epoch": 0.04, "learning_rate": 1.9993573178992113e-05, "loss": 23.1542, "step": 3800 }, { "epoch": 0.04, "learning_rate": 1.9993447056012797e-05, "loss": 23.7904, "step": 3810 }, { "epoch": 0.04, "learning_rate": 1.9993319707886704e-05, "loss": 22.9512, "step": 3820 }, { "epoch": 0.04, "learning_rate": 1.999319113462944e-05, "loss": 22.8647, "step": 3830 }, { "epoch": 0.04, "learning_rate": 1.9993061336256766e-05, "loss": 23.3025, "step": 3840 }, { "epoch": 0.04, "learning_rate": 1.9992930312784607e-05, "loss": 22.6696, "step": 3850 }, { "epoch": 0.04, "learning_rate": 1.9992798064229015e-05, "loss": 22.6776, "step": 3860 }, { "epoch": 0.04, "learning_rate": 1.99926645906062e-05, "loss": 22.9946, "step": 3870 }, { "epoch": 0.04, "learning_rate": 1.9992529891932542e-05, "loss": 22.7207, "step": 3880 }, { "epoch": 0.04, "learning_rate": 1.999239396822454e-05, "loss": 23.1151, "step": 3890 }, { "epoch": 0.04, "learning_rate": 1.9992256819498862e-05, "loss": 23.4824, "step": 3900 }, { "epoch": 0.04, "learning_rate": 1.9992118445772316e-05, "loss": 23.2746, "step": 3910 }, { "epoch": 0.04, "learning_rate": 1.9991978847061876e-05, "loss": 23.3912, "step": 3920 }, { "epoch": 0.04, "learning_rate": 1.999183802338465e-05, "loss": 23.5626, "step": 3930 }, { "epoch": 0.04, "learning_rate": 1.9991695974757906e-05, "loss": 23.2177, "step": 3940 }, { "epoch": 0.04, "learning_rate": 1.9991552701199053e-05, "loss": 23.1728, "step": 3950 }, { "epoch": 0.04, "learning_rate": 1.999140820272566e-05, "loss": 22.736, "step": 3960 }, { "epoch": 0.04, "learning_rate": 1.999126247935544e-05, "loss": 23.7334, "step": 3970 }, { "epoch": 0.04, "learning_rate": 1.9991115531106253e-05, "loss": 22.7125, "step": 3980 }, { "epoch": 0.04, "learning_rate": 1.9990967357996122e-05, "loss": 22.5268, "step": 3990 }, { "epoch": 0.04, "learning_rate": 1.999081796004321e-05, "loss": 22.9913, "step": 4000 }, { "epoch": 0.04, "learning_rate": 1.9990667337265837e-05, "loss": 22.552, "step": 4010 }, { "epoch": 0.04, "learning_rate": 1.9990515489682458e-05, "loss": 23.094, "step": 4020 }, { "epoch": 0.04, "learning_rate": 1.9990362417311697e-05, "loss": 22.8053, "step": 4030 }, { "epoch": 0.04, "learning_rate": 1.9990208120172317e-05, "loss": 22.6895, "step": 4040 }, { "epoch": 0.04, "learning_rate": 1.9990052598283232e-05, "loss": 22.6651, "step": 4050 }, { "epoch": 0.04, "learning_rate": 1.9989895851663513e-05, "loss": 23.6961, "step": 4060 }, { "epoch": 0.04, "learning_rate": 1.9989737880332378e-05, "loss": 22.3778, "step": 4070 }, { "epoch": 0.04, "learning_rate": 1.9989578684309182e-05, "loss": 23.8524, "step": 4080 }, { "epoch": 0.04, "learning_rate": 1.9989418263613456e-05, "loss": 22.6364, "step": 4090 }, { "epoch": 0.04, "learning_rate": 1.9989256618264857e-05, "loss": 22.6428, "step": 4100 }, { "epoch": 0.04, "learning_rate": 1.9989093748283202e-05, "loss": 23.3724, "step": 4110 }, { "epoch": 0.04, "learning_rate": 1.9988929653688465e-05, "loss": 22.3722, "step": 4120 }, { "epoch": 0.04, "learning_rate": 1.9988764334500757e-05, "loss": 23.2526, "step": 4130 }, { "epoch": 0.04, "learning_rate": 1.9988597790740346e-05, "loss": 23.3811, "step": 4140 }, { "epoch": 0.04, "learning_rate": 1.9988430022427652e-05, "loss": 23.6332, "step": 4150 }, { "epoch": 0.04, "learning_rate": 1.998826102958324e-05, "loss": 23.9196, "step": 4160 }, { "epoch": 0.05, "learning_rate": 1.998809081222783e-05, "loss": 23.2708, "step": 4170 }, { "epoch": 0.05, "learning_rate": 1.998791937038229e-05, "loss": 23.9487, "step": 4180 }, { "epoch": 0.05, "learning_rate": 1.9987746704067637e-05, "loss": 22.6714, "step": 4190 }, { "epoch": 0.05, "learning_rate": 1.998757281330504e-05, "loss": 22.8097, "step": 4200 }, { "epoch": 0.05, "learning_rate": 1.998739769811581e-05, "loss": 23.505, "step": 4210 }, { "epoch": 0.05, "learning_rate": 1.9987221358521425e-05, "loss": 23.692, "step": 4220 }, { "epoch": 0.05, "learning_rate": 1.99870437945435e-05, "loss": 22.5914, "step": 4230 }, { "epoch": 0.05, "learning_rate": 1.9986865006203802e-05, "loss": 22.7768, "step": 4240 }, { "epoch": 0.05, "learning_rate": 1.9986684993524252e-05, "loss": 22.2718, "step": 4250 }, { "epoch": 0.05, "learning_rate": 1.9986503756526915e-05, "loss": 23.1815, "step": 4260 }, { "epoch": 0.05, "learning_rate": 1.998632129523401e-05, "loss": 23.4093, "step": 4270 }, { "epoch": 0.05, "learning_rate": 1.9986137609667915e-05, "loss": 22.8384, "step": 4280 }, { "epoch": 0.05, "learning_rate": 1.9985952699851137e-05, "loss": 22.9612, "step": 4290 }, { "epoch": 0.05, "learning_rate": 1.998576656580635e-05, "loss": 22.5312, "step": 4300 }, { "epoch": 0.05, "learning_rate": 1.9985579207556374e-05, "loss": 22.9832, "step": 4310 }, { "epoch": 0.05, "learning_rate": 1.9985390625124175e-05, "loss": 22.7408, "step": 4320 }, { "epoch": 0.05, "learning_rate": 1.9985200818532873e-05, "loss": 22.2013, "step": 4330 }, { "epoch": 0.05, "learning_rate": 1.9985009787805744e-05, "loss": 22.9995, "step": 4340 }, { "epoch": 0.05, "learning_rate": 1.9984817532966197e-05, "loss": 22.9388, "step": 4350 }, { "epoch": 0.05, "learning_rate": 1.998462405403781e-05, "loss": 22.5072, "step": 4360 }, { "epoch": 0.05, "learning_rate": 1.9984429351044298e-05, "loss": 22.4785, "step": 4370 }, { "epoch": 0.05, "learning_rate": 1.998423342400953e-05, "loss": 23.0037, "step": 4380 }, { "epoch": 0.05, "learning_rate": 1.9984036272957528e-05, "loss": 22.9426, "step": 4390 }, { "epoch": 0.05, "learning_rate": 1.9983837897912463e-05, "loss": 23.0697, "step": 4400 }, { "epoch": 0.05, "learning_rate": 1.9983638298898652e-05, "loss": 22.6722, "step": 4410 }, { "epoch": 0.05, "learning_rate": 1.9983437475940566e-05, "loss": 22.677, "step": 4420 }, { "epoch": 0.05, "learning_rate": 1.9983235429062823e-05, "loss": 23.0484, "step": 4430 }, { "epoch": 0.05, "learning_rate": 1.9983032158290196e-05, "loss": 23.3695, "step": 4440 }, { "epoch": 0.05, "learning_rate": 1.9982827663647605e-05, "loss": 22.9834, "step": 4450 }, { "epoch": 0.05, "learning_rate": 1.9982621945160113e-05, "loss": 22.8521, "step": 4460 }, { "epoch": 0.05, "learning_rate": 1.9982415002852954e-05, "loss": 23.5219, "step": 4470 }, { "epoch": 0.05, "learning_rate": 1.9982206836751485e-05, "loss": 23.2897, "step": 4480 }, { "epoch": 0.05, "learning_rate": 1.9981997446881228e-05, "loss": 22.9464, "step": 4490 }, { "epoch": 0.05, "learning_rate": 1.998178683326786e-05, "loss": 23.4142, "step": 4500 }, { "epoch": 0.05, "learning_rate": 1.9981574995937197e-05, "loss": 23.6156, "step": 4510 }, { "epoch": 0.05, "learning_rate": 1.998136193491521e-05, "loss": 22.7497, "step": 4520 }, { "epoch": 0.05, "learning_rate": 1.9981147650228016e-05, "loss": 22.8336, "step": 4530 }, { "epoch": 0.05, "learning_rate": 1.9980932141901886e-05, "loss": 22.865, "step": 4540 }, { "epoch": 0.05, "learning_rate": 1.9980715409963246e-05, "loss": 22.6739, "step": 4550 }, { "epoch": 0.05, "learning_rate": 1.9980497454438663e-05, "loss": 22.7609, "step": 4560 }, { "epoch": 0.05, "learning_rate": 1.9980278275354855e-05, "loss": 23.192, "step": 4570 }, { "epoch": 0.05, "learning_rate": 1.9980057872738694e-05, "loss": 22.102, "step": 4580 }, { "epoch": 0.05, "learning_rate": 1.99798362466172e-05, "loss": 23.3057, "step": 4590 }, { "epoch": 0.05, "learning_rate": 1.9979613397017546e-05, "loss": 23.1354, "step": 4600 }, { "epoch": 0.05, "learning_rate": 1.9979389323967047e-05, "loss": 22.5115, "step": 4610 }, { "epoch": 0.05, "learning_rate": 1.9979164027493177e-05, "loss": 23.3927, "step": 4620 }, { "epoch": 0.05, "learning_rate": 1.9978937507623553e-05, "loss": 22.6488, "step": 4630 }, { "epoch": 0.05, "learning_rate": 1.9978709764385947e-05, "loss": 22.8063, "step": 4640 }, { "epoch": 0.05, "learning_rate": 1.9978480797808282e-05, "loss": 23.3071, "step": 4650 }, { "epoch": 0.05, "learning_rate": 1.9978250607918624e-05, "loss": 23.6343, "step": 4660 }, { "epoch": 0.05, "learning_rate": 1.9978019194745197e-05, "loss": 22.2536, "step": 4670 }, { "epoch": 0.05, "learning_rate": 1.997778655831637e-05, "loss": 24.0055, "step": 4680 }, { "epoch": 0.05, "learning_rate": 1.9977552698660658e-05, "loss": 22.5085, "step": 4690 }, { "epoch": 0.05, "learning_rate": 1.9977317615806738e-05, "loss": 21.8136, "step": 4700 }, { "epoch": 0.05, "learning_rate": 1.9977081309783425e-05, "loss": 22.5816, "step": 4710 }, { "epoch": 0.05, "learning_rate": 1.9976843780619692e-05, "loss": 21.9018, "step": 4720 }, { "epoch": 0.05, "learning_rate": 1.9976605028344655e-05, "loss": 23.3509, "step": 4730 }, { "epoch": 0.05, "learning_rate": 1.997636505298759e-05, "loss": 22.0944, "step": 4740 }, { "epoch": 0.05, "learning_rate": 1.997612385457791e-05, "loss": 22.8603, "step": 4750 }, { "epoch": 0.05, "learning_rate": 1.997588143314519e-05, "loss": 23.2222, "step": 4760 }, { "epoch": 0.05, "learning_rate": 1.997563778871915e-05, "loss": 23.0413, "step": 4770 }, { "epoch": 0.05, "learning_rate": 1.9975392921329656e-05, "loss": 22.7477, "step": 4780 }, { "epoch": 0.05, "learning_rate": 1.997514683100673e-05, "loss": 23.1867, "step": 4790 }, { "epoch": 0.05, "learning_rate": 1.9974899517780536e-05, "loss": 22.5147, "step": 4800 }, { "epoch": 0.05, "learning_rate": 1.99746509816814e-05, "loss": 22.7036, "step": 4810 }, { "epoch": 0.05, "learning_rate": 1.997440122273979e-05, "loss": 22.6762, "step": 4820 }, { "epoch": 0.05, "learning_rate": 1.9974150240986324e-05, "loss": 23.1902, "step": 4830 }, { "epoch": 0.05, "learning_rate": 1.9973898036451775e-05, "loss": 22.755, "step": 4840 }, { "epoch": 0.05, "learning_rate": 1.9973644609167053e-05, "loss": 22.4434, "step": 4850 }, { "epoch": 0.05, "learning_rate": 1.9973389959163234e-05, "loss": 22.4561, "step": 4860 }, { "epoch": 0.05, "learning_rate": 1.9973134086471534e-05, "loss": 22.4479, "step": 4870 }, { "epoch": 0.05, "learning_rate": 1.9972876991123322e-05, "loss": 22.2112, "step": 4880 }, { "epoch": 0.05, "learning_rate": 1.997261867315012e-05, "loss": 23.3283, "step": 4890 }, { "epoch": 0.05, "learning_rate": 1.9972359132583594e-05, "loss": 21.9255, "step": 4900 }, { "epoch": 0.05, "learning_rate": 1.997209836945556e-05, "loss": 22.6726, "step": 4910 }, { "epoch": 0.05, "learning_rate": 1.997183638379799e-05, "loss": 22.6462, "step": 4920 }, { "epoch": 0.05, "learning_rate": 1.9971573175643e-05, "loss": 23.4261, "step": 4930 }, { "epoch": 0.05, "learning_rate": 1.997130874502286e-05, "loss": 22.9856, "step": 4940 }, { "epoch": 0.05, "learning_rate": 1.9971043091969987e-05, "loss": 22.4863, "step": 4950 }, { "epoch": 0.05, "learning_rate": 1.997077621651695e-05, "loss": 24.1642, "step": 4960 }, { "epoch": 0.05, "learning_rate": 1.997050811869646e-05, "loss": 22.8106, "step": 4970 }, { "epoch": 0.05, "learning_rate": 1.997023879854139e-05, "loss": 22.3176, "step": 4980 }, { "epoch": 0.05, "learning_rate": 1.996996825608476e-05, "loss": 22.2527, "step": 4990 }, { "epoch": 0.05, "learning_rate": 1.9969696491359732e-05, "loss": 23.1285, "step": 5000 }, { "epoch": 0.05, "learning_rate": 1.9969423504399625e-05, "loss": 22.9666, "step": 5010 }, { "epoch": 0.05, "learning_rate": 1.9969149295237903e-05, "loss": 22.9205, "step": 5020 }, { "epoch": 0.05, "learning_rate": 1.9968873863908192e-05, "loss": 22.9765, "step": 5030 }, { "epoch": 0.05, "learning_rate": 1.9968597210444244e-05, "loss": 22.9401, "step": 5040 }, { "epoch": 0.05, "learning_rate": 1.996831933487999e-05, "loss": 22.54, "step": 5050 }, { "epoch": 0.05, "learning_rate": 1.9968040237249485e-05, "loss": 22.8458, "step": 5060 }, { "epoch": 0.05, "learning_rate": 1.9967759917586953e-05, "loss": 22.3054, "step": 5070 }, { "epoch": 0.05, "learning_rate": 1.9967478375926752e-05, "loss": 23.3615, "step": 5080 }, { "epoch": 0.06, "learning_rate": 1.9967195612303404e-05, "loss": 22.7512, "step": 5090 }, { "epoch": 0.06, "learning_rate": 1.9966911626751574e-05, "loss": 23.4175, "step": 5100 }, { "epoch": 0.06, "learning_rate": 1.996662641930607e-05, "loss": 23.0259, "step": 5110 }, { "epoch": 0.06, "learning_rate": 1.9966339990001865e-05, "loss": 22.7915, "step": 5120 }, { "epoch": 0.06, "learning_rate": 1.996605233887407e-05, "loss": 22.4058, "step": 5130 }, { "epoch": 0.06, "learning_rate": 1.9965763465957954e-05, "loss": 23.3641, "step": 5140 }, { "epoch": 0.06, "learning_rate": 1.9965473371288927e-05, "loss": 21.963, "step": 5150 }, { "epoch": 0.06, "learning_rate": 1.9965182054902555e-05, "loss": 22.2421, "step": 5160 }, { "epoch": 0.06, "learning_rate": 1.996488951683455e-05, "loss": 22.7186, "step": 5170 }, { "epoch": 0.06, "learning_rate": 1.9964595757120774e-05, "loss": 22.9108, "step": 5180 }, { "epoch": 0.06, "learning_rate": 1.9964300775797247e-05, "loss": 22.7651, "step": 5190 }, { "epoch": 0.06, "learning_rate": 1.996400457290013e-05, "loss": 22.615, "step": 5200 }, { "epoch": 0.06, "learning_rate": 1.9963707148465732e-05, "loss": 22.6458, "step": 5210 }, { "epoch": 0.06, "learning_rate": 1.996340850253052e-05, "loss": 22.687, "step": 5220 }, { "epoch": 0.06, "learning_rate": 1.99631086351311e-05, "loss": 22.8464, "step": 5230 }, { "epoch": 0.06, "learning_rate": 1.9962807546304247e-05, "loss": 22.4666, "step": 5240 }, { "epoch": 0.06, "learning_rate": 1.996250523608686e-05, "loss": 23.3706, "step": 5250 }, { "epoch": 0.06, "learning_rate": 1.9962201704516008e-05, "loss": 23.401, "step": 5260 }, { "epoch": 0.06, "learning_rate": 1.9961896951628897e-05, "loss": 23.1275, "step": 5270 }, { "epoch": 0.06, "learning_rate": 1.9961590977462897e-05, "loss": 22.9646, "step": 5280 }, { "epoch": 0.06, "learning_rate": 1.996128378205551e-05, "loss": 22.0093, "step": 5290 }, { "epoch": 0.06, "learning_rate": 1.99609753654444e-05, "loss": 21.8558, "step": 5300 }, { "epoch": 0.06, "learning_rate": 1.9960665727667378e-05, "loss": 22.9048, "step": 5310 }, { "epoch": 0.06, "learning_rate": 1.9960354868762402e-05, "loss": 22.334, "step": 5320 }, { "epoch": 0.06, "learning_rate": 1.9960042788767587e-05, "loss": 22.5916, "step": 5330 }, { "epoch": 0.06, "learning_rate": 1.9959729487721185e-05, "loss": 22.7278, "step": 5340 }, { "epoch": 0.06, "learning_rate": 1.995941496566161e-05, "loss": 22.7611, "step": 5350 }, { "epoch": 0.06, "learning_rate": 1.9959099222627422e-05, "loss": 22.3592, "step": 5360 }, { "epoch": 0.06, "learning_rate": 1.9958782258657323e-05, "loss": 22.2867, "step": 5370 }, { "epoch": 0.06, "learning_rate": 1.9958464073790177e-05, "loss": 22.3558, "step": 5380 }, { "epoch": 0.06, "learning_rate": 1.995814466806499e-05, "loss": 23.0664, "step": 5390 }, { "epoch": 0.06, "learning_rate": 1.995782404152092e-05, "loss": 22.3403, "step": 5400 }, { "epoch": 0.06, "learning_rate": 1.9957502194197274e-05, "loss": 23.3688, "step": 5410 }, { "epoch": 0.06, "learning_rate": 1.9957179126133508e-05, "loss": 22.9702, "step": 5420 }, { "epoch": 0.06, "learning_rate": 1.995685483736923e-05, "loss": 22.4875, "step": 5430 }, { "epoch": 0.06, "learning_rate": 1.9956529327944198e-05, "loss": 22.4243, "step": 5440 }, { "epoch": 0.06, "learning_rate": 1.9956202597898314e-05, "loss": 22.9618, "step": 5450 }, { "epoch": 0.06, "learning_rate": 1.995587464727163e-05, "loss": 22.5904, "step": 5460 }, { "epoch": 0.06, "learning_rate": 1.9955545476104364e-05, "loss": 22.7998, "step": 5470 }, { "epoch": 0.06, "learning_rate": 1.9955215084436855e-05, "loss": 22.2374, "step": 5480 }, { "epoch": 0.06, "learning_rate": 1.995488347230962e-05, "loss": 22.5487, "step": 5490 }, { "epoch": 0.06, "learning_rate": 1.9954550639763308e-05, "loss": 23.0267, "step": 5500 }, { "epoch": 0.06, "learning_rate": 1.9954216586838724e-05, "loss": 23.3002, "step": 5510 }, { "epoch": 0.06, "learning_rate": 1.9953881313576815e-05, "loss": 22.7421, "step": 5520 }, { "epoch": 0.06, "learning_rate": 1.9953544820018693e-05, "loss": 22.0801, "step": 5530 }, { "epoch": 0.06, "learning_rate": 1.9953207106205605e-05, "loss": 22.9826, "step": 5540 }, { "epoch": 0.06, "learning_rate": 1.9952868172178955e-05, "loss": 22.54, "step": 5550 }, { "epoch": 0.06, "learning_rate": 1.9952528017980293e-05, "loss": 23.4186, "step": 5560 }, { "epoch": 0.06, "learning_rate": 1.9952186643651318e-05, "loss": 22.2264, "step": 5570 }, { "epoch": 0.06, "learning_rate": 1.995184404923389e-05, "loss": 23.0668, "step": 5580 }, { "epoch": 0.06, "learning_rate": 1.9951500234769998e-05, "loss": 22.4558, "step": 5590 }, { "epoch": 0.06, "learning_rate": 1.99511552003018e-05, "loss": 23.2645, "step": 5600 }, { "epoch": 0.06, "learning_rate": 1.9950808945871593e-05, "loss": 23.8545, "step": 5610 }, { "epoch": 0.06, "learning_rate": 1.9950461471521823e-05, "loss": 22.9281, "step": 5620 }, { "epoch": 0.06, "learning_rate": 1.9950112777295095e-05, "loss": 21.8414, "step": 5630 }, { "epoch": 0.06, "learning_rate": 1.994976286323415e-05, "loss": 22.7098, "step": 5640 }, { "epoch": 0.06, "learning_rate": 1.994941172938189e-05, "loss": 23.351, "step": 5650 }, { "epoch": 0.06, "learning_rate": 1.9949059375781362e-05, "loss": 22.9102, "step": 5660 }, { "epoch": 0.06, "learning_rate": 1.9948705802475766e-05, "loss": 22.2236, "step": 5670 }, { "epoch": 0.06, "learning_rate": 1.994835100950844e-05, "loss": 23.3583, "step": 5680 }, { "epoch": 0.06, "learning_rate": 1.9947994996922884e-05, "loss": 23.6094, "step": 5690 }, { "epoch": 0.06, "learning_rate": 1.9947637764762748e-05, "loss": 22.3137, "step": 5700 }, { "epoch": 0.06, "learning_rate": 1.9947279313071818e-05, "loss": 22.609, "step": 5710 }, { "epoch": 0.06, "learning_rate": 1.9946919641894045e-05, "loss": 22.846, "step": 5720 }, { "epoch": 0.06, "learning_rate": 1.9946558751273523e-05, "loss": 22.6247, "step": 5730 }, { "epoch": 0.06, "learning_rate": 1.9946196641254493e-05, "loss": 23.3639, "step": 5740 }, { "epoch": 0.06, "learning_rate": 1.9945833311881344e-05, "loss": 22.5493, "step": 5750 }, { "epoch": 0.06, "learning_rate": 1.9945468763198627e-05, "loss": 22.8434, "step": 5760 }, { "epoch": 0.06, "learning_rate": 1.9945102995251026e-05, "loss": 21.7272, "step": 5770 }, { "epoch": 0.06, "learning_rate": 1.994473600808339e-05, "loss": 22.0284, "step": 5780 }, { "epoch": 0.06, "learning_rate": 1.99443678017407e-05, "loss": 23.5576, "step": 5790 }, { "epoch": 0.06, "learning_rate": 1.994399837626811e-05, "loss": 21.8763, "step": 5800 }, { "epoch": 0.06, "learning_rate": 1.9943627731710896e-05, "loss": 22.905, "step": 5810 }, { "epoch": 0.06, "learning_rate": 1.9943255868114506e-05, "loss": 22.4359, "step": 5820 }, { "epoch": 0.06, "learning_rate": 1.994288278552452e-05, "loss": 21.8577, "step": 5830 }, { "epoch": 0.06, "learning_rate": 1.9942508483986687e-05, "loss": 22.891, "step": 5840 }, { "epoch": 0.06, "learning_rate": 1.9942132963546887e-05, "loss": 22.5632, "step": 5850 }, { "epoch": 0.06, "learning_rate": 1.994175622425116e-05, "loss": 22.0237, "step": 5860 }, { "epoch": 0.06, "learning_rate": 1.994137826614569e-05, "loss": 22.9202, "step": 5870 }, { "epoch": 0.06, "learning_rate": 1.994099908927681e-05, "loss": 22.8352, "step": 5880 }, { "epoch": 0.06, "learning_rate": 1.9940618693691015e-05, "loss": 22.6329, "step": 5890 }, { "epoch": 0.06, "learning_rate": 1.9940237079434933e-05, "loss": 22.354, "step": 5900 }, { "epoch": 0.06, "learning_rate": 1.993985424655535e-05, "loss": 23.395, "step": 5910 }, { "epoch": 0.06, "learning_rate": 1.9939470195099195e-05, "loss": 22.6675, "step": 5920 }, { "epoch": 0.06, "learning_rate": 1.9939084925113555e-05, "loss": 22.6847, "step": 5930 }, { "epoch": 0.06, "learning_rate": 1.993869843664566e-05, "loss": 22.8449, "step": 5940 }, { "epoch": 0.06, "learning_rate": 1.9938310729742895e-05, "loss": 22.111, "step": 5950 }, { "epoch": 0.06, "learning_rate": 1.993792180445279e-05, "loss": 22.9115, "step": 5960 }, { "epoch": 0.06, "learning_rate": 1.993753166082302e-05, "loss": 22.6392, "step": 5970 }, { "epoch": 0.06, "learning_rate": 1.9937140298901422e-05, "loss": 22.8791, "step": 5980 }, { "epoch": 0.06, "learning_rate": 1.993674771873597e-05, "loss": 22.6394, "step": 5990 }, { "epoch": 0.06, "learning_rate": 1.9936353920374795e-05, "loss": 22.9223, "step": 6000 }, { "epoch": 0.06, "learning_rate": 1.9935958903866173e-05, "loss": 22.4588, "step": 6010 }, { "epoch": 0.07, "learning_rate": 1.993556266925853e-05, "loss": 22.3152, "step": 6020 }, { "epoch": 0.07, "learning_rate": 1.9935165216600446e-05, "loss": 22.8604, "step": 6030 }, { "epoch": 0.07, "learning_rate": 1.9934766545940647e-05, "loss": 22.14, "step": 6040 }, { "epoch": 0.07, "learning_rate": 1.9934366657328006e-05, "loss": 23.2578, "step": 6050 }, { "epoch": 0.07, "learning_rate": 1.9933965550811543e-05, "loss": 22.8557, "step": 6060 }, { "epoch": 0.07, "learning_rate": 1.993356322644044e-05, "loss": 22.6012, "step": 6070 }, { "epoch": 0.07, "learning_rate": 1.9933159684264015e-05, "loss": 22.3504, "step": 6080 }, { "epoch": 0.07, "learning_rate": 1.993275492433174e-05, "loss": 22.2587, "step": 6090 }, { "epoch": 0.07, "learning_rate": 1.9932348946693238e-05, "loss": 22.5058, "step": 6100 }, { "epoch": 0.07, "learning_rate": 1.993194175139828e-05, "loss": 22.0218, "step": 6110 }, { "epoch": 0.07, "learning_rate": 1.9931533338496786e-05, "loss": 22.5369, "step": 6120 }, { "epoch": 0.07, "learning_rate": 1.9931123708038824e-05, "loss": 22.2647, "step": 6130 }, { "epoch": 0.07, "learning_rate": 1.9930712860074614e-05, "loss": 23.5524, "step": 6140 }, { "epoch": 0.07, "learning_rate": 1.993030079465453e-05, "loss": 23.1402, "step": 6150 }, { "epoch": 0.07, "learning_rate": 1.9929887511829072e-05, "loss": 22.3597, "step": 6160 }, { "epoch": 0.07, "learning_rate": 1.9929473011648925e-05, "loss": 22.8036, "step": 6170 }, { "epoch": 0.07, "learning_rate": 1.9929057294164894e-05, "loss": 22.7004, "step": 6180 }, { "epoch": 0.07, "learning_rate": 1.9928640359427945e-05, "loss": 22.8469, "step": 6190 }, { "epoch": 0.07, "learning_rate": 1.9928222207489198e-05, "loss": 22.9678, "step": 6200 }, { "epoch": 0.07, "learning_rate": 1.992780283839991e-05, "loss": 22.8241, "step": 6210 }, { "epoch": 0.07, "learning_rate": 1.9927382252211496e-05, "loss": 22.0811, "step": 6220 }, { "epoch": 0.07, "learning_rate": 1.9926960448975517e-05, "loss": 22.6818, "step": 6230 }, { "epoch": 0.07, "learning_rate": 1.9926537428743684e-05, "loss": 23.5941, "step": 6240 }, { "epoch": 0.07, "learning_rate": 1.9926113191567856e-05, "loss": 22.981, "step": 6250 }, { "epoch": 0.07, "learning_rate": 1.992568773750005e-05, "loss": 22.6202, "step": 6260 }, { "epoch": 0.07, "learning_rate": 1.9925261066592413e-05, "loss": 23.0299, "step": 6270 }, { "epoch": 0.07, "learning_rate": 1.992483317889726e-05, "loss": 22.4094, "step": 6280 }, { "epoch": 0.07, "learning_rate": 1.992440407446705e-05, "loss": 22.1502, "step": 6290 }, { "epoch": 0.07, "learning_rate": 1.9923973753354383e-05, "loss": 22.4092, "step": 6300 }, { "epoch": 0.07, "learning_rate": 1.9923542215612015e-05, "loss": 22.0255, "step": 6310 }, { "epoch": 0.07, "learning_rate": 1.9923109461292853e-05, "loss": 22.5646, "step": 6320 }, { "epoch": 0.07, "learning_rate": 1.992267549044995e-05, "loss": 22.3691, "step": 6330 }, { "epoch": 0.07, "learning_rate": 1.9922240303136507e-05, "loss": 22.097, "step": 6340 }, { "epoch": 0.07, "learning_rate": 1.9921803899405876e-05, "loss": 22.908, "step": 6350 }, { "epoch": 0.07, "learning_rate": 1.992136627931156e-05, "loss": 22.6168, "step": 6360 }, { "epoch": 0.07, "learning_rate": 1.9920927442907207e-05, "loss": 21.7583, "step": 6370 }, { "epoch": 0.07, "learning_rate": 1.992048739024662e-05, "loss": 22.7601, "step": 6380 }, { "epoch": 0.07, "learning_rate": 1.992004612138374e-05, "loss": 21.7482, "step": 6390 }, { "epoch": 0.07, "learning_rate": 1.991960363637267e-05, "loss": 22.5959, "step": 6400 }, { "epoch": 0.07, "learning_rate": 1.9919159935267656e-05, "loss": 22.2549, "step": 6410 }, { "epoch": 0.07, "learning_rate": 1.9918715018123094e-05, "loss": 22.7502, "step": 6420 }, { "epoch": 0.07, "learning_rate": 1.9918268884993526e-05, "loss": 22.2126, "step": 6430 }, { "epoch": 0.07, "learning_rate": 1.9917821535933645e-05, "loss": 22.1471, "step": 6440 }, { "epoch": 0.07, "learning_rate": 1.99173729709983e-05, "loss": 22.2894, "step": 6450 }, { "epoch": 0.07, "learning_rate": 1.9916923190242477e-05, "loss": 22.4435, "step": 6460 }, { "epoch": 0.07, "learning_rate": 1.9916472193721316e-05, "loss": 22.062, "step": 6470 }, { "epoch": 0.07, "learning_rate": 1.991601998149011e-05, "loss": 21.8555, "step": 6480 }, { "epoch": 0.07, "learning_rate": 1.99155665536043e-05, "loss": 22.3092, "step": 6490 }, { "epoch": 0.07, "learning_rate": 1.991511191011947e-05, "loss": 22.7107, "step": 6500 }, { "epoch": 0.07, "learning_rate": 1.9914656051091354e-05, "loss": 22.774, "step": 6510 }, { "epoch": 0.07, "learning_rate": 1.9914198976575846e-05, "loss": 21.9911, "step": 6520 }, { "epoch": 0.07, "learning_rate": 1.9913740686628978e-05, "loss": 21.9927, "step": 6530 }, { "epoch": 0.07, "learning_rate": 1.991328118130693e-05, "loss": 22.5576, "step": 6540 }, { "epoch": 0.07, "learning_rate": 1.9912820460666046e-05, "loss": 22.2702, "step": 6550 }, { "epoch": 0.07, "learning_rate": 1.9912358524762797e-05, "loss": 21.7872, "step": 6560 }, { "epoch": 0.07, "learning_rate": 1.9911895373653817e-05, "loss": 22.6762, "step": 6570 }, { "epoch": 0.07, "learning_rate": 1.9911431007395884e-05, "loss": 22.6476, "step": 6580 }, { "epoch": 0.07, "learning_rate": 1.991096542604593e-05, "loss": 21.2559, "step": 6590 }, { "epoch": 0.07, "learning_rate": 1.9910498629661033e-05, "loss": 22.5836, "step": 6600 }, { "epoch": 0.07, "learning_rate": 1.9910030618298425e-05, "loss": 23.4106, "step": 6610 }, { "epoch": 0.07, "learning_rate": 1.990956139201547e-05, "loss": 21.7695, "step": 6620 }, { "epoch": 0.07, "learning_rate": 1.99090909508697e-05, "loss": 22.1888, "step": 6630 }, { "epoch": 0.07, "learning_rate": 1.9908619294918793e-05, "loss": 22.3342, "step": 6640 }, { "epoch": 0.07, "learning_rate": 1.9908146424220564e-05, "loss": 22.874, "step": 6650 }, { "epoch": 0.07, "learning_rate": 1.9907672338832985e-05, "loss": 22.7846, "step": 6660 }, { "epoch": 0.07, "learning_rate": 1.990719703881418e-05, "loss": 22.3309, "step": 6670 }, { "epoch": 0.07, "learning_rate": 1.9906720524222418e-05, "loss": 22.6872, "step": 6680 }, { "epoch": 0.07, "learning_rate": 1.9906242795116117e-05, "loss": 23.4091, "step": 6690 }, { "epoch": 0.07, "learning_rate": 1.990576385155384e-05, "loss": 21.8633, "step": 6700 }, { "epoch": 0.07, "learning_rate": 1.990528369359431e-05, "loss": 22.3145, "step": 6710 }, { "epoch": 0.07, "learning_rate": 1.9904802321296387e-05, "loss": 22.9146, "step": 6720 }, { "epoch": 0.07, "learning_rate": 1.9904319734719086e-05, "loss": 22.2751, "step": 6730 }, { "epoch": 0.07, "learning_rate": 1.990383593392157e-05, "loss": 21.5602, "step": 6740 }, { "epoch": 0.07, "learning_rate": 1.9903350918963154e-05, "loss": 22.6016, "step": 6750 }, { "epoch": 0.07, "learning_rate": 1.990286468990329e-05, "loss": 22.6476, "step": 6760 }, { "epoch": 0.07, "learning_rate": 1.9902377246801597e-05, "loss": 22.0509, "step": 6770 }, { "epoch": 0.07, "learning_rate": 1.9901888589717827e-05, "loss": 22.5551, "step": 6780 }, { "epoch": 0.07, "learning_rate": 1.9901398718711888e-05, "loss": 22.1589, "step": 6790 }, { "epoch": 0.07, "learning_rate": 1.990090763384384e-05, "loss": 22.879, "step": 6800 }, { "epoch": 0.07, "learning_rate": 1.990041533517388e-05, "loss": 23.2176, "step": 6810 }, { "epoch": 0.07, "learning_rate": 1.9899921822762363e-05, "loss": 21.8877, "step": 6820 }, { "epoch": 0.07, "learning_rate": 1.9899427096669795e-05, "loss": 23.1625, "step": 6830 }, { "epoch": 0.07, "learning_rate": 1.989893115695683e-05, "loss": 22.0288, "step": 6840 }, { "epoch": 0.07, "learning_rate": 1.9898434003684257e-05, "loss": 22.5714, "step": 6850 }, { "epoch": 0.07, "learning_rate": 1.9897935636913035e-05, "loss": 22.4654, "step": 6860 }, { "epoch": 0.07, "learning_rate": 1.9897436056704253e-05, "loss": 22.3483, "step": 6870 }, { "epoch": 0.07, "learning_rate": 1.9896935263119162e-05, "loss": 22.5176, "step": 6880 }, { "epoch": 0.07, "learning_rate": 1.9896433256219157e-05, "loss": 22.6795, "step": 6890 }, { "epoch": 0.07, "learning_rate": 1.989593003606578e-05, "loss": 22.5448, "step": 6900 }, { "epoch": 0.07, "learning_rate": 1.989542560272072e-05, "loss": 21.9615, "step": 6910 }, { "epoch": 0.07, "learning_rate": 1.9894919956245825e-05, "loss": 23.2688, "step": 6920 }, { "epoch": 0.07, "learning_rate": 1.989441309670308e-05, "loss": 22.0932, "step": 6930 }, { "epoch": 0.08, "learning_rate": 1.9893905024154625e-05, "loss": 22.4169, "step": 6940 }, { "epoch": 0.08, "learning_rate": 1.9893395738662747e-05, "loss": 22.4926, "step": 6950 }, { "epoch": 0.08, "learning_rate": 1.989288524028988e-05, "loss": 22.1864, "step": 6960 }, { "epoch": 0.08, "learning_rate": 1.9892373529098614e-05, "loss": 21.7906, "step": 6970 }, { "epoch": 0.08, "learning_rate": 1.9891860605151677e-05, "loss": 22.0968, "step": 6980 }, { "epoch": 0.08, "learning_rate": 1.989134646851195e-05, "loss": 23.2825, "step": 6990 }, { "epoch": 0.08, "learning_rate": 1.989083111924247e-05, "loss": 22.0138, "step": 7000 }, { "epoch": 0.08, "learning_rate": 1.9890314557406406e-05, "loss": 22.4026, "step": 7010 }, { "epoch": 0.08, "learning_rate": 1.9889796783067096e-05, "loss": 23.7143, "step": 7020 }, { "epoch": 0.08, "learning_rate": 1.9889277796288013e-05, "loss": 22.8238, "step": 7030 }, { "epoch": 0.08, "learning_rate": 1.988875759713278e-05, "loss": 22.4116, "step": 7040 }, { "epoch": 0.08, "learning_rate": 1.9888236185665176e-05, "loss": 22.02, "step": 7050 }, { "epoch": 0.08, "learning_rate": 1.988771356194912e-05, "loss": 22.341, "step": 7060 }, { "epoch": 0.08, "learning_rate": 1.9887189726048678e-05, "loss": 23.0206, "step": 7070 }, { "epoch": 0.08, "learning_rate": 1.988666467802808e-05, "loss": 22.342, "step": 7080 }, { "epoch": 0.08, "learning_rate": 1.9886138417951687e-05, "loss": 22.1228, "step": 7090 }, { "epoch": 0.08, "learning_rate": 1.988561094588402e-05, "loss": 22.5713, "step": 7100 }, { "epoch": 0.08, "learning_rate": 1.9885082261889737e-05, "loss": 22.4073, "step": 7110 }, { "epoch": 0.08, "learning_rate": 1.9884552366033665e-05, "loss": 22.1888, "step": 7120 }, { "epoch": 0.08, "learning_rate": 1.9884021258380755e-05, "loss": 22.4996, "step": 7130 }, { "epoch": 0.08, "learning_rate": 1.988348893899612e-05, "loss": 22.7835, "step": 7140 }, { "epoch": 0.08, "learning_rate": 1.9882955407945026e-05, "loss": 22.7124, "step": 7150 }, { "epoch": 0.08, "learning_rate": 1.9882420665292876e-05, "loss": 23.2753, "step": 7160 }, { "epoch": 0.08, "learning_rate": 1.988188471110523e-05, "loss": 22.669, "step": 7170 }, { "epoch": 0.08, "learning_rate": 1.9881347545447785e-05, "loss": 22.1648, "step": 7180 }, { "epoch": 0.08, "learning_rate": 1.9880809168386405e-05, "loss": 22.1945, "step": 7190 }, { "epoch": 0.08, "learning_rate": 1.988026957998709e-05, "loss": 21.4844, "step": 7200 }, { "epoch": 0.08, "learning_rate": 1.987972878031599e-05, "loss": 22.986, "step": 7210 }, { "epoch": 0.08, "learning_rate": 1.98791867694394e-05, "loss": 22.0596, "step": 7220 }, { "epoch": 0.08, "learning_rate": 1.987864354742377e-05, "loss": 22.6223, "step": 7230 }, { "epoch": 0.08, "learning_rate": 1.98780991143357e-05, "loss": 22.8781, "step": 7240 }, { "epoch": 0.08, "learning_rate": 1.9877553470241934e-05, "loss": 22.2249, "step": 7250 }, { "epoch": 0.08, "learning_rate": 1.9877006615209363e-05, "loss": 22.2568, "step": 7260 }, { "epoch": 0.08, "learning_rate": 1.9876458549305027e-05, "loss": 22.8147, "step": 7270 }, { "epoch": 0.08, "learning_rate": 1.9875909272596123e-05, "loss": 22.8667, "step": 7280 }, { "epoch": 0.08, "learning_rate": 1.9875358785149982e-05, "loss": 22.5868, "step": 7290 }, { "epoch": 0.08, "learning_rate": 1.9874807087034096e-05, "loss": 22.1419, "step": 7300 }, { "epoch": 0.08, "learning_rate": 1.9874254178316097e-05, "loss": 22.1212, "step": 7310 }, { "epoch": 0.08, "learning_rate": 1.9873700059063773e-05, "loss": 22.3108, "step": 7320 }, { "epoch": 0.08, "learning_rate": 1.987314472934505e-05, "loss": 22.4554, "step": 7330 }, { "epoch": 0.08, "learning_rate": 1.9872588189228015e-05, "loss": 22.4261, "step": 7340 }, { "epoch": 0.08, "learning_rate": 1.9872030438780893e-05, "loss": 22.377, "step": 7350 }, { "epoch": 0.08, "learning_rate": 1.9871471478072065e-05, "loss": 22.5668, "step": 7360 }, { "epoch": 0.08, "learning_rate": 1.9870911307170054e-05, "loss": 22.3814, "step": 7370 }, { "epoch": 0.08, "learning_rate": 1.9870349926143537e-05, "loss": 22.5671, "step": 7380 }, { "epoch": 0.08, "learning_rate": 1.986978733506133e-05, "loss": 22.5533, "step": 7390 }, { "epoch": 0.08, "learning_rate": 1.986922353399241e-05, "loss": 23.0004, "step": 7400 }, { "epoch": 0.08, "learning_rate": 1.9868658523005894e-05, "loss": 22.7751, "step": 7410 }, { "epoch": 0.08, "learning_rate": 1.986809230217105e-05, "loss": 22.3897, "step": 7420 }, { "epoch": 0.08, "learning_rate": 1.9867524871557297e-05, "loss": 22.3395, "step": 7430 }, { "epoch": 0.08, "learning_rate": 1.9866956231234195e-05, "loss": 22.2394, "step": 7440 }, { "epoch": 0.08, "learning_rate": 1.9866386381271453e-05, "loss": 22.3317, "step": 7450 }, { "epoch": 0.08, "learning_rate": 1.986581532173894e-05, "loss": 22.4909, "step": 7460 }, { "epoch": 0.08, "learning_rate": 1.986524305270666e-05, "loss": 22.5665, "step": 7470 }, { "epoch": 0.08, "learning_rate": 1.9864669574244772e-05, "loss": 22.634, "step": 7480 }, { "epoch": 0.08, "learning_rate": 1.986409488642358e-05, "loss": 23.1084, "step": 7490 }, { "epoch": 0.08, "learning_rate": 1.986351898931354e-05, "loss": 22.0803, "step": 7500 }, { "epoch": 0.08, "learning_rate": 1.9862941882985255e-05, "loss": 22.2945, "step": 7510 }, { "epoch": 0.08, "learning_rate": 1.986236356750947e-05, "loss": 22.8401, "step": 7520 }, { "epoch": 0.08, "learning_rate": 1.986178404295709e-05, "loss": 22.0117, "step": 7530 }, { "epoch": 0.08, "learning_rate": 1.9861203309399157e-05, "loss": 22.2028, "step": 7540 }, { "epoch": 0.08, "learning_rate": 1.9860621366906868e-05, "loss": 22.0615, "step": 7550 }, { "epoch": 0.08, "learning_rate": 1.9860038215551566e-05, "loss": 21.9796, "step": 7560 }, { "epoch": 0.08, "learning_rate": 1.9859453855404743e-05, "loss": 22.535, "step": 7570 }, { "epoch": 0.08, "learning_rate": 1.9858868286538042e-05, "loss": 22.5217, "step": 7580 }, { "epoch": 0.08, "learning_rate": 1.9858281509023244e-05, "loss": 22.1542, "step": 7590 }, { "epoch": 0.08, "learning_rate": 1.985769352293229e-05, "loss": 22.5591, "step": 7600 }, { "epoch": 0.08, "learning_rate": 1.985710432833726e-05, "loss": 22.2153, "step": 7610 }, { "epoch": 0.08, "learning_rate": 1.9856513925310387e-05, "loss": 22.5209, "step": 7620 }, { "epoch": 0.08, "learning_rate": 1.9855922313924055e-05, "loss": 22.1433, "step": 7630 }, { "epoch": 0.08, "learning_rate": 1.985532949425079e-05, "loss": 22.4384, "step": 7640 }, { "epoch": 0.08, "learning_rate": 1.9854735466363273e-05, "loss": 21.7606, "step": 7650 }, { "epoch": 0.08, "learning_rate": 1.9854140230334323e-05, "loss": 22.9493, "step": 7660 }, { "epoch": 0.08, "learning_rate": 1.9853543786236917e-05, "loss": 23.003, "step": 7670 }, { "epoch": 0.08, "learning_rate": 1.9852946134144168e-05, "loss": 22.6114, "step": 7680 }, { "epoch": 0.08, "learning_rate": 1.9852347274129357e-05, "loss": 22.504, "step": 7690 }, { "epoch": 0.08, "learning_rate": 1.9851747206265896e-05, "loss": 23.1473, "step": 7700 }, { "epoch": 0.08, "learning_rate": 1.985114593062735e-05, "loss": 22.5574, "step": 7710 }, { "epoch": 0.08, "learning_rate": 1.985054344728743e-05, "loss": 22.048, "step": 7720 }, { "epoch": 0.08, "learning_rate": 1.984993975632e-05, "loss": 22.2188, "step": 7730 }, { "epoch": 0.08, "learning_rate": 1.984933485779907e-05, "loss": 21.9245, "step": 7740 }, { "epoch": 0.08, "learning_rate": 1.98487287517988e-05, "loss": 22.7155, "step": 7750 }, { "epoch": 0.08, "learning_rate": 1.9848121438393487e-05, "loss": 22.4059, "step": 7760 }, { "epoch": 0.08, "learning_rate": 1.9847512917657594e-05, "loss": 22.3355, "step": 7770 }, { "epoch": 0.08, "learning_rate": 1.984690318966572e-05, "loss": 22.8916, "step": 7780 }, { "epoch": 0.08, "learning_rate": 1.984629225449261e-05, "loss": 22.1316, "step": 7790 }, { "epoch": 0.08, "learning_rate": 1.9845680112213167e-05, "loss": 22.3822, "step": 7800 }, { "epoch": 0.08, "learning_rate": 1.984506676290243e-05, "loss": 22.126, "step": 7810 }, { "epoch": 0.08, "learning_rate": 1.9844452206635603e-05, "loss": 23.174, "step": 7820 }, { "epoch": 0.08, "learning_rate": 1.984383644348802e-05, "loss": 22.8219, "step": 7830 }, { "epoch": 0.08, "learning_rate": 1.984321947353517e-05, "loss": 22.6234, "step": 7840 }, { "epoch": 0.08, "learning_rate": 1.9842601296852696e-05, "loss": 21.6545, "step": 7850 }, { "epoch": 0.08, "learning_rate": 1.9841981913516376e-05, "loss": 22.8472, "step": 7860 }, { "epoch": 0.09, "learning_rate": 1.984136132360215e-05, "loss": 21.7502, "step": 7870 }, { "epoch": 0.09, "learning_rate": 1.9840739527186098e-05, "loss": 23.2029, "step": 7880 }, { "epoch": 0.09, "learning_rate": 1.9840116524344447e-05, "loss": 22.1608, "step": 7890 }, { "epoch": 0.09, "learning_rate": 1.9839492315153574e-05, "loss": 22.8948, "step": 7900 }, { "epoch": 0.09, "learning_rate": 1.983886689969e-05, "loss": 22.6493, "step": 7910 }, { "epoch": 0.09, "learning_rate": 1.983824027803041e-05, "loss": 22.1568, "step": 7920 }, { "epoch": 0.09, "learning_rate": 1.9837612450251612e-05, "loss": 22.3637, "step": 7930 }, { "epoch": 0.09, "learning_rate": 1.983698341643058e-05, "loss": 21.9492, "step": 7940 }, { "epoch": 0.09, "learning_rate": 1.983635317664443e-05, "loss": 22.4759, "step": 7950 }, { "epoch": 0.09, "learning_rate": 1.9835721730970427e-05, "loss": 22.441, "step": 7960 }, { "epoch": 0.09, "learning_rate": 1.9835089079485984e-05, "loss": 22.5087, "step": 7970 }, { "epoch": 0.09, "learning_rate": 1.9834455222268657e-05, "loss": 22.6362, "step": 7980 }, { "epoch": 0.09, "learning_rate": 1.983382015939616e-05, "loss": 22.3624, "step": 7990 }, { "epoch": 0.09, "learning_rate": 1.9833183890946342e-05, "loss": 22.2513, "step": 8000 }, { "epoch": 0.09, "learning_rate": 1.9832546416997206e-05, "loss": 22.9373, "step": 8010 }, { "epoch": 0.09, "learning_rate": 1.983190773762691e-05, "loss": 22.9572, "step": 8020 }, { "epoch": 0.09, "learning_rate": 1.983126785291375e-05, "loss": 21.913, "step": 8030 }, { "epoch": 0.09, "learning_rate": 1.983062676293617e-05, "loss": 21.9885, "step": 8040 }, { "epoch": 0.09, "learning_rate": 1.9829984467772764e-05, "loss": 22.0822, "step": 8050 }, { "epoch": 0.09, "learning_rate": 1.982934096750228e-05, "loss": 22.6822, "step": 8060 }, { "epoch": 0.09, "learning_rate": 1.98286962622036e-05, "loss": 22.1133, "step": 8070 }, { "epoch": 0.09, "learning_rate": 1.982805035195577e-05, "loss": 22.4799, "step": 8080 }, { "epoch": 0.09, "learning_rate": 1.982740323683797e-05, "loss": 22.0333, "step": 8090 }, { "epoch": 0.09, "learning_rate": 1.9826754916929532e-05, "loss": 22.1621, "step": 8100 }, { "epoch": 0.09, "learning_rate": 1.9826105392309944e-05, "loss": 22.5172, "step": 8110 }, { "epoch": 0.09, "learning_rate": 1.9825454663058824e-05, "loss": 23.0169, "step": 8120 }, { "epoch": 0.09, "learning_rate": 1.982480272925596e-05, "loss": 22.7866, "step": 8130 }, { "epoch": 0.09, "learning_rate": 1.9824149590981263e-05, "loss": 22.4221, "step": 8140 }, { "epoch": 0.09, "learning_rate": 1.9823495248314814e-05, "loss": 22.5707, "step": 8150 }, { "epoch": 0.09, "learning_rate": 1.9822839701336832e-05, "loss": 22.6994, "step": 8160 }, { "epoch": 0.09, "learning_rate": 1.9822182950127677e-05, "loss": 22.8287, "step": 8170 }, { "epoch": 0.09, "learning_rate": 1.982152499476787e-05, "loss": 22.4817, "step": 8180 }, { "epoch": 0.09, "learning_rate": 1.9820865835338068e-05, "loss": 22.281, "step": 8190 }, { "epoch": 0.09, "learning_rate": 1.9820205471919085e-05, "loss": 21.5993, "step": 8200 }, { "epoch": 0.09, "learning_rate": 1.9819543904591875e-05, "loss": 22.5997, "step": 8210 }, { "epoch": 0.09, "learning_rate": 1.9818881133437548e-05, "loss": 22.2533, "step": 8220 }, { "epoch": 0.09, "learning_rate": 1.9818217158537347e-05, "loss": 22.2239, "step": 8230 }, { "epoch": 0.09, "learning_rate": 1.9817551979972682e-05, "loss": 22.9191, "step": 8240 }, { "epoch": 0.09, "learning_rate": 1.9816885597825096e-05, "loss": 23.0481, "step": 8250 }, { "epoch": 0.09, "learning_rate": 1.9816218012176283e-05, "loss": 22.453, "step": 8260 }, { "epoch": 0.09, "learning_rate": 1.981554922310809e-05, "loss": 22.2139, "step": 8270 }, { "epoch": 0.09, "learning_rate": 1.9814879230702496e-05, "loss": 22.4737, "step": 8280 }, { "epoch": 0.09, "learning_rate": 1.9814208035041654e-05, "loss": 22.6306, "step": 8290 }, { "epoch": 0.09, "learning_rate": 1.9813535636207844e-05, "loss": 22.7563, "step": 8300 }, { "epoch": 0.09, "learning_rate": 1.9812862034283493e-05, "loss": 22.665, "step": 8310 }, { "epoch": 0.09, "learning_rate": 1.9812187229351187e-05, "loss": 22.4544, "step": 8320 }, { "epoch": 0.09, "learning_rate": 1.9811511221493652e-05, "loss": 22.5641, "step": 8330 }, { "epoch": 0.09, "learning_rate": 1.981083401079376e-05, "loss": 21.9096, "step": 8340 }, { "epoch": 0.09, "learning_rate": 1.9810155597334542e-05, "loss": 23.2169, "step": 8350 }, { "epoch": 0.09, "learning_rate": 1.980947598119916e-05, "loss": 22.4326, "step": 8360 }, { "epoch": 0.09, "learning_rate": 1.9808795162470937e-05, "loss": 22.1952, "step": 8370 }, { "epoch": 0.09, "learning_rate": 1.980811314123333e-05, "loss": 22.7957, "step": 8380 }, { "epoch": 0.09, "learning_rate": 1.980742991756996e-05, "loss": 21.5948, "step": 8390 }, { "epoch": 0.09, "learning_rate": 1.9806745491564588e-05, "loss": 22.2107, "step": 8400 }, { "epoch": 0.09, "learning_rate": 1.980605986330111e-05, "loss": 22.3343, "step": 8410 }, { "epoch": 0.09, "learning_rate": 1.9805373032863592e-05, "loss": 22.1508, "step": 8420 }, { "epoch": 0.09, "learning_rate": 1.9804685000336227e-05, "loss": 22.2618, "step": 8430 }, { "epoch": 0.09, "learning_rate": 1.9803995765803374e-05, "loss": 22.1805, "step": 8440 }, { "epoch": 0.09, "learning_rate": 1.980330532934952e-05, "loss": 22.3253, "step": 8450 }, { "epoch": 0.09, "learning_rate": 1.980261369105932e-05, "loss": 22.9123, "step": 8460 }, { "epoch": 0.09, "learning_rate": 1.9801920851017552e-05, "loss": 22.7734, "step": 8470 }, { "epoch": 0.09, "learning_rate": 1.9801226809309167e-05, "loss": 22.0237, "step": 8480 }, { "epoch": 0.09, "learning_rate": 1.9800531566019243e-05, "loss": 22.4507, "step": 8490 }, { "epoch": 0.09, "learning_rate": 1.979983512123302e-05, "loss": 22.135, "step": 8500 }, { "epoch": 0.09, "learning_rate": 1.979913747503587e-05, "loss": 22.3816, "step": 8510 }, { "epoch": 0.09, "learning_rate": 1.9798438627513324e-05, "loss": 22.334, "step": 8520 }, { "epoch": 0.09, "learning_rate": 1.9797738578751066e-05, "loss": 22.7797, "step": 8530 }, { "epoch": 0.09, "learning_rate": 1.979703732883491e-05, "loss": 22.5544, "step": 8540 }, { "epoch": 0.09, "learning_rate": 1.9796334877850823e-05, "loss": 21.9679, "step": 8550 }, { "epoch": 0.09, "learning_rate": 1.979563122588493e-05, "loss": 22.0756, "step": 8560 }, { "epoch": 0.09, "learning_rate": 1.9794926373023488e-05, "loss": 22.5049, "step": 8570 }, { "epoch": 0.09, "learning_rate": 1.9794220319352914e-05, "loss": 22.6664, "step": 8580 }, { "epoch": 0.09, "learning_rate": 1.9793513064959765e-05, "loss": 22.2088, "step": 8590 }, { "epoch": 0.09, "learning_rate": 1.979280460993075e-05, "loss": 21.812, "step": 8600 }, { "epoch": 0.09, "learning_rate": 1.979209495435271e-05, "loss": 23.0863, "step": 8610 }, { "epoch": 0.09, "learning_rate": 1.979138409831266e-05, "loss": 21.3415, "step": 8620 }, { "epoch": 0.09, "learning_rate": 1.979067204189774e-05, "loss": 22.4694, "step": 8630 }, { "epoch": 0.09, "learning_rate": 1.9789958785195243e-05, "loss": 21.332, "step": 8640 }, { "epoch": 0.09, "learning_rate": 1.9789244328292617e-05, "loss": 21.9797, "step": 8650 }, { "epoch": 0.09, "learning_rate": 1.978852867127744e-05, "loss": 22.2054, "step": 8660 }, { "epoch": 0.09, "learning_rate": 1.9787811814237465e-05, "loss": 23.0766, "step": 8670 }, { "epoch": 0.09, "learning_rate": 1.978709375726056e-05, "loss": 22.0747, "step": 8680 }, { "epoch": 0.09, "learning_rate": 1.9786374500434763e-05, "loss": 21.8373, "step": 8690 }, { "epoch": 0.09, "learning_rate": 1.9785654043848246e-05, "loss": 21.7155, "step": 8700 }, { "epoch": 0.09, "learning_rate": 1.978493238758934e-05, "loss": 22.254, "step": 8710 }, { "epoch": 0.09, "learning_rate": 1.978420953174651e-05, "loss": 21.9914, "step": 8720 }, { "epoch": 0.09, "learning_rate": 1.9783485476408376e-05, "loss": 22.5451, "step": 8730 }, { "epoch": 0.09, "learning_rate": 1.9782760221663708e-05, "loss": 22.2527, "step": 8740 }, { "epoch": 0.09, "learning_rate": 1.9782033767601414e-05, "loss": 21.8357, "step": 8750 }, { "epoch": 0.09, "learning_rate": 1.9781306114310555e-05, "loss": 22.4629, "step": 8760 }, { "epoch": 0.09, "learning_rate": 1.9780577261880336e-05, "loss": 22.8638, "step": 8770 }, { "epoch": 0.09, "learning_rate": 1.9779847210400116e-05, "loss": 22.3736, "step": 8780 }, { "epoch": 0.1, "learning_rate": 1.977911595995939e-05, "loss": 22.5582, "step": 8790 }, { "epoch": 0.1, "learning_rate": 1.9778383510647806e-05, "loss": 21.2458, "step": 8800 }, { "epoch": 0.1, "learning_rate": 1.9777649862555164e-05, "loss": 22.3624, "step": 8810 }, { "epoch": 0.1, "learning_rate": 1.97769150157714e-05, "loss": 22.4439, "step": 8820 }, { "epoch": 0.1, "learning_rate": 1.9776178970386605e-05, "loss": 21.4448, "step": 8830 }, { "epoch": 0.1, "learning_rate": 1.9775441726491014e-05, "loss": 22.6108, "step": 8840 }, { "epoch": 0.1, "learning_rate": 1.9774703284175007e-05, "loss": 22.5167, "step": 8850 }, { "epoch": 0.1, "learning_rate": 1.977396364352912e-05, "loss": 22.2773, "step": 8860 }, { "epoch": 0.1, "learning_rate": 1.977322280464402e-05, "loss": 22.1836, "step": 8870 }, { "epoch": 0.1, "learning_rate": 1.977248076761054e-05, "loss": 22.3235, "step": 8880 }, { "epoch": 0.1, "learning_rate": 1.9771737532519643e-05, "loss": 22.6518, "step": 8890 }, { "epoch": 0.1, "learning_rate": 1.977099309946245e-05, "loss": 22.3411, "step": 8900 }, { "epoch": 0.1, "learning_rate": 1.9770247468530218e-05, "loss": 21.5256, "step": 8910 }, { "epoch": 0.1, "learning_rate": 1.9769500639814368e-05, "loss": 22.7612, "step": 8920 }, { "epoch": 0.1, "learning_rate": 1.976875261340645e-05, "loss": 22.4767, "step": 8930 }, { "epoch": 0.1, "learning_rate": 1.9768003389398172e-05, "loss": 23.2569, "step": 8940 }, { "epoch": 0.1, "learning_rate": 1.976725296788138e-05, "loss": 22.2023, "step": 8950 }, { "epoch": 0.1, "learning_rate": 1.9766501348948078e-05, "loss": 21.3606, "step": 8960 }, { "epoch": 0.1, "learning_rate": 1.9765748532690405e-05, "loss": 21.7161, "step": 8970 }, { "epoch": 0.1, "learning_rate": 1.976499451920066e-05, "loss": 22.0827, "step": 8980 }, { "epoch": 0.1, "learning_rate": 1.9764239308571273e-05, "loss": 22.3857, "step": 8990 }, { "epoch": 0.1, "learning_rate": 1.9763482900894836e-05, "loss": 21.9206, "step": 9000 }, { "epoch": 0.1, "learning_rate": 1.9762725296264076e-05, "loss": 22.5823, "step": 9010 }, { "epoch": 0.1, "learning_rate": 1.9761966494771875e-05, "loss": 22.3261, "step": 9020 }, { "epoch": 0.1, "learning_rate": 1.9761206496511255e-05, "loss": 22.3733, "step": 9030 }, { "epoch": 0.1, "learning_rate": 1.976044530157539e-05, "loss": 22.4899, "step": 9040 }, { "epoch": 0.1, "learning_rate": 1.97596829100576e-05, "loss": 22.111, "step": 9050 }, { "epoch": 0.1, "learning_rate": 1.9758919322051346e-05, "loss": 21.6758, "step": 9060 }, { "epoch": 0.1, "learning_rate": 1.9758154537650244e-05, "loss": 22.6582, "step": 9070 }, { "epoch": 0.1, "learning_rate": 1.975738855694805e-05, "loss": 21.9253, "step": 9080 }, { "epoch": 0.1, "learning_rate": 1.9756621380038673e-05, "loss": 22.0479, "step": 9090 }, { "epoch": 0.1, "learning_rate": 1.9755853007016163e-05, "loss": 22.3259, "step": 9100 }, { "epoch": 0.1, "learning_rate": 1.975508343797472e-05, "loss": 22.2871, "step": 9110 }, { "epoch": 0.1, "learning_rate": 1.9754312673008688e-05, "loss": 22.8079, "step": 9120 }, { "epoch": 0.1, "learning_rate": 1.9753540712212555e-05, "loss": 22.2761, "step": 9130 }, { "epoch": 0.1, "learning_rate": 1.9752767555680967e-05, "loss": 23.2419, "step": 9140 }, { "epoch": 0.1, "learning_rate": 1.9751993203508703e-05, "loss": 22.6165, "step": 9150 }, { "epoch": 0.1, "learning_rate": 1.9751217655790704e-05, "loss": 22.1106, "step": 9160 }, { "epoch": 0.1, "learning_rate": 1.9750440912622035e-05, "loss": 22.2859, "step": 9170 }, { "epoch": 0.1, "learning_rate": 1.9749662974097926e-05, "loss": 22.5384, "step": 9180 }, { "epoch": 0.1, "learning_rate": 1.9748883840313757e-05, "loss": 22.5279, "step": 9190 }, { "epoch": 0.1, "learning_rate": 1.9748103511365032e-05, "loss": 22.0872, "step": 9200 }, { "epoch": 0.1, "learning_rate": 1.974732198734743e-05, "loss": 23.0751, "step": 9210 }, { "epoch": 0.1, "learning_rate": 1.9746539268356746e-05, "loss": 22.3167, "step": 9220 }, { "epoch": 0.1, "learning_rate": 1.974575535448895e-05, "loss": 22.4099, "step": 9230 }, { "epoch": 0.1, "learning_rate": 1.9744970245840142e-05, "loss": 22.3727, "step": 9240 }, { "epoch": 0.1, "learning_rate": 1.974418394250657e-05, "loss": 23.0867, "step": 9250 }, { "epoch": 0.1, "learning_rate": 1.9743396444584636e-05, "loss": 23.011, "step": 9260 }, { "epoch": 0.1, "learning_rate": 1.9742607752170877e-05, "loss": 21.7936, "step": 9270 }, { "epoch": 0.1, "learning_rate": 1.9741817865361986e-05, "loss": 22.3713, "step": 9280 }, { "epoch": 0.1, "learning_rate": 1.9741026784254803e-05, "loss": 22.2159, "step": 9290 }, { "epoch": 0.1, "learning_rate": 1.97402345089463e-05, "loss": 21.9769, "step": 9300 }, { "epoch": 0.1, "learning_rate": 1.973944103953362e-05, "loss": 22.767, "step": 9310 }, { "epoch": 0.1, "learning_rate": 1.9738646376114027e-05, "loss": 22.4063, "step": 9320 }, { "epoch": 0.1, "learning_rate": 1.973785051878495e-05, "loss": 22.5836, "step": 9330 }, { "epoch": 0.1, "learning_rate": 1.973705346764395e-05, "loss": 22.7621, "step": 9340 }, { "epoch": 0.1, "learning_rate": 1.9736255222788747e-05, "loss": 22.4365, "step": 9350 }, { "epoch": 0.1, "learning_rate": 1.9735455784317203e-05, "loss": 21.8655, "step": 9360 }, { "epoch": 0.1, "learning_rate": 1.9734655152327318e-05, "loss": 22.3261, "step": 9370 }, { "epoch": 0.1, "learning_rate": 1.9733853326917254e-05, "loss": 22.2667, "step": 9380 }, { "epoch": 0.1, "learning_rate": 1.9733050308185303e-05, "loss": 21.9363, "step": 9390 }, { "epoch": 0.1, "learning_rate": 1.973224609622992e-05, "loss": 21.8901, "step": 9400 }, { "epoch": 0.1, "learning_rate": 1.9731440691149688e-05, "loss": 21.6763, "step": 9410 }, { "epoch": 0.1, "learning_rate": 1.973063409304335e-05, "loss": 22.027, "step": 9420 }, { "epoch": 0.1, "learning_rate": 1.9729826302009794e-05, "loss": 23.1716, "step": 9430 }, { "epoch": 0.1, "learning_rate": 1.972901731814805e-05, "loss": 22.3958, "step": 9440 }, { "epoch": 0.1, "learning_rate": 1.9728207141557286e-05, "loss": 21.8741, "step": 9450 }, { "epoch": 0.1, "learning_rate": 1.9727395772336835e-05, "loss": 22.4497, "step": 9460 }, { "epoch": 0.1, "learning_rate": 1.972658321058617e-05, "loss": 21.789, "step": 9470 }, { "epoch": 0.1, "learning_rate": 1.9725769456404898e-05, "loss": 21.8141, "step": 9480 }, { "epoch": 0.1, "learning_rate": 1.9724954509892783e-05, "loss": 22.1832, "step": 9490 }, { "epoch": 0.1, "learning_rate": 1.972413837114974e-05, "loss": 21.8269, "step": 9500 }, { "epoch": 0.1, "learning_rate": 1.9723321040275816e-05, "loss": 21.9382, "step": 9510 }, { "epoch": 0.1, "learning_rate": 1.9722502517371212e-05, "loss": 22.4583, "step": 9520 }, { "epoch": 0.1, "learning_rate": 1.9721682802536282e-05, "loss": 21.6018, "step": 9530 }, { "epoch": 0.1, "learning_rate": 1.9720861895871515e-05, "loss": 21.4993, "step": 9540 }, { "epoch": 0.1, "learning_rate": 1.9720039797477547e-05, "loss": 22.8721, "step": 9550 }, { "epoch": 0.1, "learning_rate": 1.9719216507455168e-05, "loss": 21.7815, "step": 9560 }, { "epoch": 0.1, "learning_rate": 1.9718392025905306e-05, "loss": 22.5982, "step": 9570 }, { "epoch": 0.1, "learning_rate": 1.971756635292904e-05, "loss": 21.7278, "step": 9580 }, { "epoch": 0.1, "learning_rate": 1.971673948862759e-05, "loss": 22.421, "step": 9590 }, { "epoch": 0.1, "learning_rate": 1.9715911433102327e-05, "loss": 21.9228, "step": 9600 }, { "epoch": 0.1, "learning_rate": 1.9715082186454772e-05, "loss": 21.8127, "step": 9610 }, { "epoch": 0.1, "learning_rate": 1.971425174878658e-05, "loss": 22.3355, "step": 9620 }, { "epoch": 0.1, "learning_rate": 1.9713420120199564e-05, "loss": 21.8916, "step": 9630 }, { "epoch": 0.1, "learning_rate": 1.971258730079567e-05, "loss": 22.2734, "step": 9640 }, { "epoch": 0.1, "learning_rate": 1.9711753290677e-05, "loss": 22.7067, "step": 9650 }, { "epoch": 0.1, "learning_rate": 1.9710918089945802e-05, "loss": 22.6771, "step": 9660 }, { "epoch": 0.1, "learning_rate": 1.9710081698704472e-05, "loss": 22.7201, "step": 9670 }, { "epoch": 0.1, "learning_rate": 1.9709244117055537e-05, "loss": 22.1995, "step": 9680 }, { "epoch": 0.1, "learning_rate": 1.9708405345101687e-05, "loss": 22.7311, "step": 9690 }, { "epoch": 0.1, "learning_rate": 1.9707565382945745e-05, "loss": 22.2568, "step": 9700 }, { "epoch": 0.1, "learning_rate": 1.97067242306907e-05, "loss": 22.1973, "step": 9710 }, { "epoch": 0.11, "learning_rate": 1.9705881888439657e-05, "loss": 22.2168, "step": 9720 }, { "epoch": 0.11, "learning_rate": 1.970503835629589e-05, "loss": 21.7675, "step": 9730 }, { "epoch": 0.11, "learning_rate": 1.9704193634362813e-05, "loss": 22.0703, "step": 9740 }, { "epoch": 0.11, "learning_rate": 1.970334772274398e-05, "loss": 22.318, "step": 9750 }, { "epoch": 0.11, "learning_rate": 1.9702500621543103e-05, "loss": 22.7218, "step": 9760 }, { "epoch": 0.11, "learning_rate": 1.9701652330864026e-05, "loss": 22.4363, "step": 9770 }, { "epoch": 0.11, "learning_rate": 1.9700802850810746e-05, "loss": 22.8381, "step": 9780 }, { "epoch": 0.11, "learning_rate": 1.969995218148741e-05, "loss": 23.0439, "step": 9790 }, { "epoch": 0.11, "learning_rate": 1.96991003229983e-05, "loss": 22.6166, "step": 9800 }, { "epoch": 0.11, "learning_rate": 1.9698247275447856e-05, "loss": 22.3761, "step": 9810 }, { "epoch": 0.11, "learning_rate": 1.969739303894065e-05, "loss": 21.9843, "step": 9820 }, { "epoch": 0.11, "learning_rate": 1.969653761358141e-05, "loss": 22.423, "step": 9830 }, { "epoch": 0.11, "learning_rate": 1.9695680999475005e-05, "loss": 22.7124, "step": 9840 }, { "epoch": 0.11, "learning_rate": 1.9694823196726458e-05, "loss": 22.5035, "step": 9850 }, { "epoch": 0.11, "learning_rate": 1.9693964205440926e-05, "loss": 22.0959, "step": 9860 }, { "epoch": 0.11, "learning_rate": 1.9693104025723717e-05, "loss": 22.3004, "step": 9870 }, { "epoch": 0.11, "learning_rate": 1.9692242657680286e-05, "loss": 22.4527, "step": 9880 }, { "epoch": 0.11, "learning_rate": 1.9691380101416232e-05, "loss": 22.6178, "step": 9890 }, { "epoch": 0.11, "learning_rate": 1.9690516357037304e-05, "loss": 22.0049, "step": 9900 }, { "epoch": 0.11, "learning_rate": 1.9689651424649385e-05, "loss": 23.5045, "step": 9910 }, { "epoch": 0.11, "learning_rate": 1.968878530435852e-05, "loss": 22.5754, "step": 9920 }, { "epoch": 0.11, "learning_rate": 1.968791799627088e-05, "loss": 22.6668, "step": 9930 }, { "epoch": 0.11, "learning_rate": 1.968704950049281e-05, "loss": 22.4251, "step": 9940 }, { "epoch": 0.11, "learning_rate": 1.9686179817130764e-05, "loss": 22.0733, "step": 9950 }, { "epoch": 0.11, "learning_rate": 1.968530894629137e-05, "loss": 22.3479, "step": 9960 }, { "epoch": 0.11, "learning_rate": 1.9684436888081396e-05, "loss": 21.8775, "step": 9970 }, { "epoch": 0.11, "learning_rate": 1.9683563642607744e-05, "loss": 21.9054, "step": 9980 }, { "epoch": 0.11, "learning_rate": 1.9682689209977476e-05, "loss": 21.9702, "step": 9990 }, { "epoch": 0.11, "learning_rate": 1.968181359029779e-05, "loss": 22.5098, "step": 10000 }, { "epoch": 0.11, "learning_rate": 1.968093678367603e-05, "loss": 22.1775, "step": 10010 }, { "epoch": 0.11, "learning_rate": 1.9680058790219693e-05, "loss": 22.3435, "step": 10020 }, { "epoch": 0.11, "learning_rate": 1.9679179610036417e-05, "loss": 22.4357, "step": 10030 }, { "epoch": 0.11, "learning_rate": 1.967829924323398e-05, "loss": 22.933, "step": 10040 }, { "epoch": 0.11, "learning_rate": 1.9677417689920315e-05, "loss": 22.3662, "step": 10050 }, { "epoch": 0.11, "learning_rate": 1.9676534950203495e-05, "loss": 21.9968, "step": 10060 }, { "epoch": 0.11, "learning_rate": 1.9675651024191737e-05, "loss": 22.7253, "step": 10070 }, { "epoch": 0.11, "learning_rate": 1.9674765911993406e-05, "loss": 22.1825, "step": 10080 }, { "epoch": 0.11, "learning_rate": 1.967387961371702e-05, "loss": 22.3061, "step": 10090 }, { "epoch": 0.11, "learning_rate": 1.9672992129471227e-05, "loss": 21.9596, "step": 10100 }, { "epoch": 0.11, "learning_rate": 1.9672103459364828e-05, "loss": 21.9697, "step": 10110 }, { "epoch": 0.11, "learning_rate": 1.9671213603506775e-05, "loss": 22.0598, "step": 10120 }, { "epoch": 0.11, "learning_rate": 1.9670322562006158e-05, "loss": 22.0738, "step": 10130 }, { "epoch": 0.11, "learning_rate": 1.9669430334972207e-05, "loss": 21.8778, "step": 10140 }, { "epoch": 0.11, "learning_rate": 1.9668536922514315e-05, "loss": 21.7454, "step": 10150 }, { "epoch": 0.11, "learning_rate": 1.9667642324742003e-05, "loss": 23.126, "step": 10160 }, { "epoch": 0.11, "learning_rate": 1.9666746541764948e-05, "loss": 22.6752, "step": 10170 }, { "epoch": 0.11, "learning_rate": 1.9665849573692967e-05, "loss": 22.0614, "step": 10180 }, { "epoch": 0.11, "learning_rate": 1.966495142063602e-05, "loss": 22.3988, "step": 10190 }, { "epoch": 0.11, "learning_rate": 1.9664052082704225e-05, "loss": 21.9375, "step": 10200 }, { "epoch": 0.11, "learning_rate": 1.9663151560007828e-05, "loss": 21.7196, "step": 10210 }, { "epoch": 0.11, "learning_rate": 1.9662249852657233e-05, "loss": 22.0273, "step": 10220 }, { "epoch": 0.11, "learning_rate": 1.9661346960762984e-05, "loss": 21.4134, "step": 10230 }, { "epoch": 0.11, "learning_rate": 1.9660442884435775e-05, "loss": 21.3947, "step": 10240 }, { "epoch": 0.11, "learning_rate": 1.9659537623786428e-05, "loss": 21.8906, "step": 10250 }, { "epoch": 0.11, "learning_rate": 1.965863117892594e-05, "loss": 22.601, "step": 10260 }, { "epoch": 0.11, "learning_rate": 1.9657723549965427e-05, "loss": 22.1457, "step": 10270 }, { "epoch": 0.11, "learning_rate": 1.965681473701616e-05, "loss": 21.9678, "step": 10280 }, { "epoch": 0.11, "learning_rate": 1.965590474018956e-05, "loss": 22.3199, "step": 10290 }, { "epoch": 0.11, "learning_rate": 1.9654993559597184e-05, "loss": 22.6193, "step": 10300 }, { "epoch": 0.11, "learning_rate": 1.9654081195350734e-05, "loss": 22.6572, "step": 10310 }, { "epoch": 0.11, "learning_rate": 1.9653167647562075e-05, "loss": 22.4667, "step": 10320 }, { "epoch": 0.11, "learning_rate": 1.9652252916343187e-05, "loss": 22.8543, "step": 10330 }, { "epoch": 0.11, "learning_rate": 1.9651337001806224e-05, "loss": 21.8373, "step": 10340 }, { "epoch": 0.11, "learning_rate": 1.965041990406347e-05, "loss": 20.8873, "step": 10350 }, { "epoch": 0.11, "learning_rate": 1.964950162322735e-05, "loss": 21.817, "step": 10360 }, { "epoch": 0.11, "learning_rate": 1.9648582159410446e-05, "loss": 22.9783, "step": 10370 }, { "epoch": 0.11, "learning_rate": 1.964766151272548e-05, "loss": 21.1805, "step": 10380 }, { "epoch": 0.11, "learning_rate": 1.9646739683285317e-05, "loss": 21.8749, "step": 10390 }, { "epoch": 0.11, "learning_rate": 1.964581667120297e-05, "loss": 22.3982, "step": 10400 }, { "epoch": 0.11, "learning_rate": 1.964489247659159e-05, "loss": 21.705, "step": 10410 }, { "epoch": 0.11, "learning_rate": 1.9643967099564488e-05, "loss": 22.0315, "step": 10420 }, { "epoch": 0.11, "learning_rate": 1.9643040540235104e-05, "loss": 21.5918, "step": 10430 }, { "epoch": 0.11, "learning_rate": 1.9642112798717035e-05, "loss": 22.2883, "step": 10440 }, { "epoch": 0.11, "learning_rate": 1.964118387512401e-05, "loss": 22.1141, "step": 10450 }, { "epoch": 0.11, "learning_rate": 1.9640253769569918e-05, "loss": 21.9348, "step": 10460 }, { "epoch": 0.11, "learning_rate": 1.9639322482168783e-05, "loss": 22.1923, "step": 10470 }, { "epoch": 0.11, "learning_rate": 1.963839001303477e-05, "loss": 21.9535, "step": 10480 }, { "epoch": 0.11, "learning_rate": 1.9637456362282205e-05, "loss": 22.0938, "step": 10490 }, { "epoch": 0.11, "learning_rate": 1.9636521530025542e-05, "loss": 22.2173, "step": 10500 }, { "epoch": 0.11, "learning_rate": 1.9635585516379387e-05, "loss": 22.1715, "step": 10510 }, { "epoch": 0.11, "learning_rate": 1.9634648321458495e-05, "loss": 21.6539, "step": 10520 }, { "epoch": 0.11, "learning_rate": 1.9633709945377758e-05, "loss": 22.4624, "step": 10530 }, { "epoch": 0.11, "learning_rate": 1.9632770388252216e-05, "loss": 21.6658, "step": 10540 }, { "epoch": 0.11, "learning_rate": 1.9631829650197056e-05, "loss": 22.148, "step": 10550 }, { "epoch": 0.11, "learning_rate": 1.963088773132761e-05, "loss": 22.1346, "step": 10560 }, { "epoch": 0.11, "learning_rate": 1.9629944631759344e-05, "loss": 21.7224, "step": 10570 }, { "epoch": 0.11, "learning_rate": 1.9629000351607884e-05, "loss": 21.9538, "step": 10580 }, { "epoch": 0.11, "learning_rate": 1.9628054890988997e-05, "loss": 21.6342, "step": 10590 }, { "epoch": 0.11, "learning_rate": 1.9627108250018582e-05, "loss": 21.4213, "step": 10600 }, { "epoch": 0.11, "learning_rate": 1.9626160428812702e-05, "loss": 21.8227, "step": 10610 }, { "epoch": 0.11, "learning_rate": 1.962521142748755e-05, "loss": 23.2386, "step": 10620 }, { "epoch": 0.11, "learning_rate": 1.9624261246159468e-05, "loss": 21.7575, "step": 10630 }, { "epoch": 0.12, "learning_rate": 1.962330988494495e-05, "loss": 22.2316, "step": 10640 }, { "epoch": 0.12, "learning_rate": 1.962235734396062e-05, "loss": 21.7746, "step": 10650 }, { "epoch": 0.12, "learning_rate": 1.9621403623323258e-05, "loss": 22.3353, "step": 10660 }, { "epoch": 0.12, "learning_rate": 1.962044872314979e-05, "loss": 21.9104, "step": 10670 }, { "epoch": 0.12, "learning_rate": 1.9619492643557275e-05, "loss": 21.7557, "step": 10680 }, { "epoch": 0.12, "learning_rate": 1.9618535384662924e-05, "loss": 22.0132, "step": 10690 }, { "epoch": 0.12, "learning_rate": 1.9617576946584097e-05, "loss": 21.9539, "step": 10700 }, { "epoch": 0.12, "learning_rate": 1.9616617329438294e-05, "loss": 21.9397, "step": 10710 }, { "epoch": 0.12, "learning_rate": 1.961565653334315e-05, "loss": 21.9479, "step": 10720 }, { "epoch": 0.12, "learning_rate": 1.9614694558416466e-05, "loss": 21.7344, "step": 10730 }, { "epoch": 0.12, "learning_rate": 1.9613731404776168e-05, "loss": 22.4015, "step": 10740 }, { "epoch": 0.12, "learning_rate": 1.9612767072540335e-05, "loss": 21.6781, "step": 10750 }, { "epoch": 0.12, "learning_rate": 1.961180156182719e-05, "loss": 22.2023, "step": 10760 }, { "epoch": 0.12, "learning_rate": 1.96108348727551e-05, "loss": 22.0369, "step": 10770 }, { "epoch": 0.12, "learning_rate": 1.9609867005442576e-05, "loss": 22.0656, "step": 10780 }, { "epoch": 0.12, "learning_rate": 1.9608897960008274e-05, "loss": 22.2057, "step": 10790 }, { "epoch": 0.12, "learning_rate": 1.9607927736570994e-05, "loss": 21.995, "step": 10800 }, { "epoch": 0.12, "learning_rate": 1.960695633524968e-05, "loss": 22.5233, "step": 10810 }, { "epoch": 0.12, "learning_rate": 1.960598375616342e-05, "loss": 21.4775, "step": 10820 }, { "epoch": 0.12, "learning_rate": 1.960500999943145e-05, "loss": 21.5613, "step": 10830 }, { "epoch": 0.12, "learning_rate": 1.9604035065173147e-05, "loss": 21.947, "step": 10840 }, { "epoch": 0.12, "learning_rate": 1.960305895350803e-05, "loss": 22.3767, "step": 10850 }, { "epoch": 0.12, "learning_rate": 1.9602081664555767e-05, "loss": 22.5389, "step": 10860 }, { "epoch": 0.12, "learning_rate": 1.9601103198436173e-05, "loss": 22.1659, "step": 10870 }, { "epoch": 0.12, "learning_rate": 1.9600123555269198e-05, "loss": 22.9619, "step": 10880 }, { "epoch": 0.12, "learning_rate": 1.9599142735174947e-05, "loss": 21.7622, "step": 10890 }, { "epoch": 0.12, "learning_rate": 1.959816073827365e-05, "loss": 22.2331, "step": 10900 }, { "epoch": 0.12, "learning_rate": 1.9597177564685715e-05, "loss": 22.4048, "step": 10910 }, { "epoch": 0.12, "learning_rate": 1.959619321453166e-05, "loss": 22.6168, "step": 10920 }, { "epoch": 0.12, "learning_rate": 1.9595207687932164e-05, "loss": 21.6119, "step": 10930 }, { "epoch": 0.12, "learning_rate": 1.959422098500805e-05, "loss": 22.6989, "step": 10940 }, { "epoch": 0.12, "learning_rate": 1.959323310588028e-05, "loss": 22.1797, "step": 10950 }, { "epoch": 0.12, "learning_rate": 1.9592244050669967e-05, "loss": 22.1315, "step": 10960 }, { "epoch": 0.12, "learning_rate": 1.959125381949836e-05, "loss": 22.0103, "step": 10970 }, { "epoch": 0.12, "learning_rate": 1.9590262412486862e-05, "loss": 21.9253, "step": 10980 }, { "epoch": 0.12, "learning_rate": 1.958926982975701e-05, "loss": 21.9533, "step": 10990 }, { "epoch": 0.12, "learning_rate": 1.9588276071430486e-05, "loss": 21.6531, "step": 11000 }, { "epoch": 0.12, "learning_rate": 1.958728113762913e-05, "loss": 22.0284, "step": 11010 }, { "epoch": 0.12, "learning_rate": 1.9586285028474908e-05, "loss": 22.7746, "step": 11020 }, { "epoch": 0.12, "learning_rate": 1.958528774408994e-05, "loss": 21.0495, "step": 11030 }, { "epoch": 0.12, "learning_rate": 1.958428928459649e-05, "loss": 21.874, "step": 11040 }, { "epoch": 0.12, "learning_rate": 1.9583289650116963e-05, "loss": 22.3144, "step": 11050 }, { "epoch": 0.12, "learning_rate": 1.9582288840773907e-05, "loss": 22.5515, "step": 11060 }, { "epoch": 0.12, "learning_rate": 1.958128685669002e-05, "loss": 22.1941, "step": 11070 }, { "epoch": 0.12, "learning_rate": 1.9580283697988135e-05, "loss": 21.8142, "step": 11080 }, { "epoch": 0.12, "learning_rate": 1.9579279364791242e-05, "loss": 22.6992, "step": 11090 }, { "epoch": 0.12, "learning_rate": 1.9578273857222457e-05, "loss": 21.5368, "step": 11100 }, { "epoch": 0.12, "learning_rate": 1.9577267175405063e-05, "loss": 22.0869, "step": 11110 }, { "epoch": 0.12, "learning_rate": 1.9576259319462463e-05, "loss": 22.3106, "step": 11120 }, { "epoch": 0.12, "learning_rate": 1.957525028951822e-05, "loss": 22.8026, "step": 11130 }, { "epoch": 0.12, "learning_rate": 1.9574240085696037e-05, "loss": 22.36, "step": 11140 }, { "epoch": 0.12, "learning_rate": 1.9573228708119755e-05, "loss": 22.4596, "step": 11150 }, { "epoch": 0.12, "learning_rate": 1.9572216156913374e-05, "loss": 21.8724, "step": 11160 }, { "epoch": 0.12, "learning_rate": 1.9571202432201013e-05, "loss": 22.3196, "step": 11170 }, { "epoch": 0.12, "learning_rate": 1.957018753410696e-05, "loss": 22.4856, "step": 11180 }, { "epoch": 0.12, "learning_rate": 1.9569171462755637e-05, "loss": 22.6066, "step": 11190 }, { "epoch": 0.12, "learning_rate": 1.9568154218271603e-05, "loss": 22.411, "step": 11200 }, { "epoch": 0.12, "learning_rate": 1.956713580077957e-05, "loss": 21.7554, "step": 11210 }, { "epoch": 0.12, "learning_rate": 1.9566116210404393e-05, "loss": 22.2052, "step": 11220 }, { "epoch": 0.12, "learning_rate": 1.956509544727107e-05, "loss": 22.6856, "step": 11230 }, { "epoch": 0.12, "learning_rate": 1.9564073511504732e-05, "loss": 22.1144, "step": 11240 }, { "epoch": 0.12, "learning_rate": 1.9563050403230674e-05, "loss": 22.2476, "step": 11250 }, { "epoch": 0.12, "learning_rate": 1.956202612257432e-05, "loss": 21.6884, "step": 11260 }, { "epoch": 0.12, "learning_rate": 1.9561000669661237e-05, "loss": 22.2497, "step": 11270 }, { "epoch": 0.12, "learning_rate": 1.955997404461715e-05, "loss": 21.495, "step": 11280 }, { "epoch": 0.12, "learning_rate": 1.955894624756791e-05, "loss": 22.7449, "step": 11290 }, { "epoch": 0.12, "learning_rate": 1.9557917278639522e-05, "loss": 21.9859, "step": 11300 }, { "epoch": 0.12, "learning_rate": 1.9556887137958133e-05, "loss": 21.3978, "step": 11310 }, { "epoch": 0.12, "learning_rate": 1.9555855825650038e-05, "loss": 21.5202, "step": 11320 }, { "epoch": 0.12, "learning_rate": 1.955482334184166e-05, "loss": 22.3177, "step": 11330 }, { "epoch": 0.12, "learning_rate": 1.9553789686659584e-05, "loss": 22.3109, "step": 11340 }, { "epoch": 0.12, "learning_rate": 1.9552754860230528e-05, "loss": 21.5923, "step": 11350 }, { "epoch": 0.12, "learning_rate": 1.9551718862681363e-05, "loss": 22.0029, "step": 11360 }, { "epoch": 0.12, "learning_rate": 1.9550681694139086e-05, "loss": 22.2364, "step": 11370 }, { "epoch": 0.12, "learning_rate": 1.9549643354730857e-05, "loss": 21.9053, "step": 11380 }, { "epoch": 0.12, "learning_rate": 1.9548603844583974e-05, "loss": 22.0056, "step": 11390 }, { "epoch": 0.12, "learning_rate": 1.9547563163825863e-05, "loss": 22.2521, "step": 11400 }, { "epoch": 0.12, "learning_rate": 1.9546521312584117e-05, "loss": 22.3861, "step": 11410 }, { "epoch": 0.12, "learning_rate": 1.954547829098646e-05, "loss": 21.595, "step": 11420 }, { "epoch": 0.12, "learning_rate": 1.954443409916076e-05, "loss": 21.7094, "step": 11430 }, { "epoch": 0.12, "learning_rate": 1.9543388737235025e-05, "loss": 21.8654, "step": 11440 }, { "epoch": 0.12, "learning_rate": 1.954234220533742e-05, "loss": 22.2967, "step": 11450 }, { "epoch": 0.12, "learning_rate": 1.954129450359624e-05, "loss": 22.152, "step": 11460 }, { "epoch": 0.12, "learning_rate": 1.954024563213993e-05, "loss": 21.6713, "step": 11470 }, { "epoch": 0.12, "learning_rate": 1.953919559109707e-05, "loss": 22.5974, "step": 11480 }, { "epoch": 0.12, "learning_rate": 1.95381443805964e-05, "loss": 22.3158, "step": 11490 }, { "epoch": 0.12, "learning_rate": 1.9537092000766783e-05, "loss": 21.7603, "step": 11500 }, { "epoch": 0.12, "learning_rate": 1.9536038451737244e-05, "loss": 22.3053, "step": 11510 }, { "epoch": 0.12, "learning_rate": 1.953498373363694e-05, "loss": 21.4106, "step": 11520 }, { "epoch": 0.12, "learning_rate": 1.953392784659517e-05, "loss": 23.0791, "step": 11530 }, { "epoch": 0.12, "learning_rate": 1.9532870790741386e-05, "loss": 22.665, "step": 11540 }, { "epoch": 0.12, "learning_rate": 1.9531812566205175e-05, "loss": 22.2369, "step": 11550 }, { "epoch": 0.12, "learning_rate": 1.953075317311627e-05, "loss": 22.2576, "step": 11560 }, { "epoch": 0.13, "learning_rate": 1.9529692611604546e-05, "loss": 22.7839, "step": 11570 }, { "epoch": 0.13, "learning_rate": 1.9528630881800028e-05, "loss": 22.5991, "step": 11580 }, { "epoch": 0.13, "learning_rate": 1.9527567983832877e-05, "loss": 22.0617, "step": 11590 }, { "epoch": 0.13, "learning_rate": 1.9526503917833394e-05, "loss": 22.0342, "step": 11600 }, { "epoch": 0.13, "learning_rate": 1.9525438683932032e-05, "loss": 21.8185, "step": 11610 }, { "epoch": 0.13, "learning_rate": 1.9524372282259387e-05, "loss": 21.8671, "step": 11620 }, { "epoch": 0.13, "learning_rate": 1.9523304712946182e-05, "loss": 21.2327, "step": 11630 }, { "epoch": 0.13, "learning_rate": 1.952223597612331e-05, "loss": 22.158, "step": 11640 }, { "epoch": 0.13, "learning_rate": 1.9521166071921787e-05, "loss": 22.2651, "step": 11650 }, { "epoch": 0.13, "learning_rate": 1.9520095000472772e-05, "loss": 21.905, "step": 11660 }, { "epoch": 0.13, "learning_rate": 1.9519022761907584e-05, "loss": 21.7153, "step": 11670 }, { "epoch": 0.13, "learning_rate": 1.951794935635767e-05, "loss": 22.1699, "step": 11680 }, { "epoch": 0.13, "learning_rate": 1.9516874783954622e-05, "loss": 21.7654, "step": 11690 }, { "epoch": 0.13, "learning_rate": 1.951579904483018e-05, "loss": 23.1438, "step": 11700 }, { "epoch": 0.13, "learning_rate": 1.951472213911622e-05, "loss": 22.2275, "step": 11710 }, { "epoch": 0.13, "learning_rate": 1.9513644066944764e-05, "loss": 21.5835, "step": 11720 }, { "epoch": 0.13, "learning_rate": 1.951256482844799e-05, "loss": 22.1635, "step": 11730 }, { "epoch": 0.13, "learning_rate": 1.951148442375819e-05, "loss": 22.2026, "step": 11740 }, { "epoch": 0.13, "learning_rate": 1.9510402853007834e-05, "loss": 21.7416, "step": 11750 }, { "epoch": 0.13, "learning_rate": 1.9509320116329507e-05, "loss": 22.0501, "step": 11760 }, { "epoch": 0.13, "learning_rate": 1.9508236213855944e-05, "loss": 22.0911, "step": 11770 }, { "epoch": 0.13, "learning_rate": 1.950715114572004e-05, "loss": 21.3582, "step": 11780 }, { "epoch": 0.13, "learning_rate": 1.9506064912054802e-05, "loss": 21.9626, "step": 11790 }, { "epoch": 0.13, "learning_rate": 1.9504977512993406e-05, "loss": 22.443, "step": 11800 }, { "epoch": 0.13, "learning_rate": 1.950388894866916e-05, "loss": 22.0693, "step": 11810 }, { "epoch": 0.13, "learning_rate": 1.950279921921552e-05, "loss": 22.295, "step": 11820 }, { "epoch": 0.13, "learning_rate": 1.9501708324766078e-05, "loss": 21.78, "step": 11830 }, { "epoch": 0.13, "learning_rate": 1.9500616265454574e-05, "loss": 22.5081, "step": 11840 }, { "epoch": 0.13, "learning_rate": 1.949952304141488e-05, "loss": 21.8715, "step": 11850 }, { "epoch": 0.13, "learning_rate": 1.9498428652781034e-05, "loss": 22.5068, "step": 11860 }, { "epoch": 0.13, "learning_rate": 1.9497333099687193e-05, "loss": 21.9182, "step": 11870 }, { "epoch": 0.13, "learning_rate": 1.9496236382267673e-05, "loss": 22.3651, "step": 11880 }, { "epoch": 0.13, "learning_rate": 1.9495138500656923e-05, "loss": 22.4511, "step": 11890 }, { "epoch": 0.13, "learning_rate": 1.949403945498953e-05, "loss": 22.6091, "step": 11900 }, { "epoch": 0.13, "learning_rate": 1.9492939245400245e-05, "loss": 21.864, "step": 11910 }, { "epoch": 0.13, "learning_rate": 1.9491837872023943e-05, "loss": 20.8129, "step": 11920 }, { "epoch": 0.13, "learning_rate": 1.949073533499564e-05, "loss": 21.7375, "step": 11930 }, { "epoch": 0.13, "learning_rate": 1.9489631634450516e-05, "loss": 22.183, "step": 11940 }, { "epoch": 0.13, "learning_rate": 1.9488526770523862e-05, "loss": 22.0118, "step": 11950 }, { "epoch": 0.13, "learning_rate": 1.948742074335114e-05, "loss": 21.4422, "step": 11960 }, { "epoch": 0.13, "learning_rate": 1.9486313553067943e-05, "loss": 22.7709, "step": 11970 }, { "epoch": 0.13, "learning_rate": 1.9485205199810005e-05, "loss": 22.153, "step": 11980 }, { "epoch": 0.13, "learning_rate": 1.9484095683713203e-05, "loss": 21.7172, "step": 11990 }, { "epoch": 0.13, "learning_rate": 1.948298500491356e-05, "loss": 21.7603, "step": 12000 }, { "epoch": 0.13, "learning_rate": 1.948187316354724e-05, "loss": 22.121, "step": 12010 }, { "epoch": 0.13, "learning_rate": 1.948076015975054e-05, "loss": 22.3523, "step": 12020 }, { "epoch": 0.13, "learning_rate": 1.947964599365993e-05, "loss": 21.8534, "step": 12030 }, { "epoch": 0.13, "learning_rate": 1.9478530665411982e-05, "loss": 21.9343, "step": 12040 }, { "epoch": 0.13, "learning_rate": 1.9477414175143434e-05, "loss": 22.1014, "step": 12050 }, { "epoch": 0.13, "learning_rate": 1.9476296522991167e-05, "loss": 22.7039, "step": 12060 }, { "epoch": 0.13, "learning_rate": 1.9475177709092195e-05, "loss": 21.9179, "step": 12070 }, { "epoch": 0.13, "learning_rate": 1.9474057733583685e-05, "loss": 21.3196, "step": 12080 }, { "epoch": 0.13, "learning_rate": 1.9472936596602933e-05, "loss": 22.6137, "step": 12090 }, { "epoch": 0.13, "learning_rate": 1.947181429828739e-05, "loss": 21.7767, "step": 12100 }, { "epoch": 0.13, "learning_rate": 1.9470690838774643e-05, "loss": 21.919, "step": 12110 }, { "epoch": 0.13, "learning_rate": 1.9469566218202417e-05, "loss": 21.3296, "step": 12120 }, { "epoch": 0.13, "learning_rate": 1.9468440436708593e-05, "loss": 21.4936, "step": 12130 }, { "epoch": 0.13, "learning_rate": 1.946731349443118e-05, "loss": 22.3326, "step": 12140 }, { "epoch": 0.13, "learning_rate": 1.9466185391508344e-05, "loss": 22.8625, "step": 12150 }, { "epoch": 0.13, "learning_rate": 1.9465056128078372e-05, "loss": 21.6735, "step": 12160 }, { "epoch": 0.13, "learning_rate": 1.9463925704279717e-05, "loss": 21.347, "step": 12170 }, { "epoch": 0.13, "learning_rate": 1.946279412025096e-05, "loss": 21.2368, "step": 12180 }, { "epoch": 0.13, "learning_rate": 1.946166137613083e-05, "loss": 22.2006, "step": 12190 }, { "epoch": 0.13, "learning_rate": 1.9460527472058185e-05, "loss": 21.9749, "step": 12200 }, { "epoch": 0.13, "learning_rate": 1.9459392408172045e-05, "loss": 21.2354, "step": 12210 }, { "epoch": 0.13, "learning_rate": 1.945825618461157e-05, "loss": 22.6107, "step": 12220 }, { "epoch": 0.13, "learning_rate": 1.945711880151604e-05, "loss": 22.5925, "step": 12230 }, { "epoch": 0.13, "learning_rate": 1.94559802590249e-05, "loss": 22.5481, "step": 12240 }, { "epoch": 0.13, "learning_rate": 1.9454840557277733e-05, "loss": 21.7809, "step": 12250 }, { "epoch": 0.13, "learning_rate": 1.9453699696414254e-05, "loss": 22.2594, "step": 12260 }, { "epoch": 0.13, "learning_rate": 1.945255767657433e-05, "loss": 22.2804, "step": 12270 }, { "epoch": 0.13, "learning_rate": 1.945141449789797e-05, "loss": 21.802, "step": 12280 }, { "epoch": 0.13, "learning_rate": 1.9450270160525314e-05, "loss": 21.7994, "step": 12290 }, { "epoch": 0.13, "learning_rate": 1.9449124664596662e-05, "loss": 21.7204, "step": 12300 }, { "epoch": 0.13, "learning_rate": 1.944797801025244e-05, "loss": 22.4486, "step": 12310 }, { "epoch": 0.13, "learning_rate": 1.944683019763322e-05, "loss": 21.7343, "step": 12320 }, { "epoch": 0.13, "learning_rate": 1.9445681226879727e-05, "loss": 22.8379, "step": 12330 }, { "epoch": 0.13, "learning_rate": 1.944453109813281e-05, "loss": 22.1322, "step": 12340 }, { "epoch": 0.13, "learning_rate": 1.9443379811533475e-05, "loss": 22.9742, "step": 12350 }, { "epoch": 0.13, "learning_rate": 1.944222736722286e-05, "loss": 21.767, "step": 12360 }, { "epoch": 0.13, "learning_rate": 1.9441073765342246e-05, "loss": 23.3225, "step": 12370 }, { "epoch": 0.13, "learning_rate": 1.943991900603307e-05, "loss": 21.4752, "step": 12380 }, { "epoch": 0.13, "learning_rate": 1.943876308943689e-05, "loss": 22.4408, "step": 12390 }, { "epoch": 0.13, "learning_rate": 1.9437606015695417e-05, "loss": 21.5854, "step": 12400 }, { "epoch": 0.13, "learning_rate": 1.943644778495051e-05, "loss": 21.3085, "step": 12410 }, { "epoch": 0.13, "learning_rate": 1.943528839734415e-05, "loss": 21.9019, "step": 12420 }, { "epoch": 0.13, "learning_rate": 1.943412785301848e-05, "loss": 21.9701, "step": 12430 }, { "epoch": 0.13, "learning_rate": 1.9432966152115776e-05, "loss": 20.9435, "step": 12440 }, { "epoch": 0.13, "learning_rate": 1.9431803294778454e-05, "loss": 21.8254, "step": 12450 }, { "epoch": 0.13, "learning_rate": 1.9430639281149083e-05, "loss": 21.7975, "step": 12460 }, { "epoch": 0.13, "learning_rate": 1.942947411137035e-05, "loss": 21.5907, "step": 12470 }, { "epoch": 0.13, "learning_rate": 1.9428307785585116e-05, "loss": 22.0372, "step": 12480 }, { "epoch": 0.14, "learning_rate": 1.9427140303936355e-05, "loss": 22.7111, "step": 12490 }, { "epoch": 0.14, "learning_rate": 1.9425971666567198e-05, "loss": 22.034, "step": 12500 }, { "epoch": 0.14, "learning_rate": 1.9424801873620915e-05, "loss": 21.8975, "step": 12510 }, { "epoch": 0.14, "learning_rate": 1.9423630925240916e-05, "loss": 22.665, "step": 12520 }, { "epoch": 0.14, "learning_rate": 1.9422458821570755e-05, "loss": 22.0563, "step": 12530 }, { "epoch": 0.14, "learning_rate": 1.9421285562754123e-05, "loss": 22.0088, "step": 12540 }, { "epoch": 0.14, "learning_rate": 1.9420111148934854e-05, "loss": 22.0813, "step": 12550 }, { "epoch": 0.14, "learning_rate": 1.9418935580256933e-05, "loss": 21.5078, "step": 12560 }, { "epoch": 0.14, "learning_rate": 1.9417758856864473e-05, "loss": 22.4094, "step": 12570 }, { "epoch": 0.14, "learning_rate": 1.941658097890174e-05, "loss": 21.9396, "step": 12580 }, { "epoch": 0.14, "learning_rate": 1.9415401946513125e-05, "loss": 22.2437, "step": 12590 }, { "epoch": 0.14, "learning_rate": 1.9414221759843183e-05, "loss": 22.4812, "step": 12600 }, { "epoch": 0.14, "learning_rate": 1.9413040419036592e-05, "loss": 21.4013, "step": 12610 }, { "epoch": 0.14, "learning_rate": 1.9411857924238176e-05, "loss": 22.2233, "step": 12620 }, { "epoch": 0.14, "learning_rate": 1.9410674275592916e-05, "loss": 22.1571, "step": 12630 }, { "epoch": 0.14, "learning_rate": 1.9409489473245908e-05, "loss": 22.0403, "step": 12640 }, { "epoch": 0.14, "learning_rate": 1.940830351734241e-05, "loss": 21.3847, "step": 12650 }, { "epoch": 0.14, "learning_rate": 1.9407116408027812e-05, "loss": 21.6915, "step": 12660 }, { "epoch": 0.14, "learning_rate": 1.940592814544765e-05, "loss": 21.4617, "step": 12670 }, { "epoch": 0.14, "learning_rate": 1.9404738729747593e-05, "loss": 22.6955, "step": 12680 }, { "epoch": 0.14, "learning_rate": 1.940354816107346e-05, "loss": 22.0667, "step": 12690 }, { "epoch": 0.14, "learning_rate": 1.9402356439571216e-05, "loss": 22.0892, "step": 12700 }, { "epoch": 0.14, "learning_rate": 1.940116356538695e-05, "loss": 22.3438, "step": 12710 }, { "epoch": 0.14, "learning_rate": 1.939996953866691e-05, "loss": 21.3983, "step": 12720 }, { "epoch": 0.14, "learning_rate": 1.939877435955747e-05, "loss": 21.052, "step": 12730 }, { "epoch": 0.14, "learning_rate": 1.9397578028205162e-05, "loss": 22.3065, "step": 12740 }, { "epoch": 0.14, "learning_rate": 1.9396380544756644e-05, "loss": 21.7714, "step": 12750 }, { "epoch": 0.14, "learning_rate": 1.939518190935872e-05, "loss": 21.8733, "step": 12760 }, { "epoch": 0.14, "learning_rate": 1.9393982122158345e-05, "loss": 22.1309, "step": 12770 }, { "epoch": 0.14, "learning_rate": 1.9392781183302602e-05, "loss": 21.0491, "step": 12780 }, { "epoch": 0.14, "learning_rate": 1.9391579092938717e-05, "loss": 21.6893, "step": 12790 }, { "epoch": 0.14, "learning_rate": 1.9390375851214066e-05, "loss": 22.2231, "step": 12800 }, { "epoch": 0.14, "learning_rate": 1.9389171458276156e-05, "loss": 21.9562, "step": 12810 }, { "epoch": 0.14, "learning_rate": 1.938796591427264e-05, "loss": 22.524, "step": 12820 }, { "epoch": 0.14, "learning_rate": 1.9386759219351315e-05, "loss": 22.2006, "step": 12830 }, { "epoch": 0.14, "learning_rate": 1.9385551373660113e-05, "loss": 21.6386, "step": 12840 }, { "epoch": 0.14, "learning_rate": 1.938434237734711e-05, "loss": 21.7389, "step": 12850 }, { "epoch": 0.14, "learning_rate": 1.9383132230560523e-05, "loss": 22.008, "step": 12860 }, { "epoch": 0.14, "learning_rate": 1.9381920933448715e-05, "loss": 21.6676, "step": 12870 }, { "epoch": 0.14, "learning_rate": 1.9380708486160175e-05, "loss": 22.0041, "step": 12880 }, { "epoch": 0.14, "learning_rate": 1.937949488884355e-05, "loss": 21.8059, "step": 12890 }, { "epoch": 0.14, "learning_rate": 1.937828014164762e-05, "loss": 22.8231, "step": 12900 }, { "epoch": 0.14, "learning_rate": 1.937706424472131e-05, "loss": 22.1157, "step": 12910 }, { "epoch": 0.14, "learning_rate": 1.9375847198213672e-05, "loss": 21.8657, "step": 12920 }, { "epoch": 0.14, "learning_rate": 1.9374629002273923e-05, "loss": 22.6628, "step": 12930 }, { "epoch": 0.14, "learning_rate": 1.93734096570514e-05, "loss": 22.0837, "step": 12940 }, { "epoch": 0.14, "learning_rate": 1.9372189162695592e-05, "loss": 22.5935, "step": 12950 }, { "epoch": 0.14, "learning_rate": 1.937096751935612e-05, "loss": 22.8239, "step": 12960 }, { "epoch": 0.14, "learning_rate": 1.936974472718276e-05, "loss": 21.5946, "step": 12970 }, { "epoch": 0.14, "learning_rate": 1.9368520786325412e-05, "loss": 21.5568, "step": 12980 }, { "epoch": 0.14, "learning_rate": 1.936729569693413e-05, "loss": 23.2847, "step": 12990 }, { "epoch": 0.14, "learning_rate": 1.9366069459159104e-05, "loss": 21.7281, "step": 13000 }, { "epoch": 0.14, "learning_rate": 1.9364842073150663e-05, "loss": 22.3739, "step": 13010 }, { "epoch": 0.14, "learning_rate": 1.9363613539059277e-05, "loss": 22.2461, "step": 13020 }, { "epoch": 0.14, "learning_rate": 1.936238385703556e-05, "loss": 21.9387, "step": 13030 }, { "epoch": 0.14, "learning_rate": 1.9361153027230264e-05, "loss": 21.941, "step": 13040 }, { "epoch": 0.14, "learning_rate": 1.9359921049794287e-05, "loss": 21.6246, "step": 13050 }, { "epoch": 0.14, "learning_rate": 1.9358687924878656e-05, "loss": 21.3039, "step": 13060 }, { "epoch": 0.14, "learning_rate": 1.935745365263455e-05, "loss": 22.3156, "step": 13070 }, { "epoch": 0.14, "learning_rate": 1.9356218233213285e-05, "loss": 21.3912, "step": 13080 }, { "epoch": 0.14, "learning_rate": 1.9354981666766313e-05, "loss": 21.052, "step": 13090 }, { "epoch": 0.14, "learning_rate": 1.9353743953445237e-05, "loss": 21.8189, "step": 13100 }, { "epoch": 0.14, "learning_rate": 1.9352505093401793e-05, "loss": 21.7134, "step": 13110 }, { "epoch": 0.14, "learning_rate": 1.9351265086787856e-05, "loss": 21.8657, "step": 13120 }, { "epoch": 0.14, "learning_rate": 1.9350023933755446e-05, "loss": 21.9554, "step": 13130 }, { "epoch": 0.14, "learning_rate": 1.9348781634456725e-05, "loss": 22.1592, "step": 13140 }, { "epoch": 0.14, "learning_rate": 1.934753818904399e-05, "loss": 22.3718, "step": 13150 }, { "epoch": 0.14, "learning_rate": 1.934629359766968e-05, "loss": 21.8669, "step": 13160 }, { "epoch": 0.14, "learning_rate": 1.9345047860486375e-05, "loss": 21.9929, "step": 13170 }, { "epoch": 0.14, "learning_rate": 1.9343800977646803e-05, "loss": 22.5001, "step": 13180 }, { "epoch": 0.14, "learning_rate": 1.934255294930382e-05, "loss": 21.8428, "step": 13190 }, { "epoch": 0.14, "learning_rate": 1.9341303775610427e-05, "loss": 22.8052, "step": 13200 }, { "epoch": 0.14, "learning_rate": 1.9340053456719768e-05, "loss": 22.5194, "step": 13210 }, { "epoch": 0.14, "learning_rate": 1.9338801992785127e-05, "loss": 22.1447, "step": 13220 }, { "epoch": 0.14, "learning_rate": 1.933754938395993e-05, "loss": 22.5055, "step": 13230 }, { "epoch": 0.14, "learning_rate": 1.9336295630397735e-05, "loss": 21.9901, "step": 13240 }, { "epoch": 0.14, "learning_rate": 1.9335040732252248e-05, "loss": 21.7884, "step": 13250 }, { "epoch": 0.14, "learning_rate": 1.9333784689677313e-05, "loss": 21.8616, "step": 13260 }, { "epoch": 0.14, "learning_rate": 1.9332527502826915e-05, "loss": 21.9835, "step": 13270 }, { "epoch": 0.14, "learning_rate": 1.933126917185518e-05, "loss": 22.5978, "step": 13280 }, { "epoch": 0.14, "learning_rate": 1.933000969691637e-05, "loss": 21.6529, "step": 13290 }, { "epoch": 0.14, "learning_rate": 1.9328749078164892e-05, "loss": 21.1914, "step": 13300 }, { "epoch": 0.14, "learning_rate": 1.9327487315755294e-05, "loss": 21.7103, "step": 13310 }, { "epoch": 0.14, "learning_rate": 1.932622440984226e-05, "loss": 22.4672, "step": 13320 }, { "epoch": 0.14, "learning_rate": 1.932496036058061e-05, "loss": 21.3876, "step": 13330 }, { "epoch": 0.14, "learning_rate": 1.932369516812532e-05, "loss": 21.2814, "step": 13340 }, { "epoch": 0.14, "learning_rate": 1.9322428832631493e-05, "loss": 21.8751, "step": 13350 }, { "epoch": 0.14, "learning_rate": 1.9321161354254373e-05, "loss": 22.703, "step": 13360 }, { "epoch": 0.14, "learning_rate": 1.9319892733149346e-05, "loss": 21.4903, "step": 13370 }, { "epoch": 0.14, "learning_rate": 1.9318622969471945e-05, "loss": 22.2498, "step": 13380 }, { "epoch": 0.14, "learning_rate": 1.931735206337783e-05, "loss": 21.2711, "step": 13390 }, { "epoch": 0.14, "learning_rate": 1.931608001502281e-05, "loss": 21.7074, "step": 13400 }, { "epoch": 0.14, "learning_rate": 1.9314806824562833e-05, "loss": 21.9928, "step": 13410 }, { "epoch": 0.15, "learning_rate": 1.9313532492153984e-05, "loss": 22.3565, "step": 13420 }, { "epoch": 0.15, "learning_rate": 1.9312257017952488e-05, "loss": 21.6011, "step": 13430 }, { "epoch": 0.15, "learning_rate": 1.9310980402114716e-05, "loss": 21.7206, "step": 13440 }, { "epoch": 0.15, "learning_rate": 1.930970264479717e-05, "loss": 22.9054, "step": 13450 }, { "epoch": 0.15, "learning_rate": 1.9308423746156503e-05, "loss": 23.108, "step": 13460 }, { "epoch": 0.15, "learning_rate": 1.93071437063495e-05, "loss": 22.6622, "step": 13470 }, { "epoch": 0.15, "learning_rate": 1.930586252553308e-05, "loss": 22.0943, "step": 13480 }, { "epoch": 0.15, "learning_rate": 1.930458020386432e-05, "loss": 22.0412, "step": 13490 }, { "epoch": 0.15, "learning_rate": 1.9303296741500422e-05, "loss": 21.838, "step": 13500 }, { "epoch": 0.15, "learning_rate": 1.9302012138598726e-05, "loss": 22.1294, "step": 13510 }, { "epoch": 0.15, "learning_rate": 1.930072639531673e-05, "loss": 21.8678, "step": 13520 }, { "epoch": 0.15, "learning_rate": 1.9299439511812046e-05, "loss": 21.8322, "step": 13530 }, { "epoch": 0.15, "learning_rate": 1.9298151488242453e-05, "loss": 21.6278, "step": 13540 }, { "epoch": 0.15, "learning_rate": 1.9296862324765843e-05, "loss": 22.4477, "step": 13550 }, { "epoch": 0.15, "learning_rate": 1.9295572021540274e-05, "loss": 21.8764, "step": 13560 }, { "epoch": 0.15, "learning_rate": 1.9294280578723922e-05, "loss": 21.4787, "step": 13570 }, { "epoch": 0.15, "learning_rate": 1.9292987996475113e-05, "loss": 22.119, "step": 13580 }, { "epoch": 0.15, "learning_rate": 1.929169427495231e-05, "loss": 21.4625, "step": 13590 }, { "epoch": 0.15, "learning_rate": 1.9290399414314123e-05, "loss": 21.6881, "step": 13600 }, { "epoch": 0.15, "learning_rate": 1.928910341471929e-05, "loss": 20.9967, "step": 13610 }, { "epoch": 0.15, "learning_rate": 1.9287806276326696e-05, "loss": 21.8454, "step": 13620 }, { "epoch": 0.15, "learning_rate": 1.9286507999295364e-05, "loss": 21.3742, "step": 13630 }, { "epoch": 0.15, "learning_rate": 1.9285208583784453e-05, "loss": 21.7424, "step": 13640 }, { "epoch": 0.15, "learning_rate": 1.928390802995327e-05, "loss": 21.9822, "step": 13650 }, { "epoch": 0.15, "learning_rate": 1.928260633796125e-05, "loss": 22.0032, "step": 13660 }, { "epoch": 0.15, "learning_rate": 1.9281303507967982e-05, "loss": 22.8652, "step": 13670 }, { "epoch": 0.15, "learning_rate": 1.927999954013318e-05, "loss": 22.6881, "step": 13680 }, { "epoch": 0.15, "learning_rate": 1.9278694434616704e-05, "loss": 21.8587, "step": 13690 }, { "epoch": 0.15, "learning_rate": 1.927738819157856e-05, "loss": 21.1864, "step": 13700 }, { "epoch": 0.15, "learning_rate": 1.9276080811178878e-05, "loss": 21.4959, "step": 13710 }, { "epoch": 0.15, "learning_rate": 1.9274772293577944e-05, "loss": 22.7285, "step": 13720 }, { "epoch": 0.15, "learning_rate": 1.9273462638936173e-05, "loss": 22.2556, "step": 13730 }, { "epoch": 0.15, "learning_rate": 1.927215184741412e-05, "loss": 21.2657, "step": 13740 }, { "epoch": 0.15, "learning_rate": 1.9270839919172482e-05, "loss": 21.6098, "step": 13750 }, { "epoch": 0.15, "learning_rate": 1.92695268543721e-05, "loss": 21.1177, "step": 13760 }, { "epoch": 0.15, "learning_rate": 1.926821265317394e-05, "loss": 21.7503, "step": 13770 }, { "epoch": 0.15, "learning_rate": 1.9266897315739122e-05, "loss": 21.9274, "step": 13780 }, { "epoch": 0.15, "learning_rate": 1.9265580842228904e-05, "loss": 22.3143, "step": 13790 }, { "epoch": 0.15, "learning_rate": 1.926426323280467e-05, "loss": 22.3266, "step": 13800 }, { "epoch": 0.15, "learning_rate": 1.926294448762796e-05, "loss": 22.0258, "step": 13810 }, { "epoch": 0.15, "learning_rate": 1.9261624606860442e-05, "loss": 21.9458, "step": 13820 }, { "epoch": 0.15, "learning_rate": 1.9260303590663925e-05, "loss": 21.807, "step": 13830 }, { "epoch": 0.15, "learning_rate": 1.9258981439200367e-05, "loss": 21.9958, "step": 13840 }, { "epoch": 0.15, "learning_rate": 1.9257658152631843e-05, "loss": 21.5365, "step": 13850 }, { "epoch": 0.15, "learning_rate": 1.9256333731120596e-05, "loss": 21.9846, "step": 13860 }, { "epoch": 0.15, "learning_rate": 1.9255008174828986e-05, "loss": 21.9134, "step": 13870 }, { "epoch": 0.15, "learning_rate": 1.925368148391952e-05, "loss": 21.3246, "step": 13880 }, { "epoch": 0.15, "learning_rate": 1.9252353658554845e-05, "loss": 21.5134, "step": 13890 }, { "epoch": 0.15, "learning_rate": 1.9251024698897745e-05, "loss": 21.8759, "step": 13900 }, { "epoch": 0.15, "learning_rate": 1.9249694605111145e-05, "loss": 21.9988, "step": 13910 }, { "epoch": 0.15, "learning_rate": 1.9248363377358107e-05, "loss": 21.9028, "step": 13920 }, { "epoch": 0.15, "learning_rate": 1.9247031015801832e-05, "loss": 21.1759, "step": 13930 }, { "epoch": 0.15, "learning_rate": 1.9245697520605663e-05, "loss": 22.3951, "step": 13940 }, { "epoch": 0.15, "learning_rate": 1.9244362891933077e-05, "loss": 22.4367, "step": 13950 }, { "epoch": 0.15, "learning_rate": 1.9243027129947694e-05, "loss": 21.4885, "step": 13960 }, { "epoch": 0.15, "learning_rate": 1.9241690234813276e-05, "loss": 22.2202, "step": 13970 }, { "epoch": 0.15, "learning_rate": 1.9240352206693713e-05, "loss": 21.8314, "step": 13980 }, { "epoch": 0.15, "learning_rate": 1.9239013045753046e-05, "loss": 22.0592, "step": 13990 }, { "epoch": 0.15, "learning_rate": 1.9237672752155446e-05, "loss": 22.4248, "step": 14000 }, { "epoch": 0.15, "learning_rate": 1.9236331326065224e-05, "loss": 21.8045, "step": 14010 }, { "epoch": 0.15, "learning_rate": 1.923498876764684e-05, "loss": 21.2371, "step": 14020 }, { "epoch": 0.15, "learning_rate": 1.923364507706488e-05, "loss": 21.7945, "step": 14030 }, { "epoch": 0.15, "learning_rate": 1.9232300254484068e-05, "loss": 20.4916, "step": 14040 }, { "epoch": 0.15, "learning_rate": 1.9230954300069286e-05, "loss": 21.723, "step": 14050 }, { "epoch": 0.15, "learning_rate": 1.922960721398553e-05, "loss": 21.1838, "step": 14060 }, { "epoch": 0.15, "learning_rate": 1.922825899639795e-05, "loss": 21.8668, "step": 14070 }, { "epoch": 0.15, "learning_rate": 1.922690964747183e-05, "loss": 22.3936, "step": 14080 }, { "epoch": 0.15, "learning_rate": 1.9225559167372598e-05, "loss": 21.1919, "step": 14090 }, { "epoch": 0.15, "learning_rate": 1.9224207556265812e-05, "loss": 22.6864, "step": 14100 }, { "epoch": 0.15, "learning_rate": 1.922285481431717e-05, "loss": 21.7426, "step": 14110 }, { "epoch": 0.15, "learning_rate": 1.9221500941692513e-05, "loss": 21.3085, "step": 14120 }, { "epoch": 0.15, "learning_rate": 1.9220145938557828e-05, "loss": 22.2767, "step": 14130 }, { "epoch": 0.15, "learning_rate": 1.921878980507922e-05, "loss": 22.0403, "step": 14140 }, { "epoch": 0.15, "learning_rate": 1.9217432541422946e-05, "loss": 21.9478, "step": 14150 }, { "epoch": 0.15, "learning_rate": 1.9216074147755407e-05, "loss": 22.4381, "step": 14160 }, { "epoch": 0.15, "learning_rate": 1.921471462424313e-05, "loss": 22.131, "step": 14170 }, { "epoch": 0.15, "learning_rate": 1.921335397105278e-05, "loss": 21.6617, "step": 14180 }, { "epoch": 0.15, "learning_rate": 1.921199218835118e-05, "loss": 21.7693, "step": 14190 }, { "epoch": 0.15, "learning_rate": 1.9210629276305262e-05, "loss": 21.7178, "step": 14200 }, { "epoch": 0.15, "learning_rate": 1.920926523508213e-05, "loss": 22.1289, "step": 14210 }, { "epoch": 0.15, "learning_rate": 1.920790006484899e-05, "loss": 22.3884, "step": 14220 }, { "epoch": 0.15, "learning_rate": 1.920653376577322e-05, "loss": 21.5121, "step": 14230 }, { "epoch": 0.15, "learning_rate": 1.920516633802232e-05, "loss": 21.6105, "step": 14240 }, { "epoch": 0.15, "learning_rate": 1.9203797781763918e-05, "loss": 21.9079, "step": 14250 }, { "epoch": 0.15, "learning_rate": 1.9202428097165803e-05, "loss": 21.4834, "step": 14260 }, { "epoch": 0.15, "learning_rate": 1.9201057284395887e-05, "loss": 21.6593, "step": 14270 }, { "epoch": 0.15, "learning_rate": 1.9199685343622226e-05, "loss": 21.4076, "step": 14280 }, { "epoch": 0.15, "learning_rate": 1.9198312275013012e-05, "loss": 22.5853, "step": 14290 }, { "epoch": 0.15, "learning_rate": 1.919693807873658e-05, "loss": 21.8238, "step": 14300 }, { "epoch": 0.15, "learning_rate": 1.9195562754961397e-05, "loss": 21.7567, "step": 14310 }, { "epoch": 0.15, "learning_rate": 1.919418630385607e-05, "loss": 22.121, "step": 14320 }, { "epoch": 0.15, "learning_rate": 1.9192808725589347e-05, "loss": 22.0632, "step": 14330 }, { "epoch": 0.16, "learning_rate": 1.9191430020330108e-05, "loss": 21.8293, "step": 14340 }, { "epoch": 0.16, "learning_rate": 1.919005018824738e-05, "loss": 21.4856, "step": 14350 }, { "epoch": 0.16, "learning_rate": 1.9188669229510326e-05, "loss": 22.2738, "step": 14360 }, { "epoch": 0.16, "learning_rate": 1.9187287144288237e-05, "loss": 22.1245, "step": 14370 }, { "epoch": 0.16, "learning_rate": 1.9185903932750554e-05, "loss": 22.6826, "step": 14380 }, { "epoch": 0.16, "learning_rate": 1.918451959506685e-05, "loss": 22.1524, "step": 14390 }, { "epoch": 0.16, "learning_rate": 1.9183134131406844e-05, "loss": 21.9896, "step": 14400 }, { "epoch": 0.16, "learning_rate": 1.918174754194038e-05, "loss": 22.3398, "step": 14410 }, { "epoch": 0.16, "learning_rate": 1.9180359826837447e-05, "loss": 21.7885, "step": 14420 }, { "epoch": 0.16, "learning_rate": 1.9178970986268174e-05, "loss": 22.2901, "step": 14430 }, { "epoch": 0.16, "learning_rate": 1.917758102040283e-05, "loss": 22.2567, "step": 14440 }, { "epoch": 0.16, "learning_rate": 1.9176189929411812e-05, "loss": 21.0745, "step": 14450 }, { "epoch": 0.16, "learning_rate": 1.917479771346566e-05, "loss": 22.2012, "step": 14460 }, { "epoch": 0.16, "learning_rate": 1.917340437273506e-05, "loss": 21.9074, "step": 14470 }, { "epoch": 0.16, "learning_rate": 1.9172009907390824e-05, "loss": 21.6554, "step": 14480 }, { "epoch": 0.16, "learning_rate": 1.91706143176039e-05, "loss": 22.099, "step": 14490 }, { "epoch": 0.16, "learning_rate": 1.9169217603545394e-05, "loss": 21.6328, "step": 14500 }, { "epoch": 0.16, "learning_rate": 1.9167819765386525e-05, "loss": 21.4619, "step": 14510 }, { "epoch": 0.16, "learning_rate": 1.916642080329867e-05, "loss": 22.5099, "step": 14520 }, { "epoch": 0.16, "learning_rate": 1.9165020717453324e-05, "loss": 22.3828, "step": 14530 }, { "epoch": 0.16, "learning_rate": 1.916361950802214e-05, "loss": 21.9368, "step": 14540 }, { "epoch": 0.16, "learning_rate": 1.9162217175176897e-05, "loss": 21.2966, "step": 14550 }, { "epoch": 0.16, "learning_rate": 1.9160813719089512e-05, "loss": 22.2416, "step": 14560 }, { "epoch": 0.16, "learning_rate": 1.9159409139932038e-05, "loss": 22.1403, "step": 14570 }, { "epoch": 0.16, "learning_rate": 1.9158003437876677e-05, "loss": 21.5092, "step": 14580 }, { "epoch": 0.16, "learning_rate": 1.915659661309576e-05, "loss": 20.9701, "step": 14590 }, { "epoch": 0.16, "learning_rate": 1.9155188665761754e-05, "loss": 21.7539, "step": 14600 }, { "epoch": 0.16, "learning_rate": 1.9153779596047265e-05, "loss": 22.665, "step": 14610 }, { "epoch": 0.16, "learning_rate": 1.915236940412504e-05, "loss": 22.1091, "step": 14620 }, { "epoch": 0.16, "learning_rate": 1.915095809016796e-05, "loss": 22.3068, "step": 14630 }, { "epoch": 0.16, "learning_rate": 1.9149545654349052e-05, "loss": 21.8533, "step": 14640 }, { "epoch": 0.16, "learning_rate": 1.9148132096841465e-05, "loss": 21.3122, "step": 14650 }, { "epoch": 0.16, "learning_rate": 1.9146717417818494e-05, "loss": 21.5557, "step": 14660 }, { "epoch": 0.16, "learning_rate": 1.9145301617453578e-05, "loss": 22.8459, "step": 14670 }, { "epoch": 0.16, "learning_rate": 1.914388469592028e-05, "loss": 22.4812, "step": 14680 }, { "epoch": 0.16, "learning_rate": 1.9142466653392317e-05, "loss": 21.8751, "step": 14690 }, { "epoch": 0.16, "learning_rate": 1.9141047490043526e-05, "loss": 21.7324, "step": 14700 }, { "epoch": 0.16, "learning_rate": 1.913962720604789e-05, "loss": 22.3547, "step": 14710 }, { "epoch": 0.16, "learning_rate": 1.9138205801579532e-05, "loss": 21.4679, "step": 14720 }, { "epoch": 0.16, "learning_rate": 1.9136783276812708e-05, "loss": 22.1951, "step": 14730 }, { "epoch": 0.16, "learning_rate": 1.9135359631921813e-05, "loss": 21.5995, "step": 14740 }, { "epoch": 0.16, "learning_rate": 1.9133934867081373e-05, "loss": 21.6364, "step": 14750 }, { "epoch": 0.16, "learning_rate": 1.9132508982466067e-05, "loss": 22.7368, "step": 14760 }, { "epoch": 0.16, "learning_rate": 1.9131081978250692e-05, "loss": 22.7352, "step": 14770 }, { "epoch": 0.16, "learning_rate": 1.9129653854610198e-05, "loss": 21.2708, "step": 14780 }, { "epoch": 0.16, "learning_rate": 1.9128224611719663e-05, "loss": 22.1265, "step": 14790 }, { "epoch": 0.16, "learning_rate": 1.9126794249754303e-05, "loss": 22.3297, "step": 14800 }, { "epoch": 0.16, "learning_rate": 1.912536276888948e-05, "loss": 21.9716, "step": 14810 }, { "epoch": 0.16, "learning_rate": 1.912393016930068e-05, "loss": 20.9555, "step": 14820 }, { "epoch": 0.16, "learning_rate": 1.9122496451163535e-05, "loss": 21.3165, "step": 14830 }, { "epoch": 0.16, "learning_rate": 1.912106161465381e-05, "loss": 21.4568, "step": 14840 }, { "epoch": 0.16, "learning_rate": 1.9119625659947416e-05, "loss": 22.4998, "step": 14850 }, { "epoch": 0.16, "learning_rate": 1.911818858722038e-05, "loss": 21.2246, "step": 14860 }, { "epoch": 0.16, "learning_rate": 1.911675039664889e-05, "loss": 21.5299, "step": 14870 }, { "epoch": 0.16, "learning_rate": 1.9115311088409264e-05, "loss": 21.7725, "step": 14880 }, { "epoch": 0.16, "learning_rate": 1.9113870662677945e-05, "loss": 21.5552, "step": 14890 }, { "epoch": 0.16, "learning_rate": 1.9112429119631528e-05, "loss": 21.9424, "step": 14900 }, { "epoch": 0.16, "learning_rate": 1.9110986459446736e-05, "loss": 22.1132, "step": 14910 }, { "epoch": 0.16, "learning_rate": 1.9109542682300433e-05, "loss": 21.8339, "step": 14920 }, { "epoch": 0.16, "learning_rate": 1.9108097788369623e-05, "loss": 21.8946, "step": 14930 }, { "epoch": 0.16, "learning_rate": 1.9106651777831433e-05, "loss": 21.8859, "step": 14940 }, { "epoch": 0.16, "learning_rate": 1.9105204650863145e-05, "loss": 22.7422, "step": 14950 }, { "epoch": 0.16, "learning_rate": 1.9103756407642166e-05, "loss": 21.2104, "step": 14960 }, { "epoch": 0.16, "learning_rate": 1.9102307048346046e-05, "loss": 21.4338, "step": 14970 }, { "epoch": 0.16, "learning_rate": 1.9100856573152465e-05, "loss": 21.24, "step": 14980 }, { "epoch": 0.16, "learning_rate": 1.909940498223925e-05, "loss": 21.3076, "step": 14990 }, { "epoch": 0.16, "learning_rate": 1.9097952275784354e-05, "loss": 22.0516, "step": 15000 }, { "epoch": 0.16, "learning_rate": 1.9096498453965872e-05, "loss": 22.3182, "step": 15010 }, { "epoch": 0.16, "learning_rate": 1.9095043516962036e-05, "loss": 21.7484, "step": 15020 }, { "epoch": 0.16, "learning_rate": 1.9093587464951215e-05, "loss": 21.6236, "step": 15030 }, { "epoch": 0.16, "learning_rate": 1.9092130298111913e-05, "loss": 22.543, "step": 15040 }, { "epoch": 0.16, "learning_rate": 1.909067201662277e-05, "loss": 21.431, "step": 15050 }, { "epoch": 0.16, "learning_rate": 1.908921262066257e-05, "loss": 21.6484, "step": 15060 }, { "epoch": 0.16, "learning_rate": 1.9087752110410222e-05, "loss": 20.9267, "step": 15070 }, { "epoch": 0.16, "learning_rate": 1.9086290486044774e-05, "loss": 22.1758, "step": 15080 }, { "epoch": 0.16, "learning_rate": 1.9084827747745423e-05, "loss": 21.3579, "step": 15090 }, { "epoch": 0.16, "learning_rate": 1.9083363895691483e-05, "loss": 22.0185, "step": 15100 }, { "epoch": 0.16, "learning_rate": 1.9081898930062426e-05, "loss": 21.9414, "step": 15110 }, { "epoch": 0.16, "learning_rate": 1.9080432851037843e-05, "loss": 21.3248, "step": 15120 }, { "epoch": 0.16, "learning_rate": 1.907896565879747e-05, "loss": 21.7169, "step": 15130 }, { "epoch": 0.16, "learning_rate": 1.9077497353521174e-05, "loss": 22.0128, "step": 15140 }, { "epoch": 0.16, "learning_rate": 1.9076027935388965e-05, "loss": 21.6743, "step": 15150 }, { "epoch": 0.16, "learning_rate": 1.9074557404580985e-05, "loss": 22.0101, "step": 15160 }, { "epoch": 0.16, "learning_rate": 1.907308576127752e-05, "loss": 20.5194, "step": 15170 }, { "epoch": 0.16, "learning_rate": 1.9071613005658974e-05, "loss": 21.9311, "step": 15180 }, { "epoch": 0.16, "learning_rate": 1.907013913790591e-05, "loss": 22.0604, "step": 15190 }, { "epoch": 0.16, "learning_rate": 1.9068664158199013e-05, "loss": 21.273, "step": 15200 }, { "epoch": 0.16, "learning_rate": 1.9067188066719105e-05, "loss": 21.0437, "step": 15210 }, { "epoch": 0.16, "learning_rate": 1.9065710863647153e-05, "loss": 21.3397, "step": 15220 }, { "epoch": 0.16, "learning_rate": 1.9064232549164254e-05, "loss": 21.1972, "step": 15230 }, { "epoch": 0.16, "learning_rate": 1.9062753123451635e-05, "loss": 21.157, "step": 15240 }, { "epoch": 0.16, "learning_rate": 1.906127258669068e-05, "loss": 21.5573, "step": 15250 }, { "epoch": 0.16, "learning_rate": 1.905979093906288e-05, "loss": 21.4018, "step": 15260 }, { "epoch": 0.17, "learning_rate": 1.9058308180749884e-05, "loss": 21.1428, "step": 15270 }, { "epoch": 0.17, "learning_rate": 1.9056824311933475e-05, "loss": 22.3828, "step": 15280 }, { "epoch": 0.17, "learning_rate": 1.9055339332795562e-05, "loss": 22.0464, "step": 15290 }, { "epoch": 0.17, "learning_rate": 1.90538532435182e-05, "loss": 21.5462, "step": 15300 }, { "epoch": 0.17, "learning_rate": 1.9052366044283575e-05, "loss": 21.5637, "step": 15310 }, { "epoch": 0.17, "learning_rate": 1.905087773527401e-05, "loss": 21.8524, "step": 15320 }, { "epoch": 0.17, "learning_rate": 1.9049388316671963e-05, "loss": 21.1988, "step": 15330 }, { "epoch": 0.17, "learning_rate": 1.9047897788660027e-05, "loss": 21.8529, "step": 15340 }, { "epoch": 0.17, "learning_rate": 1.904640615142094e-05, "loss": 22.3029, "step": 15350 }, { "epoch": 0.17, "learning_rate": 1.9044913405137566e-05, "loss": 22.1127, "step": 15360 }, { "epoch": 0.17, "learning_rate": 1.9043419549992906e-05, "loss": 22.0096, "step": 15370 }, { "epoch": 0.17, "learning_rate": 1.9041924586170103e-05, "loss": 21.7423, "step": 15380 }, { "epoch": 0.17, "learning_rate": 1.904042851385243e-05, "loss": 21.8053, "step": 15390 }, { "epoch": 0.17, "learning_rate": 1.90389313332233e-05, "loss": 22.0465, "step": 15400 }, { "epoch": 0.17, "learning_rate": 1.9037433044466254e-05, "loss": 21.4949, "step": 15410 }, { "epoch": 0.17, "learning_rate": 1.9035933647764982e-05, "loss": 21.661, "step": 15420 }, { "epoch": 0.17, "learning_rate": 1.90344331433033e-05, "loss": 22.6284, "step": 15430 }, { "epoch": 0.17, "learning_rate": 1.903293153126516e-05, "loss": 21.886, "step": 15440 }, { "epoch": 0.17, "learning_rate": 1.9031428811834654e-05, "loss": 21.9171, "step": 15450 }, { "epoch": 0.17, "learning_rate": 1.9029924985196013e-05, "loss": 22.0071, "step": 15460 }, { "epoch": 0.17, "learning_rate": 1.9028420051533586e-05, "loss": 21.7284, "step": 15470 }, { "epoch": 0.17, "learning_rate": 1.9026914011031883e-05, "loss": 21.951, "step": 15480 }, { "epoch": 0.17, "learning_rate": 1.9025406863875532e-05, "loss": 21.6439, "step": 15490 }, { "epoch": 0.17, "learning_rate": 1.9023898610249302e-05, "loss": 21.4667, "step": 15500 }, { "epoch": 0.17, "learning_rate": 1.9022389250338093e-05, "loss": 21.4147, "step": 15510 }, { "epoch": 0.17, "learning_rate": 1.9020878784326952e-05, "loss": 21.7661, "step": 15520 }, { "epoch": 0.17, "learning_rate": 1.9019367212401053e-05, "loss": 22.6995, "step": 15530 }, { "epoch": 0.17, "learning_rate": 1.9017854534745703e-05, "loss": 22.7859, "step": 15540 }, { "epoch": 0.17, "learning_rate": 1.9016340751546353e-05, "loss": 21.1097, "step": 15550 }, { "epoch": 0.17, "learning_rate": 1.9014825862988583e-05, "loss": 22.1347, "step": 15560 }, { "epoch": 0.17, "learning_rate": 1.9013309869258114e-05, "loss": 21.86, "step": 15570 }, { "epoch": 0.17, "learning_rate": 1.9011792770540795e-05, "loss": 21.6789, "step": 15580 }, { "epoch": 0.17, "learning_rate": 1.9010274567022617e-05, "loss": 21.8493, "step": 15590 }, { "epoch": 0.17, "learning_rate": 1.9008755258889705e-05, "loss": 22.0162, "step": 15600 }, { "epoch": 0.17, "learning_rate": 1.9007234846328314e-05, "loss": 22.1278, "step": 15610 }, { "epoch": 0.17, "learning_rate": 1.9005713329524845e-05, "loss": 21.2093, "step": 15620 }, { "epoch": 0.17, "learning_rate": 1.900419070866583e-05, "loss": 20.6947, "step": 15630 }, { "epoch": 0.17, "learning_rate": 1.9002666983937924e-05, "loss": 22.0572, "step": 15640 }, { "epoch": 0.17, "learning_rate": 1.900114215552794e-05, "loss": 21.7976, "step": 15650 }, { "epoch": 0.17, "learning_rate": 1.8999616223622807e-05, "loss": 21.632, "step": 15660 }, { "epoch": 0.17, "learning_rate": 1.8998089188409598e-05, "loss": 22.3204, "step": 15670 }, { "epoch": 0.17, "learning_rate": 1.899656105007552e-05, "loss": 22.384, "step": 15680 }, { "epoch": 0.17, "learning_rate": 1.8995031808807914e-05, "loss": 22.6176, "step": 15690 }, { "epoch": 0.17, "learning_rate": 1.8993501464794263e-05, "loss": 22.0513, "step": 15700 }, { "epoch": 0.17, "learning_rate": 1.8991970018222177e-05, "loss": 21.686, "step": 15710 }, { "epoch": 0.17, "learning_rate": 1.89904374692794e-05, "loss": 22.0433, "step": 15720 }, { "epoch": 0.17, "learning_rate": 1.8988903818153815e-05, "loss": 21.7724, "step": 15730 }, { "epoch": 0.17, "learning_rate": 1.8987369065033444e-05, "loss": 22.319, "step": 15740 }, { "epoch": 0.17, "learning_rate": 1.898583321010644e-05, "loss": 21.6863, "step": 15750 }, { "epoch": 0.17, "learning_rate": 1.8984296253561084e-05, "loss": 21.8567, "step": 15760 }, { "epoch": 0.17, "learning_rate": 1.8982758195585812e-05, "loss": 21.292, "step": 15770 }, { "epoch": 0.17, "learning_rate": 1.8981219036369168e-05, "loss": 21.8585, "step": 15780 }, { "epoch": 0.17, "learning_rate": 1.8979678776099857e-05, "loss": 21.6539, "step": 15790 }, { "epoch": 0.17, "learning_rate": 1.89781374149667e-05, "loss": 22.0586, "step": 15800 }, { "epoch": 0.17, "learning_rate": 1.897659495315866e-05, "loss": 21.8487, "step": 15810 }, { "epoch": 0.17, "learning_rate": 1.8975051390864844e-05, "loss": 21.2266, "step": 15820 }, { "epoch": 0.17, "learning_rate": 1.8973506728274473e-05, "loss": 21.4615, "step": 15830 }, { "epoch": 0.17, "learning_rate": 1.8971960965576924e-05, "loss": 22.0857, "step": 15840 }, { "epoch": 0.17, "learning_rate": 1.8970414102961695e-05, "loss": 22.0633, "step": 15850 }, { "epoch": 0.17, "learning_rate": 1.8968866140618424e-05, "loss": 21.9137, "step": 15860 }, { "epoch": 0.17, "learning_rate": 1.8967317078736886e-05, "loss": 22.6371, "step": 15870 }, { "epoch": 0.17, "learning_rate": 1.8965766917506987e-05, "loss": 22.2654, "step": 15880 }, { "epoch": 0.17, "learning_rate": 1.896421565711877e-05, "loss": 22.5286, "step": 15890 }, { "epoch": 0.17, "learning_rate": 1.896266329776241e-05, "loss": 21.6936, "step": 15900 }, { "epoch": 0.17, "learning_rate": 1.8961109839628217e-05, "loss": 22.3249, "step": 15910 }, { "epoch": 0.17, "learning_rate": 1.895955528290664e-05, "loss": 22.5574, "step": 15920 }, { "epoch": 0.17, "learning_rate": 1.8957999627788258e-05, "loss": 21.755, "step": 15930 }, { "epoch": 0.17, "learning_rate": 1.8956442874463793e-05, "loss": 22.1753, "step": 15940 }, { "epoch": 0.17, "learning_rate": 1.8954885023124087e-05, "loss": 21.3314, "step": 15950 }, { "epoch": 0.17, "learning_rate": 1.8953326073960127e-05, "loss": 21.7631, "step": 15960 }, { "epoch": 0.17, "learning_rate": 1.895176602716303e-05, "loss": 22.3507, "step": 15970 }, { "epoch": 0.17, "learning_rate": 1.895020488292406e-05, "loss": 21.7058, "step": 15980 }, { "epoch": 0.17, "learning_rate": 1.8948642641434593e-05, "loss": 20.8323, "step": 15990 }, { "epoch": 0.17, "learning_rate": 1.894707930288616e-05, "loss": 21.8317, "step": 16000 }, { "epoch": 0.17, "learning_rate": 1.8945514867470417e-05, "loss": 22.776, "step": 16010 }, { "epoch": 0.17, "learning_rate": 1.8943949335379156e-05, "loss": 21.5213, "step": 16020 }, { "epoch": 0.17, "learning_rate": 1.89423827068043e-05, "loss": 21.6592, "step": 16030 }, { "epoch": 0.17, "learning_rate": 1.8940814981937915e-05, "loss": 21.5747, "step": 16040 }, { "epoch": 0.17, "learning_rate": 1.893924616097219e-05, "loss": 21.5326, "step": 16050 }, { "epoch": 0.17, "learning_rate": 1.893767624409946e-05, "loss": 22.0532, "step": 16060 }, { "epoch": 0.17, "learning_rate": 1.8936105231512187e-05, "loss": 22.1806, "step": 16070 }, { "epoch": 0.17, "learning_rate": 1.8934533123402973e-05, "loss": 21.5076, "step": 16080 }, { "epoch": 0.17, "learning_rate": 1.8932959919964545e-05, "loss": 21.3723, "step": 16090 }, { "epoch": 0.17, "learning_rate": 1.8931385621389772e-05, "loss": 22.3, "step": 16100 }, { "epoch": 0.17, "learning_rate": 1.8929810227871653e-05, "loss": 21.1189, "step": 16110 }, { "epoch": 0.17, "learning_rate": 1.892823373960333e-05, "loss": 21.3885, "step": 16120 }, { "epoch": 0.17, "learning_rate": 1.8926656156778066e-05, "loss": 22.3943, "step": 16130 }, { "epoch": 0.17, "learning_rate": 1.8925077479589265e-05, "loss": 22.405, "step": 16140 }, { "epoch": 0.17, "learning_rate": 1.8923497708230472e-05, "loss": 21.1903, "step": 16150 }, { "epoch": 0.17, "learning_rate": 1.892191684289535e-05, "loss": 21.6829, "step": 16160 }, { "epoch": 0.17, "learning_rate": 1.892033488377771e-05, "loss": 20.9528, "step": 16170 }, { "epoch": 0.17, "learning_rate": 1.8918751831071494e-05, "loss": 21.7559, "step": 16180 }, { "epoch": 0.18, "learning_rate": 1.891716768497077e-05, "loss": 22.0877, "step": 16190 }, { "epoch": 0.18, "learning_rate": 1.8915582445669756e-05, "loss": 21.7176, "step": 16200 }, { "epoch": 0.18, "learning_rate": 1.8913996113362784e-05, "loss": 22.3533, "step": 16210 }, { "epoch": 0.18, "learning_rate": 1.8912408688244337e-05, "loss": 22.1847, "step": 16220 }, { "epoch": 0.18, "learning_rate": 1.891082017050902e-05, "loss": 21.9082, "step": 16230 }, { "epoch": 0.18, "learning_rate": 1.8909230560351587e-05, "loss": 20.8943, "step": 16240 }, { "epoch": 0.18, "learning_rate": 1.8907639857966908e-05, "loss": 21.9652, "step": 16250 }, { "epoch": 0.18, "learning_rate": 1.8906048063549995e-05, "loss": 22.2644, "step": 16260 }, { "epoch": 0.18, "learning_rate": 1.8904455177296002e-05, "loss": 22.1988, "step": 16270 }, { "epoch": 0.18, "learning_rate": 1.89028611994002e-05, "loss": 22.0075, "step": 16280 }, { "epoch": 0.18, "learning_rate": 1.8901266130058004e-05, "loss": 22.1186, "step": 16290 }, { "epoch": 0.18, "learning_rate": 1.889966996946497e-05, "loss": 21.1987, "step": 16300 }, { "epoch": 0.18, "learning_rate": 1.8898072717816768e-05, "loss": 21.7228, "step": 16310 }, { "epoch": 0.18, "learning_rate": 1.889647437530922e-05, "loss": 21.3683, "step": 16320 }, { "epoch": 0.18, "learning_rate": 1.8894874942138274e-05, "loss": 21.1217, "step": 16330 }, { "epoch": 0.18, "learning_rate": 1.889327441850001e-05, "loss": 22.2941, "step": 16340 }, { "epoch": 0.18, "learning_rate": 1.889167280459064e-05, "loss": 21.2716, "step": 16350 }, { "epoch": 0.18, "learning_rate": 1.8890070100606527e-05, "loss": 21.0411, "step": 16360 }, { "epoch": 0.18, "learning_rate": 1.8888466306744146e-05, "loss": 21.5375, "step": 16370 }, { "epoch": 0.18, "learning_rate": 1.8886861423200117e-05, "loss": 22.1357, "step": 16380 }, { "epoch": 0.18, "learning_rate": 1.8885255450171185e-05, "loss": 22.0486, "step": 16390 }, { "epoch": 0.18, "learning_rate": 1.888364838785424e-05, "loss": 22.1862, "step": 16400 }, { "epoch": 0.18, "learning_rate": 1.88820402364463e-05, "loss": 21.3314, "step": 16410 }, { "epoch": 0.18, "learning_rate": 1.888043099614451e-05, "loss": 21.4242, "step": 16420 }, { "epoch": 0.18, "learning_rate": 1.8878820667146162e-05, "loss": 21.8653, "step": 16430 }, { "epoch": 0.18, "learning_rate": 1.887720924964867e-05, "loss": 21.9226, "step": 16440 }, { "epoch": 0.18, "learning_rate": 1.887559674384959e-05, "loss": 21.6349, "step": 16450 }, { "epoch": 0.18, "learning_rate": 1.8873983149946603e-05, "loss": 21.8909, "step": 16460 }, { "epoch": 0.18, "learning_rate": 1.887236846813753e-05, "loss": 22.0394, "step": 16470 }, { "epoch": 0.18, "learning_rate": 1.887075269862032e-05, "loss": 21.8827, "step": 16480 }, { "epoch": 0.18, "learning_rate": 1.8869135841593062e-05, "loss": 22.7855, "step": 16490 }, { "epoch": 0.18, "learning_rate": 1.8867517897253973e-05, "loss": 22.0345, "step": 16500 }, { "epoch": 0.18, "learning_rate": 1.8865898865801405e-05, "loss": 21.6459, "step": 16510 }, { "epoch": 0.18, "learning_rate": 1.886427874743384e-05, "loss": 21.8632, "step": 16520 }, { "epoch": 0.18, "learning_rate": 1.8862657542349904e-05, "loss": 22.0156, "step": 16530 }, { "epoch": 0.18, "learning_rate": 1.8861035250748343e-05, "loss": 20.7115, "step": 16540 }, { "epoch": 0.18, "learning_rate": 1.885941187282804e-05, "loss": 22.5052, "step": 16550 }, { "epoch": 0.18, "learning_rate": 1.8857787408788016e-05, "loss": 21.1464, "step": 16560 }, { "epoch": 0.18, "learning_rate": 1.8856161858827428e-05, "loss": 22.0984, "step": 16570 }, { "epoch": 0.18, "learning_rate": 1.885453522314555e-05, "loss": 21.6418, "step": 16580 }, { "epoch": 0.18, "learning_rate": 1.88529075019418e-05, "loss": 22.2668, "step": 16590 }, { "epoch": 0.18, "learning_rate": 1.885127869541574e-05, "loss": 21.4323, "step": 16600 }, { "epoch": 0.18, "learning_rate": 1.884964880376704e-05, "loss": 22.1834, "step": 16610 }, { "epoch": 0.18, "learning_rate": 1.8848017827195527e-05, "loss": 21.1641, "step": 16620 }, { "epoch": 0.18, "learning_rate": 1.8846385765901145e-05, "loss": 21.8756, "step": 16630 }, { "epoch": 0.18, "learning_rate": 1.884475262008398e-05, "loss": 21.7751, "step": 16640 }, { "epoch": 0.18, "learning_rate": 1.8843118389944243e-05, "loss": 21.4135, "step": 16650 }, { "epoch": 0.18, "learning_rate": 1.884148307568228e-05, "loss": 22.1639, "step": 16660 }, { "epoch": 0.18, "learning_rate": 1.8839846677498582e-05, "loss": 21.6687, "step": 16670 }, { "epoch": 0.18, "learning_rate": 1.8838209195593758e-05, "loss": 21.2557, "step": 16680 }, { "epoch": 0.18, "learning_rate": 1.883657063016856e-05, "loss": 21.8679, "step": 16690 }, { "epoch": 0.18, "learning_rate": 1.8834930981423856e-05, "loss": 21.9365, "step": 16700 }, { "epoch": 0.18, "learning_rate": 1.883329024956067e-05, "loss": 22.2679, "step": 16710 }, { "epoch": 0.18, "learning_rate": 1.883164843478014e-05, "loss": 21.4195, "step": 16720 }, { "epoch": 0.18, "learning_rate": 1.8830005537283554e-05, "loss": 21.6569, "step": 16730 }, { "epoch": 0.18, "learning_rate": 1.882836155727231e-05, "loss": 21.706, "step": 16740 }, { "epoch": 0.18, "learning_rate": 1.8826716494947966e-05, "loss": 22.0266, "step": 16750 }, { "epoch": 0.18, "learning_rate": 1.8825070350512186e-05, "loss": 21.4908, "step": 16760 }, { "epoch": 0.18, "learning_rate": 1.882342312416679e-05, "loss": 22.1422, "step": 16770 }, { "epoch": 0.18, "learning_rate": 1.882177481611371e-05, "loss": 21.553, "step": 16780 }, { "epoch": 0.18, "learning_rate": 1.8820125426555023e-05, "loss": 21.7424, "step": 16790 }, { "epoch": 0.18, "learning_rate": 1.8818474955692938e-05, "loss": 21.3323, "step": 16800 }, { "epoch": 0.18, "learning_rate": 1.88168234037298e-05, "loss": 22.5376, "step": 16810 }, { "epoch": 0.18, "learning_rate": 1.8815170770868067e-05, "loss": 21.6833, "step": 16820 }, { "epoch": 0.18, "learning_rate": 1.8813517057310356e-05, "loss": 21.3101, "step": 16830 }, { "epoch": 0.18, "learning_rate": 1.8811862263259396e-05, "loss": 21.4315, "step": 16840 }, { "epoch": 0.18, "learning_rate": 1.8810206388918066e-05, "loss": 21.8277, "step": 16850 }, { "epoch": 0.18, "learning_rate": 1.8808549434489357e-05, "loss": 21.9913, "step": 16860 }, { "epoch": 0.18, "learning_rate": 1.880689140017641e-05, "loss": 21.2873, "step": 16870 }, { "epoch": 0.18, "learning_rate": 1.880523228618249e-05, "loss": 22.0649, "step": 16880 }, { "epoch": 0.18, "learning_rate": 1.8803572092710993e-05, "loss": 22.171, "step": 16890 }, { "epoch": 0.18, "learning_rate": 1.8801910819965458e-05, "loss": 22.357, "step": 16900 }, { "epoch": 0.18, "learning_rate": 1.8800248468149545e-05, "loss": 20.9164, "step": 16910 }, { "epoch": 0.18, "learning_rate": 1.8798585037467044e-05, "loss": 22.3284, "step": 16920 }, { "epoch": 0.18, "learning_rate": 1.8796920528121893e-05, "loss": 21.2707, "step": 16930 }, { "epoch": 0.18, "learning_rate": 1.879525494031815e-05, "loss": 21.4135, "step": 16940 }, { "epoch": 0.18, "learning_rate": 1.879358827426e-05, "loss": 21.4025, "step": 16950 }, { "epoch": 0.18, "learning_rate": 1.879192053015178e-05, "loss": 21.9709, "step": 16960 }, { "epoch": 0.18, "learning_rate": 1.8790251708197936e-05, "loss": 21.3558, "step": 16970 }, { "epoch": 0.18, "learning_rate": 1.8788581808603065e-05, "loss": 22.1342, "step": 16980 }, { "epoch": 0.18, "learning_rate": 1.8786910831571888e-05, "loss": 22.4351, "step": 16990 }, { "epoch": 0.18, "learning_rate": 1.8785238777309252e-05, "loss": 21.6443, "step": 17000 }, { "epoch": 0.18, "learning_rate": 1.878356564602015e-05, "loss": 21.6205, "step": 17010 }, { "epoch": 0.18, "learning_rate": 1.878189143790969e-05, "loss": 21.6231, "step": 17020 }, { "epoch": 0.18, "learning_rate": 1.8780216153183134e-05, "loss": 21.6246, "step": 17030 }, { "epoch": 0.18, "learning_rate": 1.8778539792045855e-05, "loss": 21.8528, "step": 17040 }, { "epoch": 0.18, "learning_rate": 1.877686235470337e-05, "loss": 20.9318, "step": 17050 }, { "epoch": 0.18, "learning_rate": 1.8775183841361323e-05, "loss": 21.347, "step": 17060 }, { "epoch": 0.18, "learning_rate": 1.8773504252225493e-05, "loss": 21.3865, "step": 17070 }, { "epoch": 0.18, "learning_rate": 1.8771823587501786e-05, "loss": 21.7958, "step": 17080 }, { "epoch": 0.18, "learning_rate": 1.8770141847396244e-05, "loss": 21.4027, "step": 17090 }, { "epoch": 0.18, "learning_rate": 1.8768459032115044e-05, "loss": 21.5479, "step": 17100 }, { "epoch": 0.18, "learning_rate": 1.8766775141864486e-05, "loss": 21.5071, "step": 17110 }, { "epoch": 0.19, "learning_rate": 1.8765090176851006e-05, "loss": 20.9904, "step": 17120 }, { "epoch": 0.19, "learning_rate": 1.876340413728118e-05, "loss": 21.8917, "step": 17130 }, { "epoch": 0.19, "learning_rate": 1.8761717023361697e-05, "loss": 21.2484, "step": 17140 }, { "epoch": 0.19, "learning_rate": 1.8760028835299396e-05, "loss": 21.5471, "step": 17150 }, { "epoch": 0.19, "learning_rate": 1.8758339573301243e-05, "loss": 22.0348, "step": 17160 }, { "epoch": 0.19, "learning_rate": 1.8756649237574324e-05, "loss": 22.3823, "step": 17170 }, { "epoch": 0.19, "learning_rate": 1.8754957828325874e-05, "loss": 21.4398, "step": 17180 }, { "epoch": 0.19, "learning_rate": 1.8753265345763247e-05, "loss": 21.6374, "step": 17190 }, { "epoch": 0.19, "learning_rate": 1.8751571790093935e-05, "loss": 21.5531, "step": 17200 }, { "epoch": 0.19, "learning_rate": 1.8749877161525556e-05, "loss": 21.1573, "step": 17210 }, { "epoch": 0.19, "learning_rate": 1.8748181460265865e-05, "loss": 21.6817, "step": 17220 }, { "epoch": 0.19, "learning_rate": 1.874648468652275e-05, "loss": 21.7072, "step": 17230 }, { "epoch": 0.19, "learning_rate": 1.874478684050422e-05, "loss": 21.9041, "step": 17240 }, { "epoch": 0.19, "learning_rate": 1.874308792241843e-05, "loss": 21.8259, "step": 17250 }, { "epoch": 0.19, "learning_rate": 1.8741387932473653e-05, "loss": 22.2305, "step": 17260 }, { "epoch": 0.19, "learning_rate": 1.8739686870878305e-05, "loss": 21.5746, "step": 17270 }, { "epoch": 0.19, "learning_rate": 1.873798473784092e-05, "loss": 21.5452, "step": 17280 }, { "epoch": 0.19, "learning_rate": 1.8736281533570174e-05, "loss": 21.883, "step": 17290 }, { "epoch": 0.19, "learning_rate": 1.8734577258274876e-05, "loss": 22.0126, "step": 17300 }, { "epoch": 0.19, "learning_rate": 1.8732871912163962e-05, "loss": 22.4054, "step": 17310 }, { "epoch": 0.19, "learning_rate": 1.873116549544649e-05, "loss": 21.4391, "step": 17320 }, { "epoch": 0.19, "learning_rate": 1.8729458008331666e-05, "loss": 21.1205, "step": 17330 }, { "epoch": 0.19, "learning_rate": 1.8727749451028813e-05, "loss": 22.0367, "step": 17340 }, { "epoch": 0.19, "learning_rate": 1.8726039823747398e-05, "loss": 21.9425, "step": 17350 }, { "epoch": 0.19, "learning_rate": 1.8724329126697012e-05, "loss": 21.9896, "step": 17360 }, { "epoch": 0.19, "learning_rate": 1.8722617360087373e-05, "loss": 22.0091, "step": 17370 }, { "epoch": 0.19, "learning_rate": 1.872090452412834e-05, "loss": 21.9621, "step": 17380 }, { "epoch": 0.19, "learning_rate": 1.8719190619029897e-05, "loss": 21.7843, "step": 17390 }, { "epoch": 0.19, "learning_rate": 1.8717475645002155e-05, "loss": 20.5973, "step": 17400 }, { "epoch": 0.19, "learning_rate": 1.871575960225537e-05, "loss": 21.9335, "step": 17410 }, { "epoch": 0.19, "learning_rate": 1.8714042490999916e-05, "loss": 21.8607, "step": 17420 }, { "epoch": 0.19, "learning_rate": 1.8712324311446303e-05, "loss": 21.5724, "step": 17430 }, { "epoch": 0.19, "learning_rate": 1.8710605063805166e-05, "loss": 21.5052, "step": 17440 }, { "epoch": 0.19, "learning_rate": 1.8708884748287282e-05, "loss": 22.1845, "step": 17450 }, { "epoch": 0.19, "learning_rate": 1.870716336510356e-05, "loss": 22.0751, "step": 17460 }, { "epoch": 0.19, "learning_rate": 1.8705440914465015e-05, "loss": 22.8332, "step": 17470 }, { "epoch": 0.19, "learning_rate": 1.8703717396582827e-05, "loss": 21.74, "step": 17480 }, { "epoch": 0.19, "learning_rate": 1.870199281166828e-05, "loss": 21.5671, "step": 17490 }, { "epoch": 0.19, "learning_rate": 1.8700267159932805e-05, "loss": 21.9133, "step": 17500 }, { "epoch": 0.19, "learning_rate": 1.869854044158796e-05, "loss": 22.3862, "step": 17510 }, { "epoch": 0.19, "learning_rate": 1.8696812656845427e-05, "loss": 21.0076, "step": 17520 }, { "epoch": 0.19, "learning_rate": 1.8695083805917026e-05, "loss": 21.9821, "step": 17530 }, { "epoch": 0.19, "learning_rate": 1.8693353889014707e-05, "loss": 21.1318, "step": 17540 }, { "epoch": 0.19, "learning_rate": 1.8691622906350545e-05, "loss": 22.464, "step": 17550 }, { "epoch": 0.19, "learning_rate": 1.8689890858136758e-05, "loss": 22.0934, "step": 17560 }, { "epoch": 0.19, "learning_rate": 1.868815774458568e-05, "loss": 22.2237, "step": 17570 }, { "epoch": 0.19, "learning_rate": 1.8686423565909777e-05, "loss": 20.7449, "step": 17580 }, { "epoch": 0.19, "learning_rate": 1.868468832232166e-05, "loss": 21.6891, "step": 17590 }, { "epoch": 0.19, "learning_rate": 1.8682952014034058e-05, "loss": 21.5845, "step": 17600 }, { "epoch": 0.19, "learning_rate": 1.8681214641259837e-05, "loss": 21.8538, "step": 17610 }, { "epoch": 0.19, "learning_rate": 1.8679476204211987e-05, "loss": 21.7309, "step": 17620 }, { "epoch": 0.19, "learning_rate": 1.867773670310363e-05, "loss": 21.7328, "step": 17630 }, { "epoch": 0.19, "learning_rate": 1.867599613814802e-05, "loss": 21.3884, "step": 17640 }, { "epoch": 0.19, "learning_rate": 1.8674254509558544e-05, "loss": 22.4058, "step": 17650 }, { "epoch": 0.19, "learning_rate": 1.8672511817548718e-05, "loss": 21.8941, "step": 17660 }, { "epoch": 0.19, "learning_rate": 1.8670768062332186e-05, "loss": 22.0546, "step": 17670 }, { "epoch": 0.19, "learning_rate": 1.8669023244122725e-05, "loss": 22.0508, "step": 17680 }, { "epoch": 0.19, "learning_rate": 1.8667277363134236e-05, "loss": 21.7473, "step": 17690 }, { "epoch": 0.19, "learning_rate": 1.866553041958076e-05, "loss": 22.4437, "step": 17700 }, { "epoch": 0.19, "learning_rate": 1.8663782413676465e-05, "loss": 21.7213, "step": 17710 }, { "epoch": 0.19, "learning_rate": 1.8662033345635642e-05, "loss": 21.7555, "step": 17720 }, { "epoch": 0.19, "learning_rate": 1.866028321567272e-05, "loss": 21.4408, "step": 17730 }, { "epoch": 0.19, "learning_rate": 1.865853202400226e-05, "loss": 21.7734, "step": 17740 }, { "epoch": 0.19, "learning_rate": 1.865677977083895e-05, "loss": 22.2942, "step": 17750 }, { "epoch": 0.19, "learning_rate": 1.86550264563976e-05, "loss": 21.2371, "step": 17760 }, { "epoch": 0.19, "learning_rate": 1.8653272080893164e-05, "loss": 20.783, "step": 17770 }, { "epoch": 0.19, "learning_rate": 1.8651516644540715e-05, "loss": 21.9172, "step": 17780 }, { "epoch": 0.19, "learning_rate": 1.8649760147555467e-05, "loss": 21.8432, "step": 17790 }, { "epoch": 0.19, "learning_rate": 1.864800259015275e-05, "loss": 21.5769, "step": 17800 }, { "epoch": 0.19, "learning_rate": 1.864624397254804e-05, "loss": 21.8888, "step": 17810 }, { "epoch": 0.19, "learning_rate": 1.8644484294956927e-05, "loss": 21.8927, "step": 17820 }, { "epoch": 0.19, "learning_rate": 1.8642723557595145e-05, "loss": 22.1007, "step": 17830 }, { "epoch": 0.19, "learning_rate": 1.8640961760678548e-05, "loss": 21.3709, "step": 17840 }, { "epoch": 0.19, "learning_rate": 1.8639198904423123e-05, "loss": 21.7149, "step": 17850 }, { "epoch": 0.19, "learning_rate": 1.8637434989044992e-05, "loss": 21.762, "step": 17860 }, { "epoch": 0.19, "learning_rate": 1.8635670014760396e-05, "loss": 21.4368, "step": 17870 }, { "epoch": 0.19, "learning_rate": 1.8633903981785717e-05, "loss": 21.9028, "step": 17880 }, { "epoch": 0.19, "learning_rate": 1.863213689033746e-05, "loss": 21.0169, "step": 17890 }, { "epoch": 0.19, "learning_rate": 1.863036874063226e-05, "loss": 22.4509, "step": 17900 }, { "epoch": 0.19, "learning_rate": 1.862859953288689e-05, "loss": 22.0139, "step": 17910 }, { "epoch": 0.19, "learning_rate": 1.8626829267318233e-05, "loss": 21.9156, "step": 17920 }, { "epoch": 0.19, "learning_rate": 1.862505794414333e-05, "loss": 21.8073, "step": 17930 }, { "epoch": 0.19, "learning_rate": 1.8623285563579325e-05, "loss": 22.3224, "step": 17940 }, { "epoch": 0.19, "learning_rate": 1.862151212584351e-05, "loss": 21.9077, "step": 17950 }, { "epoch": 0.19, "learning_rate": 1.8619737631153294e-05, "loss": 20.9513, "step": 17960 }, { "epoch": 0.19, "learning_rate": 1.8617962079726224e-05, "loss": 21.8061, "step": 17970 }, { "epoch": 0.19, "learning_rate": 1.8616185471779976e-05, "loss": 21.5711, "step": 17980 }, { "epoch": 0.19, "learning_rate": 1.861440780753235e-05, "loss": 22.1056, "step": 17990 }, { "epoch": 0.19, "learning_rate": 1.861262908720128e-05, "loss": 21.6546, "step": 18000 }, { "epoch": 0.19, "learning_rate": 1.8610849311004825e-05, "loss": 21.0525, "step": 18010 }, { "epoch": 0.19, "learning_rate": 1.8609068479161182e-05, "loss": 21.6992, "step": 18020 }, { "epoch": 0.19, "learning_rate": 1.8607286591888672e-05, "loss": 21.518, "step": 18030 }, { "epoch": 0.2, "learning_rate": 1.8605503649405742e-05, "loss": 21.2503, "step": 18040 }, { "epoch": 0.2, "learning_rate": 1.860371965193097e-05, "loss": 21.6167, "step": 18050 }, { "epoch": 0.2, "learning_rate": 1.8601934599683072e-05, "loss": 21.6994, "step": 18060 }, { "epoch": 0.2, "learning_rate": 1.8600148492880882e-05, "loss": 22.2555, "step": 18070 }, { "epoch": 0.2, "learning_rate": 1.859836133174337e-05, "loss": 22.258, "step": 18080 }, { "epoch": 0.2, "learning_rate": 1.859657311648963e-05, "loss": 22.3695, "step": 18090 }, { "epoch": 0.2, "learning_rate": 1.859478384733889e-05, "loss": 21.8297, "step": 18100 }, { "epoch": 0.2, "learning_rate": 1.8592993524510503e-05, "loss": 21.5842, "step": 18110 }, { "epoch": 0.2, "learning_rate": 1.859120214822396e-05, "loss": 22.297, "step": 18120 }, { "epoch": 0.2, "learning_rate": 1.858940971869887e-05, "loss": 22.57, "step": 18130 }, { "epoch": 0.2, "learning_rate": 1.8587616236154976e-05, "loss": 21.6257, "step": 18140 }, { "epoch": 0.2, "learning_rate": 1.858582170081215e-05, "loss": 22.3653, "step": 18150 }, { "epoch": 0.2, "learning_rate": 1.8584026112890394e-05, "loss": 22.0813, "step": 18160 }, { "epoch": 0.2, "learning_rate": 1.858222947260984e-05, "loss": 22.0463, "step": 18170 }, { "epoch": 0.2, "learning_rate": 1.8580431780190746e-05, "loss": 21.749, "step": 18180 }, { "epoch": 0.2, "learning_rate": 1.8578633035853494e-05, "loss": 20.9348, "step": 18190 }, { "epoch": 0.2, "learning_rate": 1.8576833239818614e-05, "loss": 21.118, "step": 18200 }, { "epoch": 0.2, "learning_rate": 1.8575032392306737e-05, "loss": 20.8486, "step": 18210 }, { "epoch": 0.2, "learning_rate": 1.857323049353865e-05, "loss": 21.5787, "step": 18220 }, { "epoch": 0.2, "learning_rate": 1.857142754373525e-05, "loss": 21.7875, "step": 18230 }, { "epoch": 0.2, "learning_rate": 1.8569623543117572e-05, "loss": 21.6265, "step": 18240 }, { "epoch": 0.2, "learning_rate": 1.8567818491906776e-05, "loss": 21.6975, "step": 18250 }, { "epoch": 0.2, "learning_rate": 1.8566012390324157e-05, "loss": 21.8031, "step": 18260 }, { "epoch": 0.2, "learning_rate": 1.856420523859113e-05, "loss": 21.6681, "step": 18270 }, { "epoch": 0.2, "learning_rate": 1.856239703692924e-05, "loss": 21.4137, "step": 18280 }, { "epoch": 0.2, "learning_rate": 1.8560587785560172e-05, "loss": 22.2494, "step": 18290 }, { "epoch": 0.2, "learning_rate": 1.8558777484705723e-05, "loss": 21.3745, "step": 18300 }, { "epoch": 0.2, "learning_rate": 1.8556966134587832e-05, "loss": 21.4511, "step": 18310 }, { "epoch": 0.2, "learning_rate": 1.8555153735428557e-05, "loss": 21.7033, "step": 18320 }, { "epoch": 0.2, "learning_rate": 1.8553340287450094e-05, "loss": 22.3226, "step": 18330 }, { "epoch": 0.2, "learning_rate": 1.8551525790874756e-05, "loss": 21.5836, "step": 18340 }, { "epoch": 0.2, "learning_rate": 1.8549710245925e-05, "loss": 21.9935, "step": 18350 }, { "epoch": 0.2, "learning_rate": 1.8547893652823393e-05, "loss": 22.2192, "step": 18360 }, { "epoch": 0.2, "learning_rate": 1.854607601179265e-05, "loss": 22.1221, "step": 18370 }, { "epoch": 0.2, "learning_rate": 1.85442573230556e-05, "loss": 21.9498, "step": 18380 }, { "epoch": 0.2, "learning_rate": 1.8542437586835202e-05, "loss": 21.9799, "step": 18390 }, { "epoch": 0.2, "learning_rate": 1.8540616803354555e-05, "loss": 21.2428, "step": 18400 }, { "epoch": 0.2, "learning_rate": 1.853879497283687e-05, "loss": 21.8294, "step": 18410 }, { "epoch": 0.2, "learning_rate": 1.8536972095505495e-05, "loss": 21.4451, "step": 18420 }, { "epoch": 0.2, "learning_rate": 1.853514817158391e-05, "loss": 21.4909, "step": 18430 }, { "epoch": 0.2, "learning_rate": 1.853332320129572e-05, "loss": 21.5863, "step": 18440 }, { "epoch": 0.2, "learning_rate": 1.853149718486465e-05, "loss": 22.305, "step": 18450 }, { "epoch": 0.2, "learning_rate": 1.8529670122514565e-05, "loss": 20.7559, "step": 18460 }, { "epoch": 0.2, "learning_rate": 1.8527842014469458e-05, "loss": 21.7208, "step": 18470 }, { "epoch": 0.2, "learning_rate": 1.8526012860953434e-05, "loss": 22.0286, "step": 18480 }, { "epoch": 0.2, "learning_rate": 1.852418266219075e-05, "loss": 21.0303, "step": 18490 }, { "epoch": 0.2, "learning_rate": 1.8522351418405775e-05, "loss": 22.1548, "step": 18500 }, { "epoch": 0.2, "learning_rate": 1.852051912982301e-05, "loss": 21.7028, "step": 18510 }, { "epoch": 0.2, "learning_rate": 1.8518685796667082e-05, "loss": 21.219, "step": 18520 }, { "epoch": 0.2, "learning_rate": 1.8516851419162756e-05, "loss": 21.5217, "step": 18530 }, { "epoch": 0.2, "learning_rate": 1.851501599753491e-05, "loss": 21.672, "step": 18540 }, { "epoch": 0.2, "learning_rate": 1.8513179532008557e-05, "loss": 21.7698, "step": 18550 }, { "epoch": 0.2, "learning_rate": 1.8511342022808844e-05, "loss": 21.9277, "step": 18560 }, { "epoch": 0.2, "learning_rate": 1.8509503470161038e-05, "loss": 22.4089, "step": 18570 }, { "epoch": 0.2, "learning_rate": 1.8507663874290536e-05, "loss": 21.7121, "step": 18580 }, { "epoch": 0.2, "learning_rate": 1.8505823235422865e-05, "loss": 21.4816, "step": 18590 }, { "epoch": 0.2, "learning_rate": 1.8503981553783675e-05, "loss": 21.5491, "step": 18600 }, { "epoch": 0.2, "learning_rate": 1.850213882959875e-05, "loss": 20.6525, "step": 18610 }, { "epoch": 0.2, "learning_rate": 1.8500295063094e-05, "loss": 21.9444, "step": 18620 }, { "epoch": 0.2, "learning_rate": 1.8498450254495456e-05, "loss": 21.2833, "step": 18630 }, { "epoch": 0.2, "learning_rate": 1.8496604404029287e-05, "loss": 22.1879, "step": 18640 }, { "epoch": 0.2, "learning_rate": 1.849475751192178e-05, "loss": 21.1889, "step": 18650 }, { "epoch": 0.2, "learning_rate": 1.8492909578399364e-05, "loss": 22.2704, "step": 18660 }, { "epoch": 0.2, "learning_rate": 1.849106060368858e-05, "loss": 22.4585, "step": 18670 }, { "epoch": 0.2, "learning_rate": 1.8489210588016103e-05, "loss": 21.3447, "step": 18680 }, { "epoch": 0.2, "learning_rate": 1.8487359531608733e-05, "loss": 21.5423, "step": 18690 }, { "epoch": 0.2, "learning_rate": 1.848550743469341e-05, "loss": 21.3399, "step": 18700 }, { "epoch": 0.2, "learning_rate": 1.848365429749718e-05, "loss": 22.1346, "step": 18710 }, { "epoch": 0.2, "learning_rate": 1.8481800120247236e-05, "loss": 21.0806, "step": 18720 }, { "epoch": 0.2, "learning_rate": 1.847994490317089e-05, "loss": 20.9107, "step": 18730 }, { "epoch": 0.2, "learning_rate": 1.847808864649558e-05, "loss": 21.8126, "step": 18740 }, { "epoch": 0.2, "learning_rate": 1.847623135044888e-05, "loss": 22.0136, "step": 18750 }, { "epoch": 0.2, "learning_rate": 1.8474373015258472e-05, "loss": 21.5672, "step": 18760 }, { "epoch": 0.2, "learning_rate": 1.8472513641152193e-05, "loss": 20.9607, "step": 18770 }, { "epoch": 0.2, "learning_rate": 1.847065322835799e-05, "loss": 21.9338, "step": 18780 }, { "epoch": 0.2, "learning_rate": 1.846879177710393e-05, "loss": 22.514, "step": 18790 }, { "epoch": 0.2, "learning_rate": 1.8466929287618227e-05, "loss": 21.1946, "step": 18800 }, { "epoch": 0.2, "learning_rate": 1.846506576012921e-05, "loss": 21.9898, "step": 18810 }, { "epoch": 0.2, "learning_rate": 1.8463201194865346e-05, "loss": 21.9209, "step": 18820 }, { "epoch": 0.2, "learning_rate": 1.8461335592055208e-05, "loss": 21.3844, "step": 18830 }, { "epoch": 0.2, "learning_rate": 1.845946895192752e-05, "loss": 20.9434, "step": 18840 }, { "epoch": 0.2, "learning_rate": 1.8457601274711115e-05, "loss": 21.197, "step": 18850 }, { "epoch": 0.2, "learning_rate": 1.8455732560634968e-05, "loss": 22.4125, "step": 18860 }, { "epoch": 0.2, "learning_rate": 1.845386280992817e-05, "loss": 21.4456, "step": 18870 }, { "epoch": 0.2, "learning_rate": 1.8451992022819945e-05, "loss": 21.1316, "step": 18880 }, { "epoch": 0.2, "learning_rate": 1.8450120199539637e-05, "loss": 22.0226, "step": 18890 }, { "epoch": 0.2, "learning_rate": 1.844824734031673e-05, "loss": 21.7604, "step": 18900 }, { "epoch": 0.2, "learning_rate": 1.8446373445380823e-05, "loss": 22.2414, "step": 18910 }, { "epoch": 0.2, "learning_rate": 1.8444498514961643e-05, "loss": 21.2343, "step": 18920 }, { "epoch": 0.2, "learning_rate": 1.8442622549289057e-05, "loss": 21.2007, "step": 18930 }, { "epoch": 0.2, "learning_rate": 1.844074554859304e-05, "loss": 21.4496, "step": 18940 }, { "epoch": 0.2, "learning_rate": 1.8438867513103703e-05, "loss": 22.4, "step": 18950 }, { "epoch": 0.2, "learning_rate": 1.843698844305129e-05, "loss": 21.6881, "step": 18960 }, { "epoch": 0.21, "learning_rate": 1.8435108338666162e-05, "loss": 21.952, "step": 18970 }, { "epoch": 0.21, "learning_rate": 1.843322720017881e-05, "loss": 22.414, "step": 18980 }, { "epoch": 0.21, "learning_rate": 1.8431345027819856e-05, "loss": 21.0633, "step": 18990 }, { "epoch": 0.21, "learning_rate": 1.842946182182004e-05, "loss": 21.9881, "step": 19000 }, { "epoch": 0.21, "learning_rate": 1.8427577582410232e-05, "loss": 21.079, "step": 19010 }, { "epoch": 0.21, "learning_rate": 1.8425692309821433e-05, "loss": 21.3453, "step": 19020 }, { "epoch": 0.21, "learning_rate": 1.8423806004284775e-05, "loss": 22.2188, "step": 19030 }, { "epoch": 0.21, "learning_rate": 1.84219186660315e-05, "loss": 20.9958, "step": 19040 }, { "epoch": 0.21, "learning_rate": 1.842003029529299e-05, "loss": 22.465, "step": 19050 }, { "epoch": 0.21, "learning_rate": 1.8418140892300748e-05, "loss": 21.7157, "step": 19060 }, { "epoch": 0.21, "learning_rate": 1.8416250457286412e-05, "loss": 21.6897, "step": 19070 }, { "epoch": 0.21, "learning_rate": 1.841435899048173e-05, "loss": 20.9041, "step": 19080 }, { "epoch": 0.21, "learning_rate": 1.841246649211859e-05, "loss": 21.0802, "step": 19090 }, { "epoch": 0.21, "learning_rate": 1.841057296242901e-05, "loss": 21.8083, "step": 19100 }, { "epoch": 0.21, "learning_rate": 1.8408678401645116e-05, "loss": 22.3993, "step": 19110 }, { "epoch": 0.21, "learning_rate": 1.8406782809999178e-05, "loss": 21.5551, "step": 19120 }, { "epoch": 0.21, "learning_rate": 1.840488618772359e-05, "loss": 21.0453, "step": 19130 }, { "epoch": 0.21, "learning_rate": 1.840298853505086e-05, "loss": 21.3836, "step": 19140 }, { "epoch": 0.21, "learning_rate": 1.8401089852213633e-05, "loss": 22.011, "step": 19150 }, { "epoch": 0.21, "learning_rate": 1.839919013944468e-05, "loss": 21.7623, "step": 19160 }, { "epoch": 0.21, "learning_rate": 1.8397289396976896e-05, "loss": 21.3694, "step": 19170 }, { "epoch": 0.21, "learning_rate": 1.8395387625043306e-05, "loss": 20.9465, "step": 19180 }, { "epoch": 0.21, "learning_rate": 1.839348482387705e-05, "loss": 21.0565, "step": 19190 }, { "epoch": 0.21, "learning_rate": 1.8391580993711407e-05, "loss": 21.3783, "step": 19200 }, { "epoch": 0.21, "learning_rate": 1.8389676134779776e-05, "loss": 22.3651, "step": 19210 }, { "epoch": 0.21, "learning_rate": 1.8387770247315685e-05, "loss": 21.6987, "step": 19220 }, { "epoch": 0.21, "learning_rate": 1.838586333155278e-05, "loss": 21.6645, "step": 19230 }, { "epoch": 0.21, "learning_rate": 1.8383955387724848e-05, "loss": 21.8754, "step": 19240 }, { "epoch": 0.21, "learning_rate": 1.838204641606579e-05, "loss": 21.4504, "step": 19250 }, { "epoch": 0.21, "learning_rate": 1.8380136416809632e-05, "loss": 22.1279, "step": 19260 }, { "epoch": 0.21, "learning_rate": 1.8378225390190536e-05, "loss": 21.8773, "step": 19270 }, { "epoch": 0.21, "learning_rate": 1.8376313336442785e-05, "loss": 21.6637, "step": 19280 }, { "epoch": 0.21, "learning_rate": 1.837440025580078e-05, "loss": 22.1922, "step": 19290 }, { "epoch": 0.21, "learning_rate": 1.8372486148499064e-05, "loss": 21.727, "step": 19300 }, { "epoch": 0.21, "learning_rate": 1.8370571014772292e-05, "loss": 22.8118, "step": 19310 }, { "epoch": 0.21, "learning_rate": 1.836865485485525e-05, "loss": 21.536, "step": 19320 }, { "epoch": 0.21, "learning_rate": 1.836673766898285e-05, "loss": 22.5678, "step": 19330 }, { "epoch": 0.21, "learning_rate": 1.836481945739013e-05, "loss": 21.8115, "step": 19340 }, { "epoch": 0.21, "learning_rate": 1.8362900220312253e-05, "loss": 22.1342, "step": 19350 }, { "epoch": 0.21, "learning_rate": 1.8360979957984507e-05, "loss": 21.8506, "step": 19360 }, { "epoch": 0.21, "learning_rate": 1.835905867064231e-05, "loss": 21.8527, "step": 19370 }, { "epoch": 0.21, "learning_rate": 1.83571363585212e-05, "loss": 21.7796, "step": 19380 }, { "epoch": 0.21, "learning_rate": 1.835521302185684e-05, "loss": 21.7988, "step": 19390 }, { "epoch": 0.21, "learning_rate": 1.8353288660885026e-05, "loss": 21.2173, "step": 19400 }, { "epoch": 0.21, "learning_rate": 1.835136327584167e-05, "loss": 21.169, "step": 19410 }, { "epoch": 0.21, "learning_rate": 1.8349436866962822e-05, "loss": 22.2808, "step": 19420 }, { "epoch": 0.21, "learning_rate": 1.8347509434484644e-05, "loss": 21.6324, "step": 19430 }, { "epoch": 0.21, "learning_rate": 1.834558097864343e-05, "loss": 21.8889, "step": 19440 }, { "epoch": 0.21, "learning_rate": 1.8343651499675603e-05, "loss": 21.7869, "step": 19450 }, { "epoch": 0.21, "learning_rate": 1.8341720997817703e-05, "loss": 20.8595, "step": 19460 }, { "epoch": 0.21, "learning_rate": 1.8339789473306405e-05, "loss": 22.4213, "step": 19470 }, { "epoch": 0.21, "learning_rate": 1.8337856926378497e-05, "loss": 21.8877, "step": 19480 }, { "epoch": 0.21, "learning_rate": 1.8335923357270906e-05, "loss": 21.9243, "step": 19490 }, { "epoch": 0.21, "learning_rate": 1.8333988766220676e-05, "loss": 22.3058, "step": 19500 }, { "epoch": 0.21, "learning_rate": 1.833205315346498e-05, "loss": 22.0218, "step": 19510 }, { "epoch": 0.21, "learning_rate": 1.8330116519241107e-05, "loss": 20.779, "step": 19520 }, { "epoch": 0.21, "learning_rate": 1.8328178863786488e-05, "loss": 21.5688, "step": 19530 }, { "epoch": 0.21, "learning_rate": 1.8326240187338667e-05, "loss": 21.2469, "step": 19540 }, { "epoch": 0.21, "learning_rate": 1.832430049013531e-05, "loss": 21.1244, "step": 19550 }, { "epoch": 0.21, "learning_rate": 1.8322359772414227e-05, "loss": 21.6571, "step": 19560 }, { "epoch": 0.21, "learning_rate": 1.832041803441333e-05, "loss": 21.7383, "step": 19570 }, { "epoch": 0.21, "learning_rate": 1.8318475276370665e-05, "loss": 21.5358, "step": 19580 }, { "epoch": 0.21, "learning_rate": 1.831653149852441e-05, "loss": 22.7346, "step": 19590 }, { "epoch": 0.21, "learning_rate": 1.8314586701112864e-05, "loss": 22.4887, "step": 19600 }, { "epoch": 0.21, "learning_rate": 1.8312640884374446e-05, "loss": 21.7856, "step": 19610 }, { "epoch": 0.21, "learning_rate": 1.83106940485477e-05, "loss": 21.7336, "step": 19620 }, { "epoch": 0.21, "learning_rate": 1.830874619387131e-05, "loss": 21.558, "step": 19630 }, { "epoch": 0.21, "learning_rate": 1.8306797320584055e-05, "loss": 21.9189, "step": 19640 }, { "epoch": 0.21, "learning_rate": 1.8304847428924874e-05, "loss": 21.6126, "step": 19650 }, { "epoch": 0.21, "learning_rate": 1.8302896519132808e-05, "loss": 22.421, "step": 19660 }, { "epoch": 0.21, "learning_rate": 1.8300944591447027e-05, "loss": 22.3777, "step": 19670 }, { "epoch": 0.21, "learning_rate": 1.829899164610683e-05, "loss": 22.2355, "step": 19680 }, { "epoch": 0.21, "learning_rate": 1.8297037683351635e-05, "loss": 21.7929, "step": 19690 }, { "epoch": 0.21, "learning_rate": 1.8295082703420992e-05, "loss": 22.1154, "step": 19700 }, { "epoch": 0.21, "learning_rate": 1.8293126706554573e-05, "loss": 22.3322, "step": 19710 }, { "epoch": 0.21, "learning_rate": 1.8291169692992166e-05, "loss": 21.2101, "step": 19720 }, { "epoch": 0.21, "learning_rate": 1.8289211662973702e-05, "loss": 21.7739, "step": 19730 }, { "epoch": 0.21, "learning_rate": 1.8287252616739213e-05, "loss": 21.8652, "step": 19740 }, { "epoch": 0.21, "learning_rate": 1.828529255452888e-05, "loss": 22.051, "step": 19750 }, { "epoch": 0.21, "learning_rate": 1.828333147658299e-05, "loss": 21.3937, "step": 19760 }, { "epoch": 0.21, "learning_rate": 1.828136938314196e-05, "loss": 21.7402, "step": 19770 }, { "epoch": 0.21, "learning_rate": 1.827940627444634e-05, "loss": 21.5223, "step": 19780 }, { "epoch": 0.21, "learning_rate": 1.827744215073679e-05, "loss": 21.89, "step": 19790 }, { "epoch": 0.21, "learning_rate": 1.827547701225411e-05, "loss": 21.905, "step": 19800 }, { "epoch": 0.21, "learning_rate": 1.8273510859239208e-05, "loss": 21.1557, "step": 19810 }, { "epoch": 0.21, "learning_rate": 1.8271543691933128e-05, "loss": 21.9119, "step": 19820 }, { "epoch": 0.21, "learning_rate": 1.8269575510577034e-05, "loss": 21.8132, "step": 19830 }, { "epoch": 0.21, "learning_rate": 1.8267606315412217e-05, "loss": 21.624, "step": 19840 }, { "epoch": 0.21, "learning_rate": 1.8265636106680088e-05, "loss": 21.7767, "step": 19850 }, { "epoch": 0.21, "learning_rate": 1.8263664884622187e-05, "loss": 21.1839, "step": 19860 }, { "epoch": 0.21, "learning_rate": 1.8261692649480174e-05, "loss": 22.0663, "step": 19870 }, { "epoch": 0.21, "learning_rate": 1.8259719401495842e-05, "loss": 21.4173, "step": 19880 }, { "epoch": 0.22, "learning_rate": 1.825774514091109e-05, "loss": 21.4056, "step": 19890 }, { "epoch": 0.22, "learning_rate": 1.8255769867967964e-05, "loss": 21.6585, "step": 19900 }, { "epoch": 0.22, "learning_rate": 1.8253793582908608e-05, "loss": 21.196, "step": 19910 }, { "epoch": 0.22, "learning_rate": 1.8251816285975322e-05, "loss": 21.8733, "step": 19920 }, { "epoch": 0.22, "learning_rate": 1.8249837977410502e-05, "loss": 22.3175, "step": 19930 }, { "epoch": 0.22, "learning_rate": 1.824785865745668e-05, "loss": 21.1525, "step": 19940 }, { "epoch": 0.22, "learning_rate": 1.8245878326356513e-05, "loss": 21.3311, "step": 19950 }, { "epoch": 0.22, "learning_rate": 1.824389698435278e-05, "loss": 21.9804, "step": 19960 }, { "epoch": 0.22, "learning_rate": 1.8241914631688377e-05, "loss": 22.1929, "step": 19970 }, { "epoch": 0.22, "learning_rate": 1.8239931268606338e-05, "loss": 21.373, "step": 19980 }, { "epoch": 0.22, "learning_rate": 1.8237946895349813e-05, "loss": 20.9384, "step": 19990 }, { "epoch": 0.22, "learning_rate": 1.8235961512162076e-05, "loss": 22.11, "step": 20000 }, { "epoch": 0.22, "learning_rate": 1.823397511928652e-05, "loss": 22.6081, "step": 20010 }, { "epoch": 0.22, "learning_rate": 1.8231987716966673e-05, "loss": 20.9061, "step": 20020 }, { "epoch": 0.22, "learning_rate": 1.8229999305446177e-05, "loss": 21.309, "step": 20030 }, { "epoch": 0.22, "learning_rate": 1.82280098849688e-05, "loss": 21.3108, "step": 20040 }, { "epoch": 0.22, "learning_rate": 1.8226019455778437e-05, "loss": 22.0505, "step": 20050 }, { "epoch": 0.22, "learning_rate": 1.8224028018119112e-05, "loss": 21.7283, "step": 20060 }, { "epoch": 0.22, "learning_rate": 1.8222035572234953e-05, "loss": 21.1579, "step": 20070 }, { "epoch": 0.22, "learning_rate": 1.8220042118370232e-05, "loss": 21.4204, "step": 20080 }, { "epoch": 0.22, "learning_rate": 1.821804765676933e-05, "loss": 21.3051, "step": 20090 }, { "epoch": 0.22, "learning_rate": 1.8216052187676763e-05, "loss": 21.7141, "step": 20100 }, { "epoch": 0.22, "learning_rate": 1.8214055711337167e-05, "loss": 21.563, "step": 20110 }, { "epoch": 0.22, "learning_rate": 1.82120582279953e-05, "loss": 21.7995, "step": 20120 }, { "epoch": 0.22, "learning_rate": 1.8210059737896033e-05, "loss": 21.0529, "step": 20130 }, { "epoch": 0.22, "learning_rate": 1.8208060241284386e-05, "loss": 22.1331, "step": 20140 }, { "epoch": 0.22, "learning_rate": 1.8206059738405478e-05, "loss": 20.7095, "step": 20150 }, { "epoch": 0.22, "learning_rate": 1.8204058229504562e-05, "loss": 21.7356, "step": 20160 }, { "epoch": 0.22, "learning_rate": 1.8202055714827015e-05, "loss": 21.0525, "step": 20170 }, { "epoch": 0.22, "learning_rate": 1.8200052194618333e-05, "loss": 21.7267, "step": 20180 }, { "epoch": 0.22, "learning_rate": 1.819804766912414e-05, "loss": 21.2891, "step": 20190 }, { "epoch": 0.22, "learning_rate": 1.8196042138590177e-05, "loss": 22.857, "step": 20200 }, { "epoch": 0.22, "learning_rate": 1.8194035603262318e-05, "loss": 21.5512, "step": 20210 }, { "epoch": 0.22, "learning_rate": 1.819202806338655e-05, "loss": 22.1794, "step": 20220 }, { "epoch": 0.22, "learning_rate": 1.8190019519208986e-05, "loss": 20.986, "step": 20230 }, { "epoch": 0.22, "learning_rate": 1.818800997097587e-05, "loss": 22.197, "step": 20240 }, { "epoch": 0.22, "learning_rate": 1.8185999418933557e-05, "loss": 21.9446, "step": 20250 }, { "epoch": 0.22, "learning_rate": 1.8183987863328535e-05, "loss": 21.6033, "step": 20260 }, { "epoch": 0.22, "learning_rate": 1.8181975304407403e-05, "loss": 21.4182, "step": 20270 }, { "epoch": 0.22, "learning_rate": 1.8179961742416896e-05, "loss": 20.7206, "step": 20280 }, { "epoch": 0.22, "learning_rate": 1.8177947177603865e-05, "loss": 21.6258, "step": 20290 }, { "epoch": 0.22, "learning_rate": 1.8175931610215293e-05, "loss": 21.2003, "step": 20300 }, { "epoch": 0.22, "learning_rate": 1.8173915040498268e-05, "loss": 21.0635, "step": 20310 }, { "epoch": 0.22, "learning_rate": 1.8171897468700013e-05, "loss": 22.0016, "step": 20320 }, { "epoch": 0.22, "learning_rate": 1.8169878895067877e-05, "loss": 21.9265, "step": 20330 }, { "epoch": 0.22, "learning_rate": 1.8167859319849325e-05, "loss": 22.2721, "step": 20340 }, { "epoch": 0.22, "learning_rate": 1.816583874329195e-05, "loss": 22.1148, "step": 20350 }, { "epoch": 0.22, "learning_rate": 1.8163817165643456e-05, "loss": 20.9705, "step": 20360 }, { "epoch": 0.22, "learning_rate": 1.8161794587151685e-05, "loss": 21.6832, "step": 20370 }, { "epoch": 0.22, "learning_rate": 1.8159771008064596e-05, "loss": 22.0997, "step": 20380 }, { "epoch": 0.22, "learning_rate": 1.815774642863027e-05, "loss": 22.4505, "step": 20390 }, { "epoch": 0.22, "learning_rate": 1.81557208490969e-05, "loss": 21.8077, "step": 20400 }, { "epoch": 0.22, "learning_rate": 1.8153694269712826e-05, "loss": 21.6668, "step": 20410 }, { "epoch": 0.22, "learning_rate": 1.815166669072649e-05, "loss": 21.2399, "step": 20420 }, { "epoch": 0.22, "learning_rate": 1.814963811238646e-05, "loss": 22.3113, "step": 20430 }, { "epoch": 0.22, "learning_rate": 1.8147608534941436e-05, "loss": 21.1981, "step": 20440 }, { "epoch": 0.22, "learning_rate": 1.814557795864023e-05, "loss": 22.0932, "step": 20450 }, { "epoch": 0.22, "learning_rate": 1.814354638373178e-05, "loss": 21.3614, "step": 20460 }, { "epoch": 0.22, "learning_rate": 1.8141513810465154e-05, "loss": 22.1359, "step": 20470 }, { "epoch": 0.22, "learning_rate": 1.8139480239089523e-05, "loss": 21.2738, "step": 20480 }, { "epoch": 0.22, "learning_rate": 1.8137445669854204e-05, "loss": 21.7235, "step": 20490 }, { "epoch": 0.22, "learning_rate": 1.813541010300862e-05, "loss": 21.097, "step": 20500 }, { "epoch": 0.22, "learning_rate": 1.8133373538802317e-05, "loss": 21.0448, "step": 20510 }, { "epoch": 0.22, "learning_rate": 1.8131335977484975e-05, "loss": 22.0357, "step": 20520 }, { "epoch": 0.22, "learning_rate": 1.8129297419306392e-05, "loss": 21.2972, "step": 20530 }, { "epoch": 0.22, "learning_rate": 1.8127257864516474e-05, "loss": 21.4916, "step": 20540 }, { "epoch": 0.22, "learning_rate": 1.8125217313365267e-05, "loss": 21.944, "step": 20550 }, { "epoch": 0.22, "learning_rate": 1.812317576610293e-05, "loss": 21.1459, "step": 20560 }, { "epoch": 0.22, "learning_rate": 1.812113322297975e-05, "loss": 21.8899, "step": 20570 }, { "epoch": 0.22, "learning_rate": 1.811908968424613e-05, "loss": 21.7643, "step": 20580 }, { "epoch": 0.22, "learning_rate": 1.8117045150152598e-05, "loss": 21.9649, "step": 20590 }, { "epoch": 0.22, "learning_rate": 1.8114999620949804e-05, "loss": 21.465, "step": 20600 }, { "epoch": 0.22, "learning_rate": 1.8112953096888517e-05, "loss": 21.7431, "step": 20610 }, { "epoch": 0.22, "learning_rate": 1.8110905578219635e-05, "loss": 22.3149, "step": 20620 }, { "epoch": 0.22, "learning_rate": 1.810885706519417e-05, "loss": 21.4374, "step": 20630 }, { "epoch": 0.22, "learning_rate": 1.8106807558063263e-05, "loss": 21.5602, "step": 20640 }, { "epoch": 0.22, "learning_rate": 1.8104757057078168e-05, "loss": 22.0299, "step": 20650 }, { "epoch": 0.22, "learning_rate": 1.8102705562490273e-05, "loss": 21.7292, "step": 20660 }, { "epoch": 0.22, "learning_rate": 1.8100653074551075e-05, "loss": 21.7089, "step": 20670 }, { "epoch": 0.22, "learning_rate": 1.8098599593512202e-05, "loss": 22.3298, "step": 20680 }, { "epoch": 0.22, "learning_rate": 1.80965451196254e-05, "loss": 21.3224, "step": 20690 }, { "epoch": 0.22, "learning_rate": 1.8094489653142536e-05, "loss": 21.6148, "step": 20700 }, { "epoch": 0.22, "learning_rate": 1.8092433194315606e-05, "loss": 21.2509, "step": 20710 }, { "epoch": 0.22, "learning_rate": 1.809037574339671e-05, "loss": 21.5712, "step": 20720 }, { "epoch": 0.22, "learning_rate": 1.8088317300638093e-05, "loss": 21.5252, "step": 20730 }, { "epoch": 0.22, "learning_rate": 1.8086257866292104e-05, "loss": 21.6085, "step": 20740 }, { "epoch": 0.22, "learning_rate": 1.808419744061122e-05, "loss": 21.7802, "step": 20750 }, { "epoch": 0.22, "learning_rate": 1.808213602384804e-05, "loss": 21.8969, "step": 20760 }, { "epoch": 0.22, "learning_rate": 1.808007361625528e-05, "loss": 21.153, "step": 20770 }, { "epoch": 0.22, "learning_rate": 1.8078010218085782e-05, "loss": 22.1726, "step": 20780 }, { "epoch": 0.22, "learning_rate": 1.8075945829592512e-05, "loss": 21.7555, "step": 20790 }, { "epoch": 0.22, "learning_rate": 1.807388045102855e-05, "loss": 20.9585, "step": 20800 }, { "epoch": 0.22, "learning_rate": 1.8071814082647106e-05, "loss": 22.6315, "step": 20810 }, { "epoch": 0.23, "learning_rate": 1.8069746724701498e-05, "loss": 21.7121, "step": 20820 }, { "epoch": 0.23, "learning_rate": 1.8067678377445182e-05, "loss": 21.7387, "step": 20830 }, { "epoch": 0.23, "learning_rate": 1.8065609041131723e-05, "loss": 21.1417, "step": 20840 }, { "epoch": 0.23, "learning_rate": 1.806353871601481e-05, "loss": 21.1915, "step": 20850 }, { "epoch": 0.23, "learning_rate": 1.806146740234826e-05, "loss": 21.8539, "step": 20860 }, { "epoch": 0.23, "learning_rate": 1.8059395100386003e-05, "loss": 21.2717, "step": 20870 }, { "epoch": 0.23, "learning_rate": 1.805732181038209e-05, "loss": 21.9004, "step": 20880 }, { "epoch": 0.23, "learning_rate": 1.8055247532590697e-05, "loss": 21.534, "step": 20890 }, { "epoch": 0.23, "learning_rate": 1.8053172267266124e-05, "loss": 21.2683, "step": 20900 }, { "epoch": 0.23, "learning_rate": 1.8051096014662787e-05, "loss": 21.5821, "step": 20910 }, { "epoch": 0.23, "learning_rate": 1.8049018775035217e-05, "loss": 21.7403, "step": 20920 }, { "epoch": 0.23, "learning_rate": 1.8046940548638084e-05, "loss": 22.4963, "step": 20930 }, { "epoch": 0.23, "learning_rate": 1.804486133572616e-05, "loss": 21.7873, "step": 20940 }, { "epoch": 0.23, "learning_rate": 1.804278113655435e-05, "loss": 21.3567, "step": 20950 }, { "epoch": 0.23, "learning_rate": 1.8040699951377678e-05, "loss": 21.404, "step": 20960 }, { "epoch": 0.23, "learning_rate": 1.8038617780451286e-05, "loss": 22.4775, "step": 20970 }, { "epoch": 0.23, "learning_rate": 1.8036534624030428e-05, "loss": 21.8512, "step": 20980 }, { "epoch": 0.23, "learning_rate": 1.8034450482370506e-05, "loss": 21.9339, "step": 20990 }, { "epoch": 0.23, "learning_rate": 1.8032365355727012e-05, "loss": 22.0268, "step": 21000 }, { "epoch": 0.23, "learning_rate": 1.8030279244355573e-05, "loss": 21.557, "step": 21010 }, { "epoch": 0.23, "learning_rate": 1.8028192148511943e-05, "loss": 21.3506, "step": 21020 }, { "epoch": 0.23, "learning_rate": 1.8026104068451983e-05, "loss": 21.2476, "step": 21030 }, { "epoch": 0.23, "learning_rate": 1.8024015004431686e-05, "loss": 21.6852, "step": 21040 }, { "epoch": 0.23, "learning_rate": 1.8021924956707156e-05, "loss": 21.4009, "step": 21050 }, { "epoch": 0.23, "learning_rate": 1.8019833925534626e-05, "loss": 21.6273, "step": 21060 }, { "epoch": 0.23, "learning_rate": 1.801774191117045e-05, "loss": 20.9928, "step": 21070 }, { "epoch": 0.23, "learning_rate": 1.8015648913871086e-05, "loss": 21.601, "step": 21080 }, { "epoch": 0.23, "learning_rate": 1.8013554933893137e-05, "loss": 21.7359, "step": 21090 }, { "epoch": 0.23, "learning_rate": 1.801145997149331e-05, "loss": 21.4176, "step": 21100 }, { "epoch": 0.23, "learning_rate": 1.8009364026928437e-05, "loss": 22.2756, "step": 21110 }, { "epoch": 0.23, "learning_rate": 1.8007267100455467e-05, "loss": 21.2547, "step": 21120 }, { "epoch": 0.23, "learning_rate": 1.800516919233148e-05, "loss": 22.2906, "step": 21130 }, { "epoch": 0.23, "learning_rate": 1.8003070302813664e-05, "loss": 22.1982, "step": 21140 }, { "epoch": 0.23, "learning_rate": 1.8000970432159334e-05, "loss": 21.5608, "step": 21150 }, { "epoch": 0.23, "learning_rate": 1.7998869580625923e-05, "loss": 22.0552, "step": 21160 }, { "epoch": 0.23, "learning_rate": 1.7996767748470984e-05, "loss": 22.1003, "step": 21170 }, { "epoch": 0.23, "learning_rate": 1.7994664935952193e-05, "loss": 21.4846, "step": 21180 }, { "epoch": 0.23, "learning_rate": 1.7992561143327344e-05, "loss": 21.9044, "step": 21190 }, { "epoch": 0.23, "learning_rate": 1.799045637085435e-05, "loss": 21.9961, "step": 21200 }, { "epoch": 0.23, "learning_rate": 1.798835061879125e-05, "loss": 21.2325, "step": 21210 }, { "epoch": 0.23, "learning_rate": 1.7986243887396193e-05, "loss": 21.7283, "step": 21220 }, { "epoch": 0.23, "learning_rate": 1.7984136176927457e-05, "loss": 21.6083, "step": 21230 }, { "epoch": 0.23, "learning_rate": 1.7982027487643436e-05, "loss": 21.2314, "step": 21240 }, { "epoch": 0.23, "learning_rate": 1.7979917819802644e-05, "loss": 21.4245, "step": 21250 }, { "epoch": 0.23, "learning_rate": 1.7977807173663718e-05, "loss": 21.0025, "step": 21260 }, { "epoch": 0.23, "learning_rate": 1.797569554948541e-05, "loss": 21.4826, "step": 21270 }, { "epoch": 0.23, "learning_rate": 1.7973582947526597e-05, "loss": 21.3207, "step": 21280 }, { "epoch": 0.23, "learning_rate": 1.797146936804627e-05, "loss": 22.0215, "step": 21290 }, { "epoch": 0.23, "learning_rate": 1.7969354811303548e-05, "loss": 22.2049, "step": 21300 }, { "epoch": 0.23, "learning_rate": 1.7967239277557663e-05, "loss": 21.8063, "step": 21310 }, { "epoch": 0.23, "learning_rate": 1.7965122767067967e-05, "loss": 21.1534, "step": 21320 }, { "epoch": 0.23, "learning_rate": 1.7963005280093935e-05, "loss": 22.6042, "step": 21330 }, { "epoch": 0.23, "learning_rate": 1.7960886816895164e-05, "loss": 21.522, "step": 21340 }, { "epoch": 0.23, "learning_rate": 1.795876737773136e-05, "loss": 21.0701, "step": 21350 }, { "epoch": 0.23, "learning_rate": 1.7956646962862358e-05, "loss": 21.5028, "step": 21360 }, { "epoch": 0.23, "learning_rate": 1.7954525572548117e-05, "loss": 21.5701, "step": 21370 }, { "epoch": 0.23, "learning_rate": 1.7952403207048702e-05, "loss": 21.7463, "step": 21380 }, { "epoch": 0.23, "learning_rate": 1.7950279866624303e-05, "loss": 21.5701, "step": 21390 }, { "epoch": 0.23, "learning_rate": 1.7948155551535236e-05, "loss": 21.214, "step": 21400 }, { "epoch": 0.23, "learning_rate": 1.7946030262041927e-05, "loss": 22.0273, "step": 21410 }, { "epoch": 0.23, "learning_rate": 1.794390399840493e-05, "loss": 21.6136, "step": 21420 }, { "epoch": 0.23, "learning_rate": 1.7941776760884912e-05, "loss": 21.7155, "step": 21430 }, { "epoch": 0.23, "learning_rate": 1.7939648549742663e-05, "loss": 22.1531, "step": 21440 }, { "epoch": 0.23, "learning_rate": 1.793751936523909e-05, "loss": 21.0458, "step": 21450 }, { "epoch": 0.23, "learning_rate": 1.793538920763522e-05, "loss": 21.5092, "step": 21460 }, { "epoch": 0.23, "learning_rate": 1.79332580771922e-05, "loss": 22.6221, "step": 21470 }, { "epoch": 0.23, "learning_rate": 1.79311259741713e-05, "loss": 22.0036, "step": 21480 }, { "epoch": 0.23, "learning_rate": 1.7928992898833896e-05, "loss": 22.0814, "step": 21490 }, { "epoch": 0.23, "learning_rate": 1.79268588514415e-05, "loss": 21.6162, "step": 21500 }, { "epoch": 0.23, "learning_rate": 1.7924723832255737e-05, "loss": 21.0786, "step": 21510 }, { "epoch": 0.23, "learning_rate": 1.7922587841538344e-05, "loss": 21.1781, "step": 21520 }, { "epoch": 0.23, "learning_rate": 1.7920450879551185e-05, "loss": 21.7732, "step": 21530 }, { "epoch": 0.23, "learning_rate": 1.791831294655624e-05, "loss": 21.4481, "step": 21540 }, { "epoch": 0.23, "learning_rate": 1.791617404281561e-05, "loss": 22.0619, "step": 21550 }, { "epoch": 0.23, "learning_rate": 1.7914034168591515e-05, "loss": 21.3876, "step": 21560 }, { "epoch": 0.23, "learning_rate": 1.791189332414629e-05, "loss": 21.3077, "step": 21570 }, { "epoch": 0.23, "learning_rate": 1.7909751509742393e-05, "loss": 21.1945, "step": 21580 }, { "epoch": 0.23, "learning_rate": 1.7907608725642406e-05, "loss": 21.4873, "step": 21590 }, { "epoch": 0.23, "learning_rate": 1.7905464972109012e-05, "loss": 22.2787, "step": 21600 }, { "epoch": 0.23, "learning_rate": 1.7903320249405033e-05, "loss": 20.9238, "step": 21610 }, { "epoch": 0.23, "learning_rate": 1.7901174557793398e-05, "loss": 21.5676, "step": 21620 }, { "epoch": 0.23, "learning_rate": 1.789902789753716e-05, "loss": 20.9677, "step": 21630 }, { "epoch": 0.23, "learning_rate": 1.7896880268899486e-05, "loss": 21.5771, "step": 21640 }, { "epoch": 0.23, "learning_rate": 1.7894731672143667e-05, "loss": 21.4699, "step": 21650 }, { "epoch": 0.23, "learning_rate": 1.789258210753311e-05, "loss": 20.8446, "step": 21660 }, { "epoch": 0.23, "learning_rate": 1.789043157533134e-05, "loss": 21.9269, "step": 21670 }, { "epoch": 0.23, "learning_rate": 1.7888280075802e-05, "loss": 21.1752, "step": 21680 }, { "epoch": 0.23, "learning_rate": 1.788612760920886e-05, "loss": 22.2112, "step": 21690 }, { "epoch": 0.23, "learning_rate": 1.7883974175815792e-05, "loss": 22.0993, "step": 21700 }, { "epoch": 0.23, "learning_rate": 1.7881819775886802e-05, "loss": 21.0229, "step": 21710 }, { "epoch": 0.23, "learning_rate": 1.7879664409686007e-05, "loss": 22.7043, "step": 21720 }, { "epoch": 0.23, "learning_rate": 1.7877508077477648e-05, "loss": 22.028, "step": 21730 }, { "epoch": 0.24, "learning_rate": 1.7875350779526076e-05, "loss": 21.7317, "step": 21740 }, { "epoch": 0.24, "learning_rate": 1.7873192516095767e-05, "loss": 21.115, "step": 21750 }, { "epoch": 0.24, "learning_rate": 1.787103328745131e-05, "loss": 21.377, "step": 21760 }, { "epoch": 0.24, "learning_rate": 1.786887309385742e-05, "loss": 21.2011, "step": 21770 }, { "epoch": 0.24, "learning_rate": 1.7866711935578922e-05, "loss": 22.0049, "step": 21780 }, { "epoch": 0.24, "learning_rate": 1.786454981288077e-05, "loss": 20.8477, "step": 21790 }, { "epoch": 0.24, "learning_rate": 1.786238672602802e-05, "loss": 21.9221, "step": 21800 }, { "epoch": 0.24, "learning_rate": 1.7860222675285866e-05, "loss": 21.4691, "step": 21810 }, { "epoch": 0.24, "learning_rate": 1.7858057660919602e-05, "loss": 21.976, "step": 21820 }, { "epoch": 0.24, "learning_rate": 1.785589168319465e-05, "loss": 21.1064, "step": 21830 }, { "epoch": 0.24, "learning_rate": 1.785372474237655e-05, "loss": 21.5475, "step": 21840 }, { "epoch": 0.24, "learning_rate": 1.7851556838730954e-05, "loss": 21.5546, "step": 21850 }, { "epoch": 0.24, "learning_rate": 1.784938797252364e-05, "loss": 22.0427, "step": 21860 }, { "epoch": 0.24, "learning_rate": 1.7847218144020497e-05, "loss": 21.2559, "step": 21870 }, { "epoch": 0.24, "learning_rate": 1.784504735348754e-05, "loss": 21.5534, "step": 21880 }, { "epoch": 0.24, "learning_rate": 1.7842875601190894e-05, "loss": 21.677, "step": 21890 }, { "epoch": 0.24, "learning_rate": 1.7840702887396807e-05, "loss": 21.4291, "step": 21900 }, { "epoch": 0.24, "learning_rate": 1.7838529212371636e-05, "loss": 21.8626, "step": 21910 }, { "epoch": 0.24, "learning_rate": 1.7836354576381873e-05, "loss": 21.2049, "step": 21920 }, { "epoch": 0.24, "learning_rate": 1.783417897969411e-05, "loss": 21.5891, "step": 21930 }, { "epoch": 0.24, "learning_rate": 1.7832002422575064e-05, "loss": 22.0219, "step": 21940 }, { "epoch": 0.24, "learning_rate": 1.7829824905291578e-05, "loss": 21.0075, "step": 21950 }, { "epoch": 0.24, "learning_rate": 1.7827646428110595e-05, "loss": 21.8078, "step": 21960 }, { "epoch": 0.24, "learning_rate": 1.7825466991299193e-05, "loss": 20.5559, "step": 21970 }, { "epoch": 0.24, "learning_rate": 1.7823286595124557e-05, "loss": 21.4999, "step": 21980 }, { "epoch": 0.24, "learning_rate": 1.782110523985399e-05, "loss": 21.5198, "step": 21990 }, { "epoch": 0.24, "learning_rate": 1.781892292575492e-05, "loss": 21.7802, "step": 22000 }, { "epoch": 0.24, "learning_rate": 1.7816739653094886e-05, "loss": 21.5376, "step": 22010 }, { "epoch": 0.24, "learning_rate": 1.7814555422141547e-05, "loss": 21.2552, "step": 22020 }, { "epoch": 0.24, "learning_rate": 1.781237023316268e-05, "loss": 21.5347, "step": 22030 }, { "epoch": 0.24, "learning_rate": 1.781018408642617e-05, "loss": 21.4141, "step": 22040 }, { "epoch": 0.24, "learning_rate": 1.7807996982200038e-05, "loss": 21.234, "step": 22050 }, { "epoch": 0.24, "learning_rate": 1.7805808920752407e-05, "loss": 21.397, "step": 22060 }, { "epoch": 0.24, "learning_rate": 1.7803619902351523e-05, "loss": 21.3981, "step": 22070 }, { "epoch": 0.24, "learning_rate": 1.780142992726575e-05, "loss": 21.7781, "step": 22080 }, { "epoch": 0.24, "learning_rate": 1.779923899576357e-05, "loss": 21.8246, "step": 22090 }, { "epoch": 0.24, "learning_rate": 1.7797047108113572e-05, "loss": 21.0564, "step": 22100 }, { "epoch": 0.24, "learning_rate": 1.779485426458448e-05, "loss": 21.3697, "step": 22110 }, { "epoch": 0.24, "learning_rate": 1.779266046544512e-05, "loss": 21.3436, "step": 22120 }, { "epoch": 0.24, "learning_rate": 1.7790465710964442e-05, "loss": 21.3561, "step": 22130 }, { "epoch": 0.24, "learning_rate": 1.7788270001411514e-05, "loss": 21.424, "step": 22140 }, { "epoch": 0.24, "learning_rate": 1.7786073337055516e-05, "loss": 22.5095, "step": 22150 }, { "epoch": 0.24, "learning_rate": 1.778387571816575e-05, "loss": 21.0688, "step": 22160 }, { "epoch": 0.24, "learning_rate": 1.7781677145011634e-05, "loss": 21.7452, "step": 22170 }, { "epoch": 0.24, "learning_rate": 1.77794776178627e-05, "loss": 21.0943, "step": 22180 }, { "epoch": 0.24, "learning_rate": 1.77772771369886e-05, "loss": 21.8656, "step": 22190 }, { "epoch": 0.24, "learning_rate": 1.7775075702659102e-05, "loss": 21.6289, "step": 22200 }, { "epoch": 0.24, "learning_rate": 1.7772873315144093e-05, "loss": 21.0988, "step": 22210 }, { "epoch": 0.24, "learning_rate": 1.7770669974713566e-05, "loss": 21.6201, "step": 22220 }, { "epoch": 0.24, "learning_rate": 1.776846568163765e-05, "loss": 21.8834, "step": 22230 }, { "epoch": 0.24, "learning_rate": 1.776626043618658e-05, "loss": 22.0219, "step": 22240 }, { "epoch": 0.24, "learning_rate": 1.77640542386307e-05, "loss": 21.7179, "step": 22250 }, { "epoch": 0.24, "learning_rate": 1.7761847089240483e-05, "loss": 21.61, "step": 22260 }, { "epoch": 0.24, "learning_rate": 1.7759638988286515e-05, "loss": 21.7125, "step": 22270 }, { "epoch": 0.24, "learning_rate": 1.77574299360395e-05, "loss": 21.1931, "step": 22280 }, { "epoch": 0.24, "learning_rate": 1.7755219932770257e-05, "loss": 21.0956, "step": 22290 }, { "epoch": 0.24, "learning_rate": 1.7753008978749714e-05, "loss": 22.0826, "step": 22300 }, { "epoch": 0.24, "learning_rate": 1.7750797074248927e-05, "loss": 21.5841, "step": 22310 }, { "epoch": 0.24, "learning_rate": 1.7748584219539072e-05, "loss": 21.5386, "step": 22320 }, { "epoch": 0.24, "learning_rate": 1.7746370414891423e-05, "loss": 22.1456, "step": 22330 }, { "epoch": 0.24, "learning_rate": 1.774415566057739e-05, "loss": 21.281, "step": 22340 }, { "epoch": 0.24, "learning_rate": 1.7741939956868482e-05, "loss": 22.2039, "step": 22350 }, { "epoch": 0.24, "learning_rate": 1.773972330403634e-05, "loss": 21.6081, "step": 22360 }, { "epoch": 0.24, "learning_rate": 1.7737505702352714e-05, "loss": 20.8147, "step": 22370 }, { "epoch": 0.24, "learning_rate": 1.7735287152089466e-05, "loss": 22.2144, "step": 22380 }, { "epoch": 0.24, "learning_rate": 1.773306765351858e-05, "loss": 21.1047, "step": 22390 }, { "epoch": 0.24, "learning_rate": 1.7730847206912166e-05, "loss": 21.6965, "step": 22400 }, { "epoch": 0.24, "learning_rate": 1.772862581254243e-05, "loss": 21.377, "step": 22410 }, { "epoch": 0.24, "learning_rate": 1.7726403470681703e-05, "loss": 21.4453, "step": 22420 }, { "epoch": 0.24, "learning_rate": 1.7724180181602438e-05, "loss": 21.0477, "step": 22430 }, { "epoch": 0.24, "learning_rate": 1.7721955945577195e-05, "loss": 20.984, "step": 22440 }, { "epoch": 0.24, "learning_rate": 1.7719730762878656e-05, "loss": 21.888, "step": 22450 }, { "epoch": 0.24, "learning_rate": 1.7717504633779618e-05, "loss": 20.7077, "step": 22460 }, { "epoch": 0.24, "learning_rate": 1.7715277558552994e-05, "loss": 21.4893, "step": 22470 }, { "epoch": 0.24, "learning_rate": 1.771304953747181e-05, "loss": 21.7752, "step": 22480 }, { "epoch": 0.24, "learning_rate": 1.771082057080921e-05, "loss": 20.959, "step": 22490 }, { "epoch": 0.24, "learning_rate": 1.7708590658838457e-05, "loss": 21.726, "step": 22500 }, { "epoch": 0.24, "learning_rate": 1.7706359801832923e-05, "loss": 22.1728, "step": 22510 }, { "epoch": 0.24, "learning_rate": 1.7704128000066108e-05, "loss": 20.662, "step": 22520 }, { "epoch": 0.24, "learning_rate": 1.770189525381161e-05, "loss": 20.8579, "step": 22530 }, { "epoch": 0.24, "learning_rate": 1.769966156334316e-05, "loss": 22.0799, "step": 22540 }, { "epoch": 0.24, "learning_rate": 1.769742692893459e-05, "loss": 21.5057, "step": 22550 }, { "epoch": 0.24, "learning_rate": 1.7695191350859863e-05, "loss": 21.6543, "step": 22560 }, { "epoch": 0.24, "learning_rate": 1.7692954829393045e-05, "loss": 21.1789, "step": 22570 }, { "epoch": 0.24, "learning_rate": 1.769071736480832e-05, "loss": 21.4407, "step": 22580 }, { "epoch": 0.24, "learning_rate": 1.768847895738e-05, "loss": 21.3714, "step": 22590 }, { "epoch": 0.24, "learning_rate": 1.7686239607382495e-05, "loss": 21.612, "step": 22600 }, { "epoch": 0.24, "learning_rate": 1.7683999315090333e-05, "loss": 22.2312, "step": 22610 }, { "epoch": 0.24, "learning_rate": 1.7681758080778174e-05, "loss": 21.3731, "step": 22620 }, { "epoch": 0.24, "learning_rate": 1.7679515904720773e-05, "loss": 21.7629, "step": 22630 }, { "epoch": 0.24, "learning_rate": 1.7677272787193018e-05, "loss": 21.9498, "step": 22640 }, { "epoch": 0.24, "learning_rate": 1.7675028728469896e-05, "loss": 21.2597, "step": 22650 }, { "epoch": 0.24, "learning_rate": 1.7672783728826523e-05, "loss": 22.3854, "step": 22660 }, { "epoch": 0.25, "learning_rate": 1.767053778853812e-05, "loss": 21.5681, "step": 22670 }, { "epoch": 0.25, "learning_rate": 1.7668290907880034e-05, "loss": 22.2146, "step": 22680 }, { "epoch": 0.25, "learning_rate": 1.7666043087127714e-05, "loss": 21.6742, "step": 22690 }, { "epoch": 0.25, "learning_rate": 1.7663794326556743e-05, "loss": 21.4089, "step": 22700 }, { "epoch": 0.25, "learning_rate": 1.7661544626442793e-05, "loss": 21.852, "step": 22710 }, { "epoch": 0.25, "learning_rate": 1.765929398706168e-05, "loss": 21.7753, "step": 22720 }, { "epoch": 0.25, "learning_rate": 1.765704240868931e-05, "loss": 21.4945, "step": 22730 }, { "epoch": 0.25, "learning_rate": 1.765478989160172e-05, "loss": 21.0926, "step": 22740 }, { "epoch": 0.25, "learning_rate": 1.765253643607506e-05, "loss": 21.7811, "step": 22750 }, { "epoch": 0.25, "learning_rate": 1.765028204238559e-05, "loss": 22.1643, "step": 22760 }, { "epoch": 0.25, "learning_rate": 1.7648026710809686e-05, "loss": 21.1389, "step": 22770 }, { "epoch": 0.25, "learning_rate": 1.764577044162384e-05, "loss": 21.8676, "step": 22780 }, { "epoch": 0.25, "learning_rate": 1.7643513235104664e-05, "loss": 21.428, "step": 22790 }, { "epoch": 0.25, "learning_rate": 1.7641255091528876e-05, "loss": 21.5116, "step": 22800 }, { "epoch": 0.25, "learning_rate": 1.7638996011173314e-05, "loss": 21.933, "step": 22810 }, { "epoch": 0.25, "learning_rate": 1.7636735994314934e-05, "loss": 20.8952, "step": 22820 }, { "epoch": 0.25, "learning_rate": 1.7634475041230796e-05, "loss": 21.2881, "step": 22830 }, { "epoch": 0.25, "learning_rate": 1.7632213152198084e-05, "loss": 21.404, "step": 22840 }, { "epoch": 0.25, "learning_rate": 1.7629950327494097e-05, "loss": 21.7082, "step": 22850 }, { "epoch": 0.25, "learning_rate": 1.7627686567396244e-05, "loss": 21.3378, "step": 22860 }, { "epoch": 0.25, "learning_rate": 1.762542187218205e-05, "loss": 21.7324, "step": 22870 }, { "epoch": 0.25, "learning_rate": 1.7623156242129153e-05, "loss": 21.5438, "step": 22880 }, { "epoch": 0.25, "learning_rate": 1.7620889677515314e-05, "loss": 21.3822, "step": 22890 }, { "epoch": 0.25, "learning_rate": 1.76186221786184e-05, "loss": 21.3926, "step": 22900 }, { "epoch": 0.25, "learning_rate": 1.7616353745716397e-05, "loss": 21.4683, "step": 22910 }, { "epoch": 0.25, "learning_rate": 1.76140843790874e-05, "loss": 21.9233, "step": 22920 }, { "epoch": 0.25, "learning_rate": 1.7611814079009622e-05, "loss": 21.5051, "step": 22930 }, { "epoch": 0.25, "learning_rate": 1.760954284576139e-05, "loss": 21.2159, "step": 22940 }, { "epoch": 0.25, "learning_rate": 1.7607270679621152e-05, "loss": 20.6196, "step": 22950 }, { "epoch": 0.25, "learning_rate": 1.7604997580867457e-05, "loss": 21.3949, "step": 22960 }, { "epoch": 0.25, "learning_rate": 1.760272354977898e-05, "loss": 21.6643, "step": 22970 }, { "epoch": 0.25, "learning_rate": 1.76004485866345e-05, "loss": 22.3044, "step": 22980 }, { "epoch": 0.25, "learning_rate": 1.7598172691712926e-05, "loss": 21.6318, "step": 22990 }, { "epoch": 0.25, "learning_rate": 1.7595895865293265e-05, "loss": 21.9385, "step": 23000 }, { "epoch": 0.25, "learning_rate": 1.7593618107654645e-05, "loss": 21.623, "step": 23010 }, { "epoch": 0.25, "learning_rate": 1.7591339419076305e-05, "loss": 21.5741, "step": 23020 }, { "epoch": 0.25, "learning_rate": 1.7589059799837608e-05, "loss": 21.7168, "step": 23030 }, { "epoch": 0.25, "learning_rate": 1.7586779250218017e-05, "loss": 22.3656, "step": 23040 }, { "epoch": 0.25, "learning_rate": 1.758449777049712e-05, "loss": 22.1238, "step": 23050 }, { "epoch": 0.25, "learning_rate": 1.7582215360954614e-05, "loss": 21.563, "step": 23060 }, { "epoch": 0.25, "learning_rate": 1.757993202187031e-05, "loss": 21.7209, "step": 23070 }, { "epoch": 0.25, "learning_rate": 1.757764775352414e-05, "loss": 21.7332, "step": 23080 }, { "epoch": 0.25, "learning_rate": 1.7575362556196132e-05, "loss": 21.503, "step": 23090 }, { "epoch": 0.25, "learning_rate": 1.757307643016645e-05, "loss": 21.0841, "step": 23100 }, { "epoch": 0.25, "learning_rate": 1.757078937571536e-05, "loss": 22.0048, "step": 23110 }, { "epoch": 0.25, "learning_rate": 1.7568501393123236e-05, "loss": 20.9448, "step": 23120 }, { "epoch": 0.25, "learning_rate": 1.7566212482670586e-05, "loss": 21.8141, "step": 23130 }, { "epoch": 0.25, "learning_rate": 1.756392264463801e-05, "loss": 21.2707, "step": 23140 }, { "epoch": 0.25, "learning_rate": 1.756163187930623e-05, "loss": 21.9392, "step": 23150 }, { "epoch": 0.25, "learning_rate": 1.7559340186956088e-05, "loss": 21.6249, "step": 23160 }, { "epoch": 0.25, "learning_rate": 1.755704756786853e-05, "loss": 21.391, "step": 23170 }, { "epoch": 0.25, "learning_rate": 1.755475402232462e-05, "loss": 21.6924, "step": 23180 }, { "epoch": 0.25, "learning_rate": 1.7552459550605537e-05, "loss": 21.6932, "step": 23190 }, { "epoch": 0.25, "learning_rate": 1.7550164152992573e-05, "loss": 21.2801, "step": 23200 }, { "epoch": 0.25, "learning_rate": 1.754786782976713e-05, "loss": 22.1497, "step": 23210 }, { "epoch": 0.25, "learning_rate": 1.7545570581210723e-05, "loss": 20.5554, "step": 23220 }, { "epoch": 0.25, "learning_rate": 1.754327240760499e-05, "loss": 21.9504, "step": 23230 }, { "epoch": 0.25, "learning_rate": 1.754097330923167e-05, "loss": 20.7955, "step": 23240 }, { "epoch": 0.25, "learning_rate": 1.7538673286372625e-05, "loss": 21.047, "step": 23250 }, { "epoch": 0.25, "learning_rate": 1.7536372339309822e-05, "loss": 20.8701, "step": 23260 }, { "epoch": 0.25, "learning_rate": 1.7534070468325347e-05, "loss": 21.1703, "step": 23270 }, { "epoch": 0.25, "learning_rate": 1.75317676737014e-05, "loss": 21.4372, "step": 23280 }, { "epoch": 0.25, "learning_rate": 1.7529463955720293e-05, "loss": 21.412, "step": 23290 }, { "epoch": 0.25, "learning_rate": 1.7527159314664447e-05, "loss": 21.3551, "step": 23300 }, { "epoch": 0.25, "learning_rate": 1.7524853750816398e-05, "loss": 21.5055, "step": 23310 }, { "epoch": 0.25, "learning_rate": 1.7522547264458803e-05, "loss": 21.9317, "step": 23320 }, { "epoch": 0.25, "learning_rate": 1.7520239855874418e-05, "loss": 21.4384, "step": 23330 }, { "epoch": 0.25, "learning_rate": 1.751793152534613e-05, "loss": 21.2036, "step": 23340 }, { "epoch": 0.25, "learning_rate": 1.7515622273156917e-05, "loss": 22.1698, "step": 23350 }, { "epoch": 0.25, "learning_rate": 1.751331209958989e-05, "loss": 21.5001, "step": 23360 }, { "epoch": 0.25, "learning_rate": 1.7511001004928263e-05, "loss": 21.6672, "step": 23370 }, { "epoch": 0.25, "learning_rate": 1.7508688989455365e-05, "loss": 20.7779, "step": 23380 }, { "epoch": 0.25, "learning_rate": 1.7506376053454633e-05, "loss": 21.8504, "step": 23390 }, { "epoch": 0.25, "learning_rate": 1.7504062197209626e-05, "loss": 21.5191, "step": 23400 }, { "epoch": 0.25, "learning_rate": 1.7501747421004012e-05, "loss": 21.9048, "step": 23410 }, { "epoch": 0.25, "learning_rate": 1.7499431725121567e-05, "loss": 22.0538, "step": 23420 }, { "epoch": 0.25, "learning_rate": 1.7497115109846187e-05, "loss": 22.04, "step": 23430 }, { "epoch": 0.25, "learning_rate": 1.7494797575461878e-05, "loss": 21.2228, "step": 23440 }, { "epoch": 0.25, "learning_rate": 1.7492479122252755e-05, "loss": 22.0033, "step": 23450 }, { "epoch": 0.25, "learning_rate": 1.7490159750503052e-05, "loss": 21.2076, "step": 23460 }, { "epoch": 0.25, "learning_rate": 1.7487839460497108e-05, "loss": 21.225, "step": 23470 }, { "epoch": 0.25, "learning_rate": 1.7485518252519383e-05, "loss": 21.9976, "step": 23480 }, { "epoch": 0.25, "learning_rate": 1.7483196126854444e-05, "loss": 21.6504, "step": 23490 }, { "epoch": 0.25, "learning_rate": 1.7480873083786975e-05, "loss": 21.592, "step": 23500 }, { "epoch": 0.25, "learning_rate": 1.747854912360176e-05, "loss": 21.7252, "step": 23510 }, { "epoch": 0.25, "learning_rate": 1.7476224246583718e-05, "loss": 22.3497, "step": 23520 }, { "epoch": 0.25, "learning_rate": 1.7473898453017862e-05, "loss": 21.8164, "step": 23530 }, { "epoch": 0.25, "learning_rate": 1.7471571743189318e-05, "loss": 21.9451, "step": 23540 }, { "epoch": 0.25, "learning_rate": 1.7469244117383336e-05, "loss": 21.4306, "step": 23550 }, { "epoch": 0.25, "learning_rate": 1.7466915575885268e-05, "loss": 21.4097, "step": 23560 }, { "epoch": 0.25, "learning_rate": 1.746458611898058e-05, "loss": 21.3248, "step": 23570 }, { "epoch": 0.25, "learning_rate": 1.7462255746954853e-05, "loss": 21.5465, "step": 23580 }, { "epoch": 0.26, "learning_rate": 1.7459924460093783e-05, "loss": 21.9436, "step": 23590 }, { "epoch": 0.26, "learning_rate": 1.7457592258683166e-05, "loss": 21.4147, "step": 23600 }, { "epoch": 0.26, "learning_rate": 1.7455259143008926e-05, "loss": 22.2693, "step": 23610 }, { "epoch": 0.26, "learning_rate": 1.7452925113357086e-05, "loss": 21.7592, "step": 23620 }, { "epoch": 0.26, "learning_rate": 1.745059017001379e-05, "loss": 21.4845, "step": 23630 }, { "epoch": 0.26, "learning_rate": 1.7448254313265294e-05, "loss": 21.397, "step": 23640 }, { "epoch": 0.26, "learning_rate": 1.7445917543397953e-05, "loss": 21.5583, "step": 23650 }, { "epoch": 0.26, "learning_rate": 1.7443579860698244e-05, "loss": 21.1453, "step": 23660 }, { "epoch": 0.26, "learning_rate": 1.7441241265452764e-05, "loss": 22.0984, "step": 23670 }, { "epoch": 0.26, "learning_rate": 1.743890175794821e-05, "loss": 20.8183, "step": 23680 }, { "epoch": 0.26, "learning_rate": 1.743656133847139e-05, "loss": 21.3774, "step": 23690 }, { "epoch": 0.26, "learning_rate": 1.7434220007309228e-05, "loss": 21.4597, "step": 23700 }, { "epoch": 0.26, "learning_rate": 1.7431877764748764e-05, "loss": 21.3877, "step": 23710 }, { "epoch": 0.26, "learning_rate": 1.742953461107714e-05, "loss": 21.617, "step": 23720 }, { "epoch": 0.26, "learning_rate": 1.7427190546581617e-05, "loss": 21.5197, "step": 23730 }, { "epoch": 0.26, "learning_rate": 1.7424845571549572e-05, "loss": 21.8885, "step": 23740 }, { "epoch": 0.26, "learning_rate": 1.7422499686268474e-05, "loss": 21.4717, "step": 23750 }, { "epoch": 0.26, "learning_rate": 1.742015289102593e-05, "loss": 21.7303, "step": 23760 }, { "epoch": 0.26, "learning_rate": 1.741780518610964e-05, "loss": 20.5447, "step": 23770 }, { "epoch": 0.26, "learning_rate": 1.7415456571807415e-05, "loss": 21.4554, "step": 23780 }, { "epoch": 0.26, "learning_rate": 1.7413107048407198e-05, "loss": 21.8641, "step": 23790 }, { "epoch": 0.26, "learning_rate": 1.741075661619701e-05, "loss": 21.1623, "step": 23800 }, { "epoch": 0.26, "learning_rate": 1.7408405275465016e-05, "loss": 22.2142, "step": 23810 }, { "epoch": 0.26, "learning_rate": 1.7406053026499477e-05, "loss": 21.2476, "step": 23820 }, { "epoch": 0.26, "learning_rate": 1.7403699869588765e-05, "loss": 22.2943, "step": 23830 }, { "epoch": 0.26, "learning_rate": 1.7401345805021362e-05, "loss": 22.0596, "step": 23840 }, { "epoch": 0.26, "learning_rate": 1.7398990833085872e-05, "loss": 21.5202, "step": 23850 }, { "epoch": 0.26, "learning_rate": 1.7396634954070995e-05, "loss": 22.0451, "step": 23860 }, { "epoch": 0.26, "learning_rate": 1.7394278168265555e-05, "loss": 22.0035, "step": 23870 }, { "epoch": 0.26, "learning_rate": 1.739192047595848e-05, "loss": 21.3556, "step": 23880 }, { "epoch": 0.26, "learning_rate": 1.738956187743881e-05, "loss": 21.4314, "step": 23890 }, { "epoch": 0.26, "learning_rate": 1.7387202372995702e-05, "loss": 21.7767, "step": 23900 }, { "epoch": 0.26, "learning_rate": 1.7384841962918417e-05, "loss": 21.0018, "step": 23910 }, { "epoch": 0.26, "learning_rate": 1.7382480647496332e-05, "loss": 22.0716, "step": 23920 }, { "epoch": 0.26, "learning_rate": 1.7380118427018927e-05, "loss": 22.2382, "step": 23930 }, { "epoch": 0.26, "learning_rate": 1.73777553017758e-05, "loss": 21.5717, "step": 23940 }, { "epoch": 0.26, "learning_rate": 1.7375391272056664e-05, "loss": 21.5745, "step": 23950 }, { "epoch": 0.26, "learning_rate": 1.737302633815133e-05, "loss": 21.6324, "step": 23960 }, { "epoch": 0.26, "learning_rate": 1.737066050034973e-05, "loss": 21.4904, "step": 23970 }, { "epoch": 0.26, "learning_rate": 1.7368293758941906e-05, "loss": 21.6112, "step": 23980 }, { "epoch": 0.26, "learning_rate": 1.7365926114218002e-05, "loss": 21.4619, "step": 23990 }, { "epoch": 0.26, "learning_rate": 1.736355756646829e-05, "loss": 21.7101, "step": 24000 }, { "epoch": 0.26, "learning_rate": 1.7361188115983133e-05, "loss": 21.0101, "step": 24010 }, { "epoch": 0.26, "learning_rate": 1.735881776305302e-05, "loss": 22.1505, "step": 24020 }, { "epoch": 0.26, "learning_rate": 1.735644650796854e-05, "loss": 22.0953, "step": 24030 }, { "epoch": 0.26, "learning_rate": 1.7354074351020397e-05, "loss": 21.4451, "step": 24040 }, { "epoch": 0.26, "learning_rate": 1.735170129249941e-05, "loss": 21.5804, "step": 24050 }, { "epoch": 0.26, "learning_rate": 1.73493273326965e-05, "loss": 21.2897, "step": 24060 }, { "epoch": 0.26, "learning_rate": 1.7346952471902706e-05, "loss": 21.4747, "step": 24070 }, { "epoch": 0.26, "learning_rate": 1.734457671040917e-05, "loss": 21.4398, "step": 24080 }, { "epoch": 0.26, "learning_rate": 1.7342200048507152e-05, "loss": 21.498, "step": 24090 }, { "epoch": 0.26, "learning_rate": 1.7339822486488016e-05, "loss": 20.6091, "step": 24100 }, { "epoch": 0.26, "learning_rate": 1.7337444024643243e-05, "loss": 21.472, "step": 24110 }, { "epoch": 0.26, "learning_rate": 1.7335064663264417e-05, "loss": 20.7629, "step": 24120 }, { "epoch": 0.26, "learning_rate": 1.7332684402643238e-05, "loss": 20.7067, "step": 24130 }, { "epoch": 0.26, "learning_rate": 1.733030324307151e-05, "loss": 21.1166, "step": 24140 }, { "epoch": 0.26, "learning_rate": 1.7327921184841157e-05, "loss": 21.9325, "step": 24150 }, { "epoch": 0.26, "learning_rate": 1.7325538228244208e-05, "loss": 21.4053, "step": 24160 }, { "epoch": 0.26, "learning_rate": 1.7323154373572793e-05, "loss": 22.0125, "step": 24170 }, { "epoch": 0.26, "learning_rate": 1.732076962111917e-05, "loss": 21.9184, "step": 24180 }, { "epoch": 0.26, "learning_rate": 1.7318383971175695e-05, "loss": 20.8219, "step": 24190 }, { "epoch": 0.26, "learning_rate": 1.7315997424034834e-05, "loss": 21.1999, "step": 24200 }, { "epoch": 0.26, "learning_rate": 1.7313609979989166e-05, "loss": 22.2116, "step": 24210 }, { "epoch": 0.26, "learning_rate": 1.7311221639331384e-05, "loss": 22.0405, "step": 24220 }, { "epoch": 0.26, "learning_rate": 1.7308832402354284e-05, "loss": 21.9855, "step": 24230 }, { "epoch": 0.26, "learning_rate": 1.7306442269350774e-05, "loss": 21.1288, "step": 24240 }, { "epoch": 0.26, "learning_rate": 1.7304051240613873e-05, "loss": 21.7341, "step": 24250 }, { "epoch": 0.26, "learning_rate": 1.7301659316436708e-05, "loss": 21.3834, "step": 24260 }, { "epoch": 0.26, "learning_rate": 1.729926649711252e-05, "loss": 21.4613, "step": 24270 }, { "epoch": 0.26, "learning_rate": 1.7296872782934654e-05, "loss": 21.3298, "step": 24280 }, { "epoch": 0.26, "learning_rate": 1.729447817419657e-05, "loss": 20.8071, "step": 24290 }, { "epoch": 0.26, "learning_rate": 1.7292082671191832e-05, "loss": 21.6675, "step": 24300 }, { "epoch": 0.26, "learning_rate": 1.7289686274214116e-05, "loss": 21.573, "step": 24310 }, { "epoch": 0.26, "learning_rate": 1.7287288983557213e-05, "loss": 21.1017, "step": 24320 }, { "epoch": 0.26, "learning_rate": 1.7284890799515016e-05, "loss": 20.9238, "step": 24330 }, { "epoch": 0.26, "learning_rate": 1.728249172238153e-05, "loss": 20.9489, "step": 24340 }, { "epoch": 0.26, "learning_rate": 1.7280091752450873e-05, "loss": 21.6623, "step": 24350 }, { "epoch": 0.26, "learning_rate": 1.7277690890017265e-05, "loss": 21.7645, "step": 24360 }, { "epoch": 0.26, "learning_rate": 1.727528913537504e-05, "loss": 21.6271, "step": 24370 }, { "epoch": 0.26, "learning_rate": 1.7272886488818645e-05, "loss": 21.618, "step": 24380 }, { "epoch": 0.26, "learning_rate": 1.727048295064263e-05, "loss": 21.4097, "step": 24390 }, { "epoch": 0.26, "learning_rate": 1.7268078521141657e-05, "loss": 21.4196, "step": 24400 }, { "epoch": 0.26, "learning_rate": 1.72656732006105e-05, "loss": 21.5225, "step": 24410 }, { "epoch": 0.26, "learning_rate": 1.7263266989344032e-05, "loss": 21.98, "step": 24420 }, { "epoch": 0.26, "learning_rate": 1.726085988763725e-05, "loss": 21.2006, "step": 24430 }, { "epoch": 0.26, "learning_rate": 1.725845189578525e-05, "loss": 21.5141, "step": 24440 }, { "epoch": 0.26, "learning_rate": 1.725604301408324e-05, "loss": 21.7455, "step": 24450 }, { "epoch": 0.26, "learning_rate": 1.7253633242826532e-05, "loss": 21.9689, "step": 24460 }, { "epoch": 0.26, "learning_rate": 1.7251222582310562e-05, "loss": 21.4349, "step": 24470 }, { "epoch": 0.26, "learning_rate": 1.7248811032830855e-05, "loss": 22.3122, "step": 24480 }, { "epoch": 0.26, "learning_rate": 1.724639859468306e-05, "loss": 21.6911, "step": 24490 }, { "epoch": 0.26, "learning_rate": 1.724398526816293e-05, "loss": 21.7117, "step": 24500 }, { "epoch": 0.26, "learning_rate": 1.7241571053566325e-05, "loss": 21.56, "step": 24510 }, { "epoch": 0.27, "learning_rate": 1.7239155951189217e-05, "loss": 21.7581, "step": 24520 }, { "epoch": 0.27, "learning_rate": 1.7236739961327687e-05, "loss": 21.7526, "step": 24530 }, { "epoch": 0.27, "learning_rate": 1.723432308427792e-05, "loss": 22.2921, "step": 24540 }, { "epoch": 0.27, "learning_rate": 1.7231905320336213e-05, "loss": 21.5567, "step": 24550 }, { "epoch": 0.27, "learning_rate": 1.7229486669798974e-05, "loss": 21.0646, "step": 24560 }, { "epoch": 0.27, "learning_rate": 1.722706713296272e-05, "loss": 20.9818, "step": 24570 }, { "epoch": 0.27, "learning_rate": 1.7224646710124068e-05, "loss": 21.3997, "step": 24580 }, { "epoch": 0.27, "learning_rate": 1.722222540157975e-05, "loss": 21.431, "step": 24590 }, { "epoch": 0.27, "learning_rate": 1.7219803207626612e-05, "loss": 20.6614, "step": 24600 }, { "epoch": 0.27, "learning_rate": 1.72173801285616e-05, "loss": 20.9391, "step": 24610 }, { "epoch": 0.27, "learning_rate": 1.7214956164681775e-05, "loss": 21.5718, "step": 24620 }, { "epoch": 0.27, "learning_rate": 1.7212531316284294e-05, "loss": 21.0788, "step": 24630 }, { "epoch": 0.27, "learning_rate": 1.721010558366644e-05, "loss": 21.6799, "step": 24640 }, { "epoch": 0.27, "learning_rate": 1.7207678967125588e-05, "loss": 21.8114, "step": 24650 }, { "epoch": 0.27, "learning_rate": 1.7205251466959237e-05, "loss": 20.9005, "step": 24660 }, { "epoch": 0.27, "learning_rate": 1.720282308346498e-05, "loss": 21.4754, "step": 24670 }, { "epoch": 0.27, "learning_rate": 1.720039381694053e-05, "loss": 21.8898, "step": 24680 }, { "epoch": 0.27, "learning_rate": 1.71979636676837e-05, "loss": 21.0222, "step": 24690 }, { "epoch": 0.27, "learning_rate": 1.7195532635992414e-05, "loss": 22.1157, "step": 24700 }, { "epoch": 0.27, "learning_rate": 1.7193100722164705e-05, "loss": 22.7936, "step": 24710 }, { "epoch": 0.27, "learning_rate": 1.7190667926498713e-05, "loss": 20.7328, "step": 24720 }, { "epoch": 0.27, "learning_rate": 1.718823424929269e-05, "loss": 21.7292, "step": 24730 }, { "epoch": 0.27, "learning_rate": 1.718579969084499e-05, "loss": 21.5505, "step": 24740 }, { "epoch": 0.27, "learning_rate": 1.7183364251454074e-05, "loss": 22.5246, "step": 24750 }, { "epoch": 0.27, "learning_rate": 1.718092793141852e-05, "loss": 21.1658, "step": 24760 }, { "epoch": 0.27, "learning_rate": 1.7178490731037007e-05, "loss": 21.2434, "step": 24770 }, { "epoch": 0.27, "learning_rate": 1.7176052650608323e-05, "loss": 22.1075, "step": 24780 }, { "epoch": 0.27, "learning_rate": 1.7173613690431365e-05, "loss": 21.0248, "step": 24790 }, { "epoch": 0.27, "learning_rate": 1.717117385080514e-05, "loss": 21.4432, "step": 24800 }, { "epoch": 0.27, "learning_rate": 1.7168733132028754e-05, "loss": 21.8843, "step": 24810 }, { "epoch": 0.27, "learning_rate": 1.7166291534401432e-05, "loss": 21.7221, "step": 24820 }, { "epoch": 0.27, "learning_rate": 1.71638490582225e-05, "loss": 22.1173, "step": 24830 }, { "epoch": 0.27, "learning_rate": 1.7161405703791397e-05, "loss": 22.0424, "step": 24840 }, { "epoch": 0.27, "learning_rate": 1.715896147140766e-05, "loss": 21.7984, "step": 24850 }, { "epoch": 0.27, "learning_rate": 1.715651636137094e-05, "loss": 21.2739, "step": 24860 }, { "epoch": 0.27, "learning_rate": 1.7154070373981e-05, "loss": 21.3599, "step": 24870 }, { "epoch": 0.27, "learning_rate": 1.7151623509537704e-05, "loss": 21.6377, "step": 24880 }, { "epoch": 0.27, "learning_rate": 1.7149175768341025e-05, "loss": 21.4534, "step": 24890 }, { "epoch": 0.27, "learning_rate": 1.7146727150691048e-05, "loss": 21.0286, "step": 24900 }, { "epoch": 0.27, "learning_rate": 1.714427765688795e-05, "loss": 21.2482, "step": 24910 }, { "epoch": 0.27, "learning_rate": 1.7141827287232037e-05, "loss": 21.3434, "step": 24920 }, { "epoch": 0.27, "learning_rate": 1.713937604202371e-05, "loss": 21.0217, "step": 24930 }, { "epoch": 0.27, "learning_rate": 1.7136923921563476e-05, "loss": 21.7769, "step": 24940 }, { "epoch": 0.27, "learning_rate": 1.7134470926151955e-05, "loss": 21.844, "step": 24950 }, { "epoch": 0.27, "learning_rate": 1.7132017056089876e-05, "loss": 21.547, "step": 24960 }, { "epoch": 0.27, "learning_rate": 1.7129562311678064e-05, "loss": 21.5216, "step": 24970 }, { "epoch": 0.27, "learning_rate": 1.7127106693217463e-05, "loss": 21.9306, "step": 24980 }, { "epoch": 0.27, "learning_rate": 1.712465020100912e-05, "loss": 21.0174, "step": 24990 }, { "epoch": 0.27, "learning_rate": 1.7122192835354184e-05, "loss": 20.9439, "step": 25000 }, { "epoch": 0.27, "learning_rate": 1.7119734596553922e-05, "loss": 21.9415, "step": 25010 }, { "epoch": 0.27, "learning_rate": 1.7117275484909694e-05, "loss": 21.1127, "step": 25020 }, { "epoch": 0.27, "learning_rate": 1.7114815500722987e-05, "loss": 21.8462, "step": 25030 }, { "epoch": 0.27, "learning_rate": 1.711235464429537e-05, "loss": 21.1019, "step": 25040 }, { "epoch": 0.27, "learning_rate": 1.7109892915928535e-05, "loss": 21.0442, "step": 25050 }, { "epoch": 0.27, "learning_rate": 1.7107430315924282e-05, "loss": 21.4202, "step": 25060 }, { "epoch": 0.27, "learning_rate": 1.7104966844584514e-05, "loss": 21.7273, "step": 25070 }, { "epoch": 0.27, "learning_rate": 1.7102502502211235e-05, "loss": 21.5466, "step": 25080 }, { "epoch": 0.27, "learning_rate": 1.7100037289106565e-05, "loss": 21.3203, "step": 25090 }, { "epoch": 0.27, "learning_rate": 1.7097571205572726e-05, "loss": 20.8484, "step": 25100 }, { "epoch": 0.27, "learning_rate": 1.7095104251912043e-05, "loss": 21.8887, "step": 25110 }, { "epoch": 0.27, "learning_rate": 1.709263642842696e-05, "loss": 21.0074, "step": 25120 }, { "epoch": 0.27, "learning_rate": 1.7090167735420013e-05, "loss": 21.6731, "step": 25130 }, { "epoch": 0.27, "learning_rate": 1.7087698173193857e-05, "loss": 21.3058, "step": 25140 }, { "epoch": 0.27, "learning_rate": 1.7085227742051244e-05, "loss": 22.0825, "step": 25150 }, { "epoch": 0.27, "learning_rate": 1.708275644229504e-05, "loss": 22.092, "step": 25160 }, { "epoch": 0.27, "learning_rate": 1.708028427422821e-05, "loss": 21.4493, "step": 25170 }, { "epoch": 0.27, "learning_rate": 1.707781123815383e-05, "loss": 21.2917, "step": 25180 }, { "epoch": 0.27, "learning_rate": 1.7075337334375086e-05, "loss": 20.9149, "step": 25190 }, { "epoch": 0.27, "learning_rate": 1.7072862563195266e-05, "loss": 21.5216, "step": 25200 }, { "epoch": 0.27, "learning_rate": 1.7070386924917756e-05, "loss": 21.2782, "step": 25210 }, { "epoch": 0.27, "learning_rate": 1.7067910419846067e-05, "loss": 21.3505, "step": 25220 }, { "epoch": 0.27, "learning_rate": 1.7065433048283803e-05, "loss": 21.6624, "step": 25230 }, { "epoch": 0.27, "learning_rate": 1.7062954810534677e-05, "loss": 21.1092, "step": 25240 }, { "epoch": 0.27, "learning_rate": 1.7060475706902505e-05, "loss": 21.0515, "step": 25250 }, { "epoch": 0.27, "learning_rate": 1.705799573769122e-05, "loss": 21.4196, "step": 25260 }, { "epoch": 0.27, "learning_rate": 1.7055514903204846e-05, "loss": 22.1364, "step": 25270 }, { "epoch": 0.27, "learning_rate": 1.705303320374753e-05, "loss": 21.6214, "step": 25280 }, { "epoch": 0.27, "learning_rate": 1.7050550639623505e-05, "loss": 21.8538, "step": 25290 }, { "epoch": 0.27, "learning_rate": 1.7048067211137135e-05, "loss": 22.2564, "step": 25300 }, { "epoch": 0.27, "learning_rate": 1.704558291859286e-05, "loss": 21.8005, "step": 25310 }, { "epoch": 0.27, "learning_rate": 1.704309776229525e-05, "loss": 21.064, "step": 25320 }, { "epoch": 0.27, "learning_rate": 1.7040611742548978e-05, "loss": 21.3085, "step": 25330 }, { "epoch": 0.27, "learning_rate": 1.7038124859658808e-05, "loss": 21.6103, "step": 25340 }, { "epoch": 0.27, "learning_rate": 1.7035637113929622e-05, "loss": 21.6467, "step": 25350 }, { "epoch": 0.27, "learning_rate": 1.7033148505666414e-05, "loss": 20.9963, "step": 25360 }, { "epoch": 0.27, "learning_rate": 1.703065903517426e-05, "loss": 21.1418, "step": 25370 }, { "epoch": 0.27, "learning_rate": 1.702816870275837e-05, "loss": 21.5534, "step": 25380 }, { "epoch": 0.27, "learning_rate": 1.7025677508724037e-05, "loss": 21.5455, "step": 25390 }, { "epoch": 0.27, "learning_rate": 1.7023185453376678e-05, "loss": 21.5495, "step": 25400 }, { "epoch": 0.27, "learning_rate": 1.7020692537021795e-05, "loss": 21.7311, "step": 25410 }, { "epoch": 0.27, "learning_rate": 1.7018198759965018e-05, "loss": 21.9051, "step": 25420 }, { "epoch": 0.27, "learning_rate": 1.701570412251206e-05, "loss": 22.1954, "step": 25430 }, { "epoch": 0.28, "learning_rate": 1.7013208624968766e-05, "loss": 21.6152, "step": 25440 }, { "epoch": 0.28, "learning_rate": 1.7010712267641062e-05, "loss": 22.0579, "step": 25450 }, { "epoch": 0.28, "learning_rate": 1.7008215050834986e-05, "loss": 22.8699, "step": 25460 }, { "epoch": 0.28, "learning_rate": 1.7005716974856693e-05, "loss": 22.2694, "step": 25470 }, { "epoch": 0.28, "learning_rate": 1.700321804001243e-05, "loss": 21.4595, "step": 25480 }, { "epoch": 0.28, "learning_rate": 1.7000718246608554e-05, "loss": 21.9472, "step": 25490 }, { "epoch": 0.28, "learning_rate": 1.6998217594951527e-05, "loss": 20.753, "step": 25500 }, { "epoch": 0.28, "learning_rate": 1.699571608534792e-05, "loss": 21.5508, "step": 25510 }, { "epoch": 0.28, "learning_rate": 1.6993213718104403e-05, "loss": 20.9774, "step": 25520 }, { "epoch": 0.28, "learning_rate": 1.699071049352775e-05, "loss": 21.8558, "step": 25530 }, { "epoch": 0.28, "learning_rate": 1.698820641192485e-05, "loss": 20.4868, "step": 25540 }, { "epoch": 0.28, "learning_rate": 1.6985701473602686e-05, "loss": 21.0368, "step": 25550 }, { "epoch": 0.28, "learning_rate": 1.6983195678868355e-05, "loss": 22.1106, "step": 25560 }, { "epoch": 0.28, "learning_rate": 1.6980689028029054e-05, "loss": 22.1131, "step": 25570 }, { "epoch": 0.28, "learning_rate": 1.6978181521392084e-05, "loss": 21.1569, "step": 25580 }, { "epoch": 0.28, "learning_rate": 1.6975673159264854e-05, "loss": 22.6025, "step": 25590 }, { "epoch": 0.28, "learning_rate": 1.697316394195488e-05, "loss": 21.3992, "step": 25600 }, { "epoch": 0.28, "learning_rate": 1.697065386976977e-05, "loss": 21.6315, "step": 25610 }, { "epoch": 0.28, "learning_rate": 1.6968142943017253e-05, "loss": 21.5079, "step": 25620 }, { "epoch": 0.28, "learning_rate": 1.696563116200516e-05, "loss": 21.8239, "step": 25630 }, { "epoch": 0.28, "learning_rate": 1.6963118527041413e-05, "loss": 21.4807, "step": 25640 }, { "epoch": 0.28, "learning_rate": 1.696060503843406e-05, "loss": 20.9954, "step": 25650 }, { "epoch": 0.28, "learning_rate": 1.695809069649123e-05, "loss": 21.3373, "step": 25660 }, { "epoch": 0.28, "learning_rate": 1.695557550152118e-05, "loss": 21.0975, "step": 25670 }, { "epoch": 0.28, "learning_rate": 1.6953059453832254e-05, "loss": 22.0235, "step": 25680 }, { "epoch": 0.28, "learning_rate": 1.695054255373291e-05, "loss": 20.6282, "step": 25690 }, { "epoch": 0.28, "learning_rate": 1.69480248015317e-05, "loss": 21.8696, "step": 25700 }, { "epoch": 0.28, "learning_rate": 1.6945506197537298e-05, "loss": 21.2821, "step": 25710 }, { "epoch": 0.28, "learning_rate": 1.6942986742058465e-05, "loss": 21.5338, "step": 25720 }, { "epoch": 0.28, "learning_rate": 1.6940466435404078e-05, "loss": 21.5562, "step": 25730 }, { "epoch": 0.28, "learning_rate": 1.6937945277883113e-05, "loss": 22.4078, "step": 25740 }, { "epoch": 0.28, "learning_rate": 1.693542326980465e-05, "loss": 21.7984, "step": 25750 }, { "epoch": 0.28, "learning_rate": 1.6932900411477874e-05, "loss": 21.0917, "step": 25760 }, { "epoch": 0.28, "learning_rate": 1.6930376703212076e-05, "loss": 21.4607, "step": 25770 }, { "epoch": 0.28, "learning_rate": 1.6927852145316654e-05, "loss": 21.4219, "step": 25780 }, { "epoch": 0.28, "learning_rate": 1.69253267381011e-05, "loss": 21.9393, "step": 25790 }, { "epoch": 0.28, "learning_rate": 1.6922800481875018e-05, "loss": 21.5905, "step": 25800 }, { "epoch": 0.28, "learning_rate": 1.6920273376948117e-05, "loss": 21.453, "step": 25810 }, { "epoch": 0.28, "learning_rate": 1.6917745423630205e-05, "loss": 21.0464, "step": 25820 }, { "epoch": 0.28, "learning_rate": 1.6915216622231197e-05, "loss": 21.2284, "step": 25830 }, { "epoch": 0.28, "learning_rate": 1.6912686973061113e-05, "loss": 21.3885, "step": 25840 }, { "epoch": 0.28, "learning_rate": 1.6910156476430072e-05, "loss": 21.6782, "step": 25850 }, { "epoch": 0.28, "learning_rate": 1.6907625132648303e-05, "loss": 21.3027, "step": 25860 }, { "epoch": 0.28, "learning_rate": 1.6905092942026137e-05, "loss": 22.1036, "step": 25870 }, { "epoch": 0.28, "learning_rate": 1.6902559904874002e-05, "loss": 21.2696, "step": 25880 }, { "epoch": 0.28, "learning_rate": 1.690002602150244e-05, "loss": 21.818, "step": 25890 }, { "epoch": 0.28, "learning_rate": 1.68974912922221e-05, "loss": 21.4325, "step": 25900 }, { "epoch": 0.28, "learning_rate": 1.6894955717343713e-05, "loss": 21.8491, "step": 25910 }, { "epoch": 0.28, "learning_rate": 1.6892419297178138e-05, "loss": 21.4758, "step": 25920 }, { "epoch": 0.28, "learning_rate": 1.688988203203632e-05, "loss": 21.7171, "step": 25930 }, { "epoch": 0.28, "learning_rate": 1.688734392222932e-05, "loss": 21.3897, "step": 25940 }, { "epoch": 0.28, "learning_rate": 1.6884804968068303e-05, "loss": 21.4235, "step": 25950 }, { "epoch": 0.28, "learning_rate": 1.688226516986452e-05, "loss": 21.97, "step": 25960 }, { "epoch": 0.28, "learning_rate": 1.6879724527929343e-05, "loss": 21.2979, "step": 25970 }, { "epoch": 0.28, "learning_rate": 1.6877183042574246e-05, "loss": 21.1451, "step": 25980 }, { "epoch": 0.28, "learning_rate": 1.6874640714110793e-05, "loss": 21.965, "step": 25990 }, { "epoch": 0.28, "learning_rate": 1.6872097542850672e-05, "loss": 21.9542, "step": 26000 }, { "epoch": 0.28, "learning_rate": 1.6869553529105656e-05, "loss": 21.643, "step": 26010 }, { "epoch": 0.28, "learning_rate": 1.686700867318763e-05, "loss": 22.0746, "step": 26020 }, { "epoch": 0.28, "learning_rate": 1.686446297540858e-05, "loss": 21.8931, "step": 26030 }, { "epoch": 0.28, "learning_rate": 1.6861916436080597e-05, "loss": 21.3548, "step": 26040 }, { "epoch": 0.28, "learning_rate": 1.6859369055515876e-05, "loss": 21.4132, "step": 26050 }, { "epoch": 0.28, "learning_rate": 1.6856820834026708e-05, "loss": 21.7187, "step": 26060 }, { "epoch": 0.28, "learning_rate": 1.6854271771925495e-05, "loss": 21.5735, "step": 26070 }, { "epoch": 0.28, "learning_rate": 1.6851721869524742e-05, "loss": 21.6672, "step": 26080 }, { "epoch": 0.28, "learning_rate": 1.684917112713705e-05, "loss": 22.4142, "step": 26090 }, { "epoch": 0.28, "learning_rate": 1.6846619545075128e-05, "loss": 21.8551, "step": 26100 }, { "epoch": 0.28, "learning_rate": 1.684406712365179e-05, "loss": 21.3167, "step": 26110 }, { "epoch": 0.28, "learning_rate": 1.6841513863179947e-05, "loss": 21.3347, "step": 26120 }, { "epoch": 0.28, "learning_rate": 1.683895976397262e-05, "loss": 21.1492, "step": 26130 }, { "epoch": 0.28, "learning_rate": 1.6836404826342922e-05, "loss": 21.297, "step": 26140 }, { "epoch": 0.28, "learning_rate": 1.683384905060408e-05, "loss": 21.207, "step": 26150 }, { "epoch": 0.28, "learning_rate": 1.6831292437069425e-05, "loss": 21.8104, "step": 26160 }, { "epoch": 0.28, "learning_rate": 1.6828734986052375e-05, "loss": 21.1586, "step": 26170 }, { "epoch": 0.28, "learning_rate": 1.6826176697866467e-05, "loss": 22.0879, "step": 26180 }, { "epoch": 0.28, "learning_rate": 1.6823617572825332e-05, "loss": 21.9457, "step": 26190 }, { "epoch": 0.28, "learning_rate": 1.6821057611242705e-05, "loss": 21.7905, "step": 26200 }, { "epoch": 0.28, "learning_rate": 1.6818496813432425e-05, "loss": 21.7108, "step": 26210 }, { "epoch": 0.28, "learning_rate": 1.6815935179708436e-05, "loss": 21.3084, "step": 26220 }, { "epoch": 0.28, "learning_rate": 1.6813372710384775e-05, "loss": 21.7913, "step": 26230 }, { "epoch": 0.28, "learning_rate": 1.6810809405775595e-05, "loss": 21.3762, "step": 26240 }, { "epoch": 0.28, "learning_rate": 1.6808245266195146e-05, "loss": 21.2098, "step": 26250 }, { "epoch": 0.28, "learning_rate": 1.6805680291957772e-05, "loss": 21.1634, "step": 26260 }, { "epoch": 0.28, "learning_rate": 1.680311448337793e-05, "loss": 21.2239, "step": 26270 }, { "epoch": 0.28, "learning_rate": 1.680054784077017e-05, "loss": 21.1624, "step": 26280 }, { "epoch": 0.28, "learning_rate": 1.6797980364449152e-05, "loss": 21.5842, "step": 26290 }, { "epoch": 0.28, "learning_rate": 1.679541205472964e-05, "loss": 21.1933, "step": 26300 }, { "epoch": 0.28, "learning_rate": 1.6792842911926494e-05, "loss": 21.2718, "step": 26310 }, { "epoch": 0.28, "learning_rate": 1.6790272936354676e-05, "loss": 21.6403, "step": 26320 }, { "epoch": 0.28, "learning_rate": 1.6787702128329256e-05, "loss": 21.1438, "step": 26330 }, { "epoch": 0.28, "learning_rate": 1.6785130488165398e-05, "loss": 20.8673, "step": 26340 }, { "epoch": 0.28, "learning_rate": 1.6782558016178376e-05, "loss": 21.9909, "step": 26350 }, { "epoch": 0.28, "learning_rate": 1.6779984712683555e-05, "loss": 21.8302, "step": 26360 }, { "epoch": 0.29, "learning_rate": 1.677741057799642e-05, "loss": 21.2949, "step": 26370 }, { "epoch": 0.29, "learning_rate": 1.677483561243254e-05, "loss": 21.2875, "step": 26380 }, { "epoch": 0.29, "learning_rate": 1.6772259816307593e-05, "loss": 21.1816, "step": 26390 }, { "epoch": 0.29, "learning_rate": 1.676968318993736e-05, "loss": 22.2946, "step": 26400 }, { "epoch": 0.29, "learning_rate": 1.6767105733637724e-05, "loss": 21.0877, "step": 26410 }, { "epoch": 0.29, "learning_rate": 1.6764527447724664e-05, "loss": 21.3587, "step": 26420 }, { "epoch": 0.29, "learning_rate": 1.6761948332514273e-05, "loss": 20.6317, "step": 26430 }, { "epoch": 0.29, "learning_rate": 1.6759368388322732e-05, "loss": 21.0872, "step": 26440 }, { "epoch": 0.29, "learning_rate": 1.6756787615466326e-05, "loss": 21.2912, "step": 26450 }, { "epoch": 0.29, "learning_rate": 1.6754206014261452e-05, "loss": 21.5426, "step": 26460 }, { "epoch": 0.29, "learning_rate": 1.6751623585024596e-05, "loss": 21.7929, "step": 26470 }, { "epoch": 0.29, "learning_rate": 1.674904032807236e-05, "loss": 21.8562, "step": 26480 }, { "epoch": 0.29, "learning_rate": 1.6746456243721424e-05, "loss": 21.0936, "step": 26490 }, { "epoch": 0.29, "learning_rate": 1.6743871332288594e-05, "loss": 22.5624, "step": 26500 }, { "epoch": 0.29, "learning_rate": 1.6741285594090767e-05, "loss": 21.4717, "step": 26510 }, { "epoch": 0.29, "learning_rate": 1.6738699029444936e-05, "loss": 21.0167, "step": 26520 }, { "epoch": 0.29, "learning_rate": 1.6736111638668203e-05, "loss": 22.3838, "step": 26530 }, { "epoch": 0.29, "learning_rate": 1.673352342207778e-05, "loss": 22.0922, "step": 26540 }, { "epoch": 0.29, "learning_rate": 1.673093437999095e-05, "loss": 22.2234, "step": 26550 }, { "epoch": 0.29, "learning_rate": 1.6728344512725127e-05, "loss": 21.4294, "step": 26560 }, { "epoch": 0.29, "learning_rate": 1.6725753820597818e-05, "loss": 20.9333, "step": 26570 }, { "epoch": 0.29, "learning_rate": 1.6723162303926628e-05, "loss": 21.3491, "step": 26580 }, { "epoch": 0.29, "learning_rate": 1.672056996302926e-05, "loss": 21.874, "step": 26590 }, { "epoch": 0.29, "learning_rate": 1.6717976798223527e-05, "loss": 21.5892, "step": 26600 }, { "epoch": 0.29, "learning_rate": 1.6715382809827337e-05, "loss": 21.1523, "step": 26610 }, { "epoch": 0.29, "learning_rate": 1.6712787998158694e-05, "loss": 21.1469, "step": 26620 }, { "epoch": 0.29, "learning_rate": 1.6710192363535715e-05, "loss": 21.7546, "step": 26630 }, { "epoch": 0.29, "learning_rate": 1.670759590627661e-05, "loss": 20.8931, "step": 26640 }, { "epoch": 0.29, "learning_rate": 1.6704998626699692e-05, "loss": 21.4233, "step": 26650 }, { "epoch": 0.29, "learning_rate": 1.670240052512338e-05, "loss": 21.5387, "step": 26660 }, { "epoch": 0.29, "learning_rate": 1.6699801601866178e-05, "loss": 21.562, "step": 26670 }, { "epoch": 0.29, "learning_rate": 1.6697201857246707e-05, "loss": 20.8645, "step": 26680 }, { "epoch": 0.29, "learning_rate": 1.669460129158368e-05, "loss": 22.145, "step": 26690 }, { "epoch": 0.29, "learning_rate": 1.6691999905195917e-05, "loss": 20.8362, "step": 26700 }, { "epoch": 0.29, "learning_rate": 1.6689397698402333e-05, "loss": 21.5509, "step": 26710 }, { "epoch": 0.29, "learning_rate": 1.6686794671521945e-05, "loss": 21.5305, "step": 26720 }, { "epoch": 0.29, "learning_rate": 1.6684190824873875e-05, "loss": 21.8017, "step": 26730 }, { "epoch": 0.29, "learning_rate": 1.6681586158777334e-05, "loss": 21.3537, "step": 26740 }, { "epoch": 0.29, "learning_rate": 1.6678980673551644e-05, "loss": 21.3471, "step": 26750 }, { "epoch": 0.29, "learning_rate": 1.667637436951623e-05, "loss": 21.8242, "step": 26760 }, { "epoch": 0.29, "learning_rate": 1.667376724699061e-05, "loss": 21.6683, "step": 26770 }, { "epoch": 0.29, "learning_rate": 1.6671159306294397e-05, "loss": 21.4478, "step": 26780 }, { "epoch": 0.29, "learning_rate": 1.666855054774732e-05, "loss": 21.9741, "step": 26790 }, { "epoch": 0.29, "learning_rate": 1.6665940971669195e-05, "loss": 21.3025, "step": 26800 }, { "epoch": 0.29, "learning_rate": 1.6663330578379943e-05, "loss": 22.4047, "step": 26810 }, { "epoch": 0.29, "learning_rate": 1.666071936819959e-05, "loss": 21.3908, "step": 26820 }, { "epoch": 0.29, "learning_rate": 1.6658107341448252e-05, "loss": 21.5982, "step": 26830 }, { "epoch": 0.29, "learning_rate": 1.6655494498446154e-05, "loss": 21.0016, "step": 26840 }, { "epoch": 0.29, "learning_rate": 1.6652880839513615e-05, "loss": 21.2399, "step": 26850 }, { "epoch": 0.29, "learning_rate": 1.6650266364971056e-05, "loss": 21.5271, "step": 26860 }, { "epoch": 0.29, "learning_rate": 1.6647651075139e-05, "loss": 21.6543, "step": 26870 }, { "epoch": 0.29, "learning_rate": 1.664503497033807e-05, "loss": 21.8152, "step": 26880 }, { "epoch": 0.29, "learning_rate": 1.6642418050888985e-05, "loss": 21.428, "step": 26890 }, { "epoch": 0.29, "learning_rate": 1.663980031711257e-05, "loss": 21.6072, "step": 26900 }, { "epoch": 0.29, "learning_rate": 1.663718176932974e-05, "loss": 21.8684, "step": 26910 }, { "epoch": 0.29, "learning_rate": 1.663456240786152e-05, "loss": 21.8351, "step": 26920 }, { "epoch": 0.29, "learning_rate": 1.6631942233029034e-05, "loss": 22.345, "step": 26930 }, { "epoch": 0.29, "learning_rate": 1.6629321245153494e-05, "loss": 21.8939, "step": 26940 }, { "epoch": 0.29, "learning_rate": 1.6626699444556225e-05, "loss": 22.0321, "step": 26950 }, { "epoch": 0.29, "learning_rate": 1.6624076831558645e-05, "loss": 21.8133, "step": 26960 }, { "epoch": 0.29, "learning_rate": 1.6621453406482277e-05, "loss": 20.5813, "step": 26970 }, { "epoch": 0.29, "learning_rate": 1.6618829169648733e-05, "loss": 21.3001, "step": 26980 }, { "epoch": 0.29, "learning_rate": 1.6616204121379736e-05, "loss": 21.4155, "step": 26990 }, { "epoch": 0.29, "learning_rate": 1.661357826199711e-05, "loss": 21.8756, "step": 27000 }, { "epoch": 0.29, "learning_rate": 1.661095159182276e-05, "loss": 22.4733, "step": 27010 }, { "epoch": 0.29, "learning_rate": 1.6608324111178706e-05, "loss": 22.1948, "step": 27020 }, { "epoch": 0.29, "learning_rate": 1.6605695820387072e-05, "loss": 21.9767, "step": 27030 }, { "epoch": 0.29, "learning_rate": 1.6603066719770066e-05, "loss": 22.2678, "step": 27040 }, { "epoch": 0.29, "learning_rate": 1.660043680965e-05, "loss": 22.0155, "step": 27050 }, { "epoch": 0.29, "learning_rate": 1.6597806090349296e-05, "loss": 21.2259, "step": 27060 }, { "epoch": 0.29, "learning_rate": 1.659517456219046e-05, "loss": 21.2566, "step": 27070 }, { "epoch": 0.29, "learning_rate": 1.659254222549611e-05, "loss": 21.099, "step": 27080 }, { "epoch": 0.29, "learning_rate": 1.6589909080588954e-05, "loss": 22.065, "step": 27090 }, { "epoch": 0.29, "learning_rate": 1.6587275127791804e-05, "loss": 21.1278, "step": 27100 }, { "epoch": 0.29, "learning_rate": 1.6584640367427568e-05, "loss": 21.0846, "step": 27110 }, { "epoch": 0.29, "learning_rate": 1.658200479981926e-05, "loss": 21.8793, "step": 27120 }, { "epoch": 0.29, "learning_rate": 1.6579368425289976e-05, "loss": 21.7556, "step": 27130 }, { "epoch": 0.29, "learning_rate": 1.657673124416293e-05, "loss": 21.4954, "step": 27140 }, { "epoch": 0.29, "learning_rate": 1.6574093256761425e-05, "loss": 22.0279, "step": 27150 }, { "epoch": 0.29, "learning_rate": 1.6571454463408872e-05, "loss": 21.524, "step": 27160 }, { "epoch": 0.29, "learning_rate": 1.6568814864428762e-05, "loss": 21.1982, "step": 27170 }, { "epoch": 0.29, "learning_rate": 1.6566174460144705e-05, "loss": 21.2535, "step": 27180 }, { "epoch": 0.29, "learning_rate": 1.6563533250880404e-05, "loss": 21.3971, "step": 27190 }, { "epoch": 0.29, "learning_rate": 1.656089123695965e-05, "loss": 21.0373, "step": 27200 }, { "epoch": 0.29, "learning_rate": 1.655824841870634e-05, "loss": 22.2532, "step": 27210 }, { "epoch": 0.29, "learning_rate": 1.655560479644448e-05, "loss": 21.8088, "step": 27220 }, { "epoch": 0.29, "learning_rate": 1.6552960370498157e-05, "loss": 22.1383, "step": 27230 }, { "epoch": 0.29, "learning_rate": 1.6550315141191567e-05, "loss": 21.2044, "step": 27240 }, { "epoch": 0.29, "learning_rate": 1.6547669108849e-05, "loss": 22.4593, "step": 27250 }, { "epoch": 0.29, "learning_rate": 1.654502227379485e-05, "loss": 21.2038, "step": 27260 }, { "epoch": 0.29, "learning_rate": 1.6542374636353605e-05, "loss": 21.8405, "step": 27270 }, { "epoch": 0.29, "learning_rate": 1.653972619684985e-05, "loss": 20.79, "step": 27280 }, { "epoch": 0.3, "learning_rate": 1.6537076955608272e-05, "loss": 21.2995, "step": 27290 }, { "epoch": 0.3, "learning_rate": 1.6534426912953652e-05, "loss": 20.6619, "step": 27300 }, { "epoch": 0.3, "learning_rate": 1.6531776069210877e-05, "loss": 21.9116, "step": 27310 }, { "epoch": 0.3, "learning_rate": 1.652912442470492e-05, "loss": 21.7788, "step": 27320 }, { "epoch": 0.3, "learning_rate": 1.652647197976087e-05, "loss": 21.4847, "step": 27330 }, { "epoch": 0.3, "learning_rate": 1.6523818734703895e-05, "loss": 20.9894, "step": 27340 }, { "epoch": 0.3, "learning_rate": 1.652116468985927e-05, "loss": 21.3529, "step": 27350 }, { "epoch": 0.3, "learning_rate": 1.651850984555237e-05, "loss": 21.4317, "step": 27360 }, { "epoch": 0.3, "learning_rate": 1.6515854202108668e-05, "loss": 22.1601, "step": 27370 }, { "epoch": 0.3, "learning_rate": 1.651319775985373e-05, "loss": 22.1142, "step": 27380 }, { "epoch": 0.3, "learning_rate": 1.6510540519113222e-05, "loss": 21.3998, "step": 27390 }, { "epoch": 0.3, "learning_rate": 1.6507882480212908e-05, "loss": 21.1619, "step": 27400 }, { "epoch": 0.3, "learning_rate": 1.650522364347865e-05, "loss": 21.1908, "step": 27410 }, { "epoch": 0.3, "learning_rate": 1.650256400923641e-05, "loss": 22.0027, "step": 27420 }, { "epoch": 0.3, "learning_rate": 1.6499903577812252e-05, "loss": 22.1363, "step": 27430 }, { "epoch": 0.3, "learning_rate": 1.6497242349532317e-05, "loss": 21.6285, "step": 27440 }, { "epoch": 0.3, "learning_rate": 1.649458032472287e-05, "loss": 21.9248, "step": 27450 }, { "epoch": 0.3, "learning_rate": 1.6491917503710257e-05, "loss": 20.8433, "step": 27460 }, { "epoch": 0.3, "learning_rate": 1.6489253886820927e-05, "loss": 21.1439, "step": 27470 }, { "epoch": 0.3, "learning_rate": 1.6486589474381428e-05, "loss": 21.3815, "step": 27480 }, { "epoch": 0.3, "learning_rate": 1.6483924266718405e-05, "loss": 21.4846, "step": 27490 }, { "epoch": 0.3, "learning_rate": 1.6481258264158595e-05, "loss": 21.5401, "step": 27500 }, { "epoch": 0.3, "learning_rate": 1.6478591467028838e-05, "loss": 21.1087, "step": 27510 }, { "epoch": 0.3, "learning_rate": 1.6475923875656073e-05, "loss": 20.4721, "step": 27520 }, { "epoch": 0.3, "learning_rate": 1.6473255490367326e-05, "loss": 21.1728, "step": 27530 }, { "epoch": 0.3, "learning_rate": 1.6470586311489735e-05, "loss": 21.9755, "step": 27540 }, { "epoch": 0.3, "learning_rate": 1.646791633935053e-05, "loss": 21.3965, "step": 27550 }, { "epoch": 0.3, "learning_rate": 1.6465245574277028e-05, "loss": 20.8194, "step": 27560 }, { "epoch": 0.3, "learning_rate": 1.6462574016596655e-05, "loss": 21.531, "step": 27570 }, { "epoch": 0.3, "learning_rate": 1.645990166663693e-05, "loss": 21.5775, "step": 27580 }, { "epoch": 0.3, "learning_rate": 1.6457228524725475e-05, "loss": 20.8324, "step": 27590 }, { "epoch": 0.3, "learning_rate": 1.6454554591189997e-05, "loss": 21.4325, "step": 27600 }, { "epoch": 0.3, "learning_rate": 1.645187986635831e-05, "loss": 21.4341, "step": 27610 }, { "epoch": 0.3, "learning_rate": 1.6449204350558323e-05, "loss": 21.5612, "step": 27620 }, { "epoch": 0.3, "learning_rate": 1.644652804411804e-05, "loss": 21.6994, "step": 27630 }, { "epoch": 0.3, "learning_rate": 1.644385094736556e-05, "loss": 20.8437, "step": 27640 }, { "epoch": 0.3, "learning_rate": 1.6441173060629084e-05, "loss": 21.1692, "step": 27650 }, { "epoch": 0.3, "learning_rate": 1.643849438423691e-05, "loss": 21.3746, "step": 27660 }, { "epoch": 0.3, "learning_rate": 1.6435814918517427e-05, "loss": 20.8873, "step": 27670 }, { "epoch": 0.3, "learning_rate": 1.643313466379912e-05, "loss": 21.3713, "step": 27680 }, { "epoch": 0.3, "learning_rate": 1.6430453620410586e-05, "loss": 21.2, "step": 27690 }, { "epoch": 0.3, "learning_rate": 1.64277717886805e-05, "loss": 21.47, "step": 27700 }, { "epoch": 0.3, "learning_rate": 1.642508916893764e-05, "loss": 22.0008, "step": 27710 }, { "epoch": 0.3, "learning_rate": 1.6422405761510888e-05, "loss": 21.1029, "step": 27720 }, { "epoch": 0.3, "learning_rate": 1.6419721566729215e-05, "loss": 21.7045, "step": 27730 }, { "epoch": 0.3, "learning_rate": 1.6417036584921686e-05, "loss": 21.365, "step": 27740 }, { "epoch": 0.3, "learning_rate": 1.6414350816417466e-05, "loss": 22.0362, "step": 27750 }, { "epoch": 0.3, "learning_rate": 1.641166426154582e-05, "loss": 22.383, "step": 27760 }, { "epoch": 0.3, "learning_rate": 1.6408976920636105e-05, "loss": 21.1118, "step": 27770 }, { "epoch": 0.3, "learning_rate": 1.6406288794017775e-05, "loss": 21.2587, "step": 27780 }, { "epoch": 0.3, "learning_rate": 1.6403599882020382e-05, "loss": 20.7362, "step": 27790 }, { "epoch": 0.3, "learning_rate": 1.6400910184973576e-05, "loss": 22.4513, "step": 27800 }, { "epoch": 0.3, "learning_rate": 1.6398219703207095e-05, "loss": 21.1415, "step": 27810 }, { "epoch": 0.3, "learning_rate": 1.6395528437050782e-05, "loss": 21.5401, "step": 27820 }, { "epoch": 0.3, "learning_rate": 1.639283638683457e-05, "loss": 21.9897, "step": 27830 }, { "epoch": 0.3, "learning_rate": 1.6390143552888493e-05, "loss": 21.8449, "step": 27840 }, { "epoch": 0.3, "learning_rate": 1.638744993554268e-05, "loss": 21.5647, "step": 27850 }, { "epoch": 0.3, "learning_rate": 1.6384755535127355e-05, "loss": 21.0505, "step": 27860 }, { "epoch": 0.3, "learning_rate": 1.6382060351972833e-05, "loss": 20.8846, "step": 27870 }, { "epoch": 0.3, "learning_rate": 1.637936438640954e-05, "loss": 22.1434, "step": 27880 }, { "epoch": 0.3, "learning_rate": 1.6376667638767974e-05, "loss": 21.9295, "step": 27890 }, { "epoch": 0.3, "learning_rate": 1.6373970109378758e-05, "loss": 21.6484, "step": 27900 }, { "epoch": 0.3, "learning_rate": 1.6371271798572584e-05, "loss": 20.7097, "step": 27910 }, { "epoch": 0.3, "learning_rate": 1.636857270668026e-05, "loss": 21.4798, "step": 27920 }, { "epoch": 0.3, "learning_rate": 1.636587283403267e-05, "loss": 20.6952, "step": 27930 }, { "epoch": 0.3, "learning_rate": 1.6363172180960816e-05, "loss": 21.929, "step": 27940 }, { "epoch": 0.3, "learning_rate": 1.6360470747795782e-05, "loss": 20.9427, "step": 27950 }, { "epoch": 0.3, "learning_rate": 1.6357768534868747e-05, "loss": 21.0289, "step": 27960 }, { "epoch": 0.3, "learning_rate": 1.6355065542510992e-05, "loss": 21.1023, "step": 27970 }, { "epoch": 0.3, "learning_rate": 1.6352361771053885e-05, "loss": 21.5996, "step": 27980 }, { "epoch": 0.3, "learning_rate": 1.6349657220828902e-05, "loss": 21.4832, "step": 27990 }, { "epoch": 0.3, "learning_rate": 1.6346951892167603e-05, "loss": 21.7037, "step": 28000 }, { "epoch": 0.3, "learning_rate": 1.6344245785401653e-05, "loss": 20.6736, "step": 28010 }, { "epoch": 0.3, "learning_rate": 1.63415389008628e-05, "loss": 21.0259, "step": 28020 }, { "epoch": 0.3, "learning_rate": 1.6338831238882897e-05, "loss": 21.2749, "step": 28030 }, { "epoch": 0.3, "learning_rate": 1.633612279979389e-05, "loss": 21.6506, "step": 28040 }, { "epoch": 0.3, "learning_rate": 1.6333413583927825e-05, "loss": 21.315, "step": 28050 }, { "epoch": 0.3, "learning_rate": 1.633070359161683e-05, "loss": 21.9155, "step": 28060 }, { "epoch": 0.3, "learning_rate": 1.6327992823193142e-05, "loss": 21.1024, "step": 28070 }, { "epoch": 0.3, "learning_rate": 1.6325281278989087e-05, "loss": 21.5655, "step": 28080 }, { "epoch": 0.3, "learning_rate": 1.6322568959337086e-05, "loss": 21.4249, "step": 28090 }, { "epoch": 0.3, "learning_rate": 1.6319855864569656e-05, "loss": 21.3481, "step": 28100 }, { "epoch": 0.3, "learning_rate": 1.631714199501941e-05, "loss": 20.748, "step": 28110 }, { "epoch": 0.3, "learning_rate": 1.631442735101905e-05, "loss": 21.766, "step": 28120 }, { "epoch": 0.3, "learning_rate": 1.6311711932901385e-05, "loss": 22.0906, "step": 28130 }, { "epoch": 0.3, "learning_rate": 1.630899574099931e-05, "loss": 21.083, "step": 28140 }, { "epoch": 0.3, "learning_rate": 1.6306278775645813e-05, "loss": 20.2939, "step": 28150 }, { "epoch": 0.3, "learning_rate": 1.630356103717398e-05, "loss": 22.3667, "step": 28160 }, { "epoch": 0.3, "learning_rate": 1.6300842525916997e-05, "loss": 21.5183, "step": 28170 }, { "epoch": 0.3, "learning_rate": 1.6298123242208138e-05, "loss": 21.2128, "step": 28180 }, { "epoch": 0.3, "learning_rate": 1.629540318638077e-05, "loss": 21.7851, "step": 28190 }, { "epoch": 0.3, "learning_rate": 1.6292682358768362e-05, "loss": 21.4883, "step": 28200 }, { "epoch": 0.3, "learning_rate": 1.6289960759704476e-05, "loss": 21.6894, "step": 28210 }, { "epoch": 0.31, "learning_rate": 1.628723838952276e-05, "loss": 21.5273, "step": 28220 }, { "epoch": 0.31, "learning_rate": 1.628451524855697e-05, "loss": 21.821, "step": 28230 }, { "epoch": 0.31, "learning_rate": 1.6281791337140945e-05, "loss": 20.4838, "step": 28240 }, { "epoch": 0.31, "learning_rate": 1.6279066655608626e-05, "loss": 21.2771, "step": 28250 }, { "epoch": 0.31, "learning_rate": 1.627634120429404e-05, "loss": 20.9682, "step": 28260 }, { "epoch": 0.31, "learning_rate": 1.627361498353132e-05, "loss": 22.3233, "step": 28270 }, { "epoch": 0.31, "learning_rate": 1.6270887993654684e-05, "loss": 21.8026, "step": 28280 }, { "epoch": 0.31, "learning_rate": 1.6268160234998448e-05, "loss": 21.7378, "step": 28290 }, { "epoch": 0.31, "learning_rate": 1.6265431707897018e-05, "loss": 21.2936, "step": 28300 }, { "epoch": 0.31, "learning_rate": 1.6262702412684906e-05, "loss": 20.2798, "step": 28310 }, { "epoch": 0.31, "learning_rate": 1.6259972349696702e-05, "loss": 20.5898, "step": 28320 }, { "epoch": 0.31, "learning_rate": 1.62572415192671e-05, "loss": 21.9375, "step": 28330 }, { "epoch": 0.31, "learning_rate": 1.625450992173089e-05, "loss": 21.999, "step": 28340 }, { "epoch": 0.31, "learning_rate": 1.6251777557422953e-05, "loss": 20.4994, "step": 28350 }, { "epoch": 0.31, "learning_rate": 1.6249044426678255e-05, "loss": 21.643, "step": 28360 }, { "epoch": 0.31, "learning_rate": 1.624631052983187e-05, "loss": 21.5335, "step": 28370 }, { "epoch": 0.31, "learning_rate": 1.624357586721896e-05, "loss": 22.443, "step": 28380 }, { "epoch": 0.31, "learning_rate": 1.624084043917478e-05, "loss": 20.8569, "step": 28390 }, { "epoch": 0.31, "learning_rate": 1.623810424603468e-05, "loss": 20.954, "step": 28400 }, { "epoch": 0.31, "learning_rate": 1.6235367288134103e-05, "loss": 21.6665, "step": 28410 }, { "epoch": 0.31, "learning_rate": 1.623262956580859e-05, "loss": 22.2583, "step": 28420 }, { "epoch": 0.31, "learning_rate": 1.6229891079393764e-05, "loss": 21.7426, "step": 28430 }, { "epoch": 0.31, "learning_rate": 1.622715182922536e-05, "loss": 21.1295, "step": 28440 }, { "epoch": 0.31, "learning_rate": 1.622441181563919e-05, "loss": 21.9941, "step": 28450 }, { "epoch": 0.31, "learning_rate": 1.6221671038971164e-05, "loss": 20.8844, "step": 28460 }, { "epoch": 0.31, "learning_rate": 1.6218929499557295e-05, "loss": 20.5562, "step": 28470 }, { "epoch": 0.31, "learning_rate": 1.621618719773368e-05, "loss": 21.0373, "step": 28480 }, { "epoch": 0.31, "learning_rate": 1.6213444133836505e-05, "loss": 21.2941, "step": 28490 }, { "epoch": 0.31, "learning_rate": 1.621070030820206e-05, "loss": 20.9401, "step": 28500 }, { "epoch": 0.31, "learning_rate": 1.620795572116673e-05, "loss": 21.8854, "step": 28510 }, { "epoch": 0.31, "learning_rate": 1.620521037306698e-05, "loss": 21.8394, "step": 28520 }, { "epoch": 0.31, "learning_rate": 1.6202464264239376e-05, "loss": 21.6478, "step": 28530 }, { "epoch": 0.31, "learning_rate": 1.619971739502058e-05, "loss": 21.1368, "step": 28540 }, { "epoch": 0.31, "learning_rate": 1.619696976574735e-05, "loss": 21.69, "step": 28550 }, { "epoch": 0.31, "learning_rate": 1.619422137675652e-05, "loss": 21.2728, "step": 28560 }, { "epoch": 0.31, "learning_rate": 1.6191472228385035e-05, "loss": 21.9686, "step": 28570 }, { "epoch": 0.31, "learning_rate": 1.6188722320969928e-05, "loss": 21.0466, "step": 28580 }, { "epoch": 0.31, "learning_rate": 1.6185971654848325e-05, "loss": 21.1424, "step": 28590 }, { "epoch": 0.31, "learning_rate": 1.618322023035744e-05, "loss": 21.1034, "step": 28600 }, { "epoch": 0.31, "learning_rate": 1.6180468047834584e-05, "loss": 21.6735, "step": 28610 }, { "epoch": 0.31, "learning_rate": 1.6177715107617166e-05, "loss": 21.0015, "step": 28620 }, { "epoch": 0.31, "learning_rate": 1.617496141004267e-05, "loss": 21.624, "step": 28630 }, { "epoch": 0.31, "learning_rate": 1.6172206955448703e-05, "loss": 20.2769, "step": 28640 }, { "epoch": 0.31, "learning_rate": 1.6169451744172936e-05, "loss": 21.979, "step": 28650 }, { "epoch": 0.31, "learning_rate": 1.6166695776553147e-05, "loss": 21.0809, "step": 28660 }, { "epoch": 0.31, "learning_rate": 1.6163939052927206e-05, "loss": 21.2559, "step": 28670 }, { "epoch": 0.31, "learning_rate": 1.6161181573633072e-05, "loss": 21.1987, "step": 28680 }, { "epoch": 0.31, "learning_rate": 1.6158423339008793e-05, "loss": 21.9595, "step": 28690 }, { "epoch": 0.31, "learning_rate": 1.6155664349392522e-05, "loss": 21.2728, "step": 28700 }, { "epoch": 0.31, "learning_rate": 1.6152904605122496e-05, "loss": 21.1449, "step": 28710 }, { "epoch": 0.31, "learning_rate": 1.6150144106537046e-05, "loss": 21.4287, "step": 28720 }, { "epoch": 0.31, "learning_rate": 1.6147382853974594e-05, "loss": 21.1582, "step": 28730 }, { "epoch": 0.31, "learning_rate": 1.6144620847773653e-05, "loss": 22.2177, "step": 28740 }, { "epoch": 0.31, "learning_rate": 1.6141858088272838e-05, "loss": 20.9953, "step": 28750 }, { "epoch": 0.31, "learning_rate": 1.6139094575810842e-05, "loss": 21.1912, "step": 28760 }, { "epoch": 0.31, "learning_rate": 1.6136330310726463e-05, "loss": 21.1558, "step": 28770 }, { "epoch": 0.31, "learning_rate": 1.6133565293358587e-05, "loss": 22.078, "step": 28780 }, { "epoch": 0.31, "learning_rate": 1.6130799524046188e-05, "loss": 21.4096, "step": 28790 }, { "epoch": 0.31, "learning_rate": 1.6128033003128332e-05, "loss": 21.9245, "step": 28800 }, { "epoch": 0.31, "learning_rate": 1.6125265730944192e-05, "loss": 21.8235, "step": 28810 }, { "epoch": 0.31, "learning_rate": 1.612249770783301e-05, "loss": 21.7617, "step": 28820 }, { "epoch": 0.31, "learning_rate": 1.6119728934134142e-05, "loss": 21.1038, "step": 28830 }, { "epoch": 0.31, "learning_rate": 1.6116959410187017e-05, "loss": 21.6357, "step": 28840 }, { "epoch": 0.31, "learning_rate": 1.6114189136331168e-05, "loss": 21.0554, "step": 28850 }, { "epoch": 0.31, "learning_rate": 1.611141811290622e-05, "loss": 21.0963, "step": 28860 }, { "epoch": 0.31, "learning_rate": 1.6108646340251884e-05, "loss": 21.0275, "step": 28870 }, { "epoch": 0.31, "learning_rate": 1.6105873818707963e-05, "loss": 21.5083, "step": 28880 }, { "epoch": 0.31, "learning_rate": 1.6103100548614358e-05, "loss": 21.8649, "step": 28890 }, { "epoch": 0.31, "learning_rate": 1.6100326530311055e-05, "loss": 21.3077, "step": 28900 }, { "epoch": 0.31, "learning_rate": 1.609755176413814e-05, "loss": 22.5204, "step": 28910 }, { "epoch": 0.31, "learning_rate": 1.6094776250435782e-05, "loss": 21.4795, "step": 28920 }, { "epoch": 0.31, "learning_rate": 1.6091999989544243e-05, "loss": 21.8198, "step": 28930 }, { "epoch": 0.31, "learning_rate": 1.6089222981803884e-05, "loss": 21.6818, "step": 28940 }, { "epoch": 0.31, "learning_rate": 1.6086445227555146e-05, "loss": 21.4822, "step": 28950 }, { "epoch": 0.31, "learning_rate": 1.6083666727138575e-05, "loss": 21.4494, "step": 28960 }, { "epoch": 0.31, "learning_rate": 1.6080887480894792e-05, "loss": 22.4222, "step": 28970 }, { "epoch": 0.31, "learning_rate": 1.6078107489164526e-05, "loss": 20.7242, "step": 28980 }, { "epoch": 0.31, "learning_rate": 1.607532675228859e-05, "loss": 21.3236, "step": 28990 }, { "epoch": 0.31, "learning_rate": 1.6072545270607893e-05, "loss": 21.2826, "step": 29000 }, { "epoch": 0.31, "learning_rate": 1.6069763044463414e-05, "loss": 21.8612, "step": 29010 }, { "epoch": 0.31, "learning_rate": 1.6066980074196257e-05, "loss": 21.1751, "step": 29020 }, { "epoch": 0.31, "learning_rate": 1.606419636014759e-05, "loss": 20.9727, "step": 29030 }, { "epoch": 0.31, "learning_rate": 1.6061411902658687e-05, "loss": 21.5074, "step": 29040 }, { "epoch": 0.31, "learning_rate": 1.605862670207091e-05, "loss": 21.8402, "step": 29050 }, { "epoch": 0.31, "learning_rate": 1.605584075872571e-05, "loss": 22.0144, "step": 29060 }, { "epoch": 0.31, "learning_rate": 1.6053054072964626e-05, "loss": 20.7026, "step": 29070 }, { "epoch": 0.31, "learning_rate": 1.6050266645129293e-05, "loss": 21.0387, "step": 29080 }, { "epoch": 0.31, "learning_rate": 1.604747847556144e-05, "loss": 22.1676, "step": 29090 }, { "epoch": 0.31, "learning_rate": 1.6044689564602878e-05, "loss": 21.676, "step": 29100 }, { "epoch": 0.31, "learning_rate": 1.6041899912595517e-05, "loss": 21.45, "step": 29110 }, { "epoch": 0.31, "learning_rate": 1.603910951988135e-05, "loss": 20.9311, "step": 29120 }, { "epoch": 0.31, "learning_rate": 1.603631838680247e-05, "loss": 21.2272, "step": 29130 }, { "epoch": 0.32, "learning_rate": 1.6033526513701053e-05, "loss": 21.1192, "step": 29140 }, { "epoch": 0.32, "learning_rate": 1.603073390091937e-05, "loss": 21.3691, "step": 29150 }, { "epoch": 0.32, "learning_rate": 1.602794054879978e-05, "loss": 22.0361, "step": 29160 }, { "epoch": 0.32, "learning_rate": 1.602514645768474e-05, "loss": 20.7393, "step": 29170 }, { "epoch": 0.32, "learning_rate": 1.6022351627916783e-05, "loss": 21.1884, "step": 29180 }, { "epoch": 0.32, "learning_rate": 1.6019556059838542e-05, "loss": 21.6668, "step": 29190 }, { "epoch": 0.32, "learning_rate": 1.6016759753792746e-05, "loss": 21.8779, "step": 29200 }, { "epoch": 0.32, "learning_rate": 1.6013962710122203e-05, "loss": 20.8328, "step": 29210 }, { "epoch": 0.32, "learning_rate": 1.601116492916982e-05, "loss": 21.4774, "step": 29220 }, { "epoch": 0.32, "learning_rate": 1.600836641127859e-05, "loss": 21.5217, "step": 29230 }, { "epoch": 0.32, "learning_rate": 1.6005567156791593e-05, "loss": 22.5339, "step": 29240 }, { "epoch": 0.32, "learning_rate": 1.6002767166052012e-05, "loss": 22.2747, "step": 29250 }, { "epoch": 0.32, "learning_rate": 1.5999966439403105e-05, "loss": 21.3707, "step": 29260 }, { "epoch": 0.32, "learning_rate": 1.599716497718823e-05, "loss": 21.3443, "step": 29270 }, { "epoch": 0.32, "learning_rate": 1.5994362779750833e-05, "loss": 21.5261, "step": 29280 }, { "epoch": 0.32, "learning_rate": 1.5991559847434447e-05, "loss": 21.7279, "step": 29290 }, { "epoch": 0.32, "learning_rate": 1.5988756180582696e-05, "loss": 21.442, "step": 29300 }, { "epoch": 0.32, "learning_rate": 1.59859517795393e-05, "loss": 21.3451, "step": 29310 }, { "epoch": 0.32, "learning_rate": 1.5983146644648067e-05, "loss": 21.4056, "step": 29320 }, { "epoch": 0.32, "learning_rate": 1.598034077625288e-05, "loss": 21.8411, "step": 29330 }, { "epoch": 0.32, "learning_rate": 1.597753417469774e-05, "loss": 20.9334, "step": 29340 }, { "epoch": 0.32, "learning_rate": 1.5974726840326712e-05, "loss": 20.7815, "step": 29350 }, { "epoch": 0.32, "learning_rate": 1.5971918773483966e-05, "loss": 22.332, "step": 29360 }, { "epoch": 0.32, "learning_rate": 1.5969109974513758e-05, "loss": 21.309, "step": 29370 }, { "epoch": 0.32, "learning_rate": 1.596630044376043e-05, "loss": 21.2583, "step": 29380 }, { "epoch": 0.32, "learning_rate": 1.596349018156841e-05, "loss": 21.3636, "step": 29390 }, { "epoch": 0.32, "learning_rate": 1.5960679188282235e-05, "loss": 22.0163, "step": 29400 }, { "epoch": 0.32, "learning_rate": 1.595786746424651e-05, "loss": 22.0796, "step": 29410 }, { "epoch": 0.32, "learning_rate": 1.595505500980594e-05, "loss": 21.4367, "step": 29420 }, { "epoch": 0.32, "learning_rate": 1.595224182530532e-05, "loss": 20.9653, "step": 29430 }, { "epoch": 0.32, "learning_rate": 1.5949427911089527e-05, "loss": 21.2009, "step": 29440 }, { "epoch": 0.32, "learning_rate": 1.5946613267503545e-05, "loss": 21.0915, "step": 29450 }, { "epoch": 0.32, "learning_rate": 1.594379789489242e-05, "loss": 22.2568, "step": 29460 }, { "epoch": 0.32, "learning_rate": 1.5940981793601313e-05, "loss": 21.9155, "step": 29470 }, { "epoch": 0.32, "learning_rate": 1.5938164963975462e-05, "loss": 21.6619, "step": 29480 }, { "epoch": 0.32, "learning_rate": 1.5935347406360192e-05, "loss": 21.2287, "step": 29490 }, { "epoch": 0.32, "learning_rate": 1.593252912110093e-05, "loss": 21.6198, "step": 29500 }, { "epoch": 0.32, "learning_rate": 1.5929710108543174e-05, "loss": 22.3012, "step": 29510 }, { "epoch": 0.32, "learning_rate": 1.5926890369032527e-05, "loss": 21.212, "step": 29520 }, { "epoch": 0.32, "learning_rate": 1.5924069902914673e-05, "loss": 21.1191, "step": 29530 }, { "epoch": 0.32, "learning_rate": 1.5921248710535388e-05, "loss": 21.6687, "step": 29540 }, { "epoch": 0.32, "learning_rate": 1.591842679224053e-05, "loss": 22.3649, "step": 29550 }, { "epoch": 0.32, "learning_rate": 1.5915604148376064e-05, "loss": 22.1159, "step": 29560 }, { "epoch": 0.32, "learning_rate": 1.5912780779288028e-05, "loss": 21.6469, "step": 29570 }, { "epoch": 0.32, "learning_rate": 1.590995668532254e-05, "loss": 21.6003, "step": 29580 }, { "epoch": 0.32, "learning_rate": 1.590713186682584e-05, "loss": 21.1069, "step": 29590 }, { "epoch": 0.32, "learning_rate": 1.5904306324144224e-05, "loss": 21.5021, "step": 29600 }, { "epoch": 0.32, "learning_rate": 1.5901480057624094e-05, "loss": 21.7106, "step": 29610 }, { "epoch": 0.32, "learning_rate": 1.589865306761193e-05, "loss": 21.6505, "step": 29620 }, { "epoch": 0.32, "learning_rate": 1.5895825354454316e-05, "loss": 20.4315, "step": 29630 }, { "epoch": 0.32, "learning_rate": 1.589299691849791e-05, "loss": 21.5717, "step": 29640 }, { "epoch": 0.32, "learning_rate": 1.5890167760089466e-05, "loss": 21.0319, "step": 29650 }, { "epoch": 0.32, "learning_rate": 1.5887337879575825e-05, "loss": 21.4252, "step": 29660 }, { "epoch": 0.32, "learning_rate": 1.5884507277303912e-05, "loss": 21.3566, "step": 29670 }, { "epoch": 0.32, "learning_rate": 1.5881675953620753e-05, "loss": 21.2216, "step": 29680 }, { "epoch": 0.32, "learning_rate": 1.5878843908873446e-05, "loss": 21.4948, "step": 29690 }, { "epoch": 0.32, "learning_rate": 1.587601114340919e-05, "loss": 20.9647, "step": 29700 }, { "epoch": 0.32, "learning_rate": 1.587317765757526e-05, "loss": 20.8822, "step": 29710 }, { "epoch": 0.32, "learning_rate": 1.5870343451719043e-05, "loss": 21.754, "step": 29720 }, { "epoch": 0.32, "learning_rate": 1.5867508526187985e-05, "loss": 21.4599, "step": 29730 }, { "epoch": 0.32, "learning_rate": 1.5864672881329637e-05, "loss": 21.1978, "step": 29740 }, { "epoch": 0.32, "learning_rate": 1.586183651749164e-05, "loss": 21.4339, "step": 29750 }, { "epoch": 0.32, "learning_rate": 1.585899943502171e-05, "loss": 21.0204, "step": 29760 }, { "epoch": 0.32, "learning_rate": 1.585616163426767e-05, "loss": 21.0124, "step": 29770 }, { "epoch": 0.32, "learning_rate": 1.5853323115577408e-05, "loss": 21.7692, "step": 29780 }, { "epoch": 0.32, "learning_rate": 1.5850483879298916e-05, "loss": 21.5508, "step": 29790 }, { "epoch": 0.32, "learning_rate": 1.5847643925780274e-05, "loss": 22.3579, "step": 29800 }, { "epoch": 0.32, "learning_rate": 1.5844803255369642e-05, "loss": 21.9529, "step": 29810 }, { "epoch": 0.32, "learning_rate": 1.584196186841528e-05, "loss": 21.1094, "step": 29820 }, { "epoch": 0.32, "learning_rate": 1.5839119765265517e-05, "loss": 21.7314, "step": 29830 }, { "epoch": 0.32, "learning_rate": 1.5836276946268787e-05, "loss": 20.5095, "step": 29840 }, { "epoch": 0.32, "learning_rate": 1.5833433411773605e-05, "loss": 20.9323, "step": 29850 }, { "epoch": 0.32, "learning_rate": 1.5830589162128574e-05, "loss": 21.6713, "step": 29860 }, { "epoch": 0.32, "learning_rate": 1.5827744197682384e-05, "loss": 21.5524, "step": 29870 }, { "epoch": 0.32, "learning_rate": 1.582489851878381e-05, "loss": 21.9779, "step": 29880 }, { "epoch": 0.32, "learning_rate": 1.5822052125781724e-05, "loss": 22.0754, "step": 29890 }, { "epoch": 0.32, "learning_rate": 1.5819205019025078e-05, "loss": 21.1651, "step": 29900 }, { "epoch": 0.32, "learning_rate": 1.581635719886291e-05, "loss": 21.0596, "step": 29910 }, { "epoch": 0.32, "learning_rate": 1.5813508665644354e-05, "loss": 22.4895, "step": 29920 }, { "epoch": 0.32, "learning_rate": 1.581065941971862e-05, "loss": 20.7934, "step": 29930 }, { "epoch": 0.32, "learning_rate": 1.5807809461435014e-05, "loss": 21.5903, "step": 29940 }, { "epoch": 0.32, "learning_rate": 1.580495879114293e-05, "loss": 21.2387, "step": 29950 }, { "epoch": 0.32, "learning_rate": 1.580210740919184e-05, "loss": 20.4376, "step": 29960 }, { "epoch": 0.32, "learning_rate": 1.5799255315931312e-05, "loss": 21.8517, "step": 29970 }, { "epoch": 0.32, "learning_rate": 1.5796402511710996e-05, "loss": 21.2387, "step": 29980 }, { "epoch": 0.32, "learning_rate": 1.579354899688064e-05, "loss": 21.7067, "step": 29990 }, { "epoch": 0.32, "learning_rate": 1.579069477179006e-05, "loss": 21.6076, "step": 30000 }, { "epoch": 0.32, "learning_rate": 1.5787839836789176e-05, "loss": 21.8509, "step": 30010 }, { "epoch": 0.32, "learning_rate": 1.5784984192227986e-05, "loss": 21.5172, "step": 30020 }, { "epoch": 0.32, "learning_rate": 1.578212783845658e-05, "loss": 21.4869, "step": 30030 }, { "epoch": 0.32, "learning_rate": 1.577927077582513e-05, "loss": 21.2808, "step": 30040 }, { "epoch": 0.32, "learning_rate": 1.5776413004683905e-05, "loss": 20.7049, "step": 30050 }, { "epoch": 0.32, "learning_rate": 1.5773554525383243e-05, "loss": 21.7379, "step": 30060 }, { "epoch": 0.33, "learning_rate": 1.5770695338273586e-05, "loss": 21.8427, "step": 30070 }, { "epoch": 0.33, "learning_rate": 1.5767835443705454e-05, "loss": 22.1128, "step": 30080 }, { "epoch": 0.33, "learning_rate": 1.5764974842029454e-05, "loss": 21.5828, "step": 30090 }, { "epoch": 0.33, "learning_rate": 1.5762113533596288e-05, "loss": 20.8566, "step": 30100 }, { "epoch": 0.33, "learning_rate": 1.575925151875673e-05, "loss": 21.3878, "step": 30110 }, { "epoch": 0.33, "learning_rate": 1.5756388797861652e-05, "loss": 21.9113, "step": 30120 }, { "epoch": 0.33, "learning_rate": 1.575352537126201e-05, "loss": 21.8298, "step": 30130 }, { "epoch": 0.33, "learning_rate": 1.5750661239308846e-05, "loss": 21.2178, "step": 30140 }, { "epoch": 0.33, "learning_rate": 1.574779640235329e-05, "loss": 21.3658, "step": 30150 }, { "epoch": 0.33, "learning_rate": 1.574493086074655e-05, "loss": 21.6441, "step": 30160 }, { "epoch": 0.33, "learning_rate": 1.5742064614839937e-05, "loss": 21.3988, "step": 30170 }, { "epoch": 0.33, "learning_rate": 1.573919766498483e-05, "loss": 21.397, "step": 30180 }, { "epoch": 0.33, "learning_rate": 1.5736330011532705e-05, "loss": 20.9005, "step": 30190 }, { "epoch": 0.33, "learning_rate": 1.5733461654835128e-05, "loss": 21.6615, "step": 30200 }, { "epoch": 0.33, "learning_rate": 1.5730592595243736e-05, "loss": 21.7746, "step": 30210 }, { "epoch": 0.33, "learning_rate": 1.5727722833110265e-05, "loss": 21.5252, "step": 30220 }, { "epoch": 0.33, "learning_rate": 1.572485236878654e-05, "loss": 21.1663, "step": 30230 }, { "epoch": 0.33, "learning_rate": 1.572198120262445e-05, "loss": 21.1358, "step": 30240 }, { "epoch": 0.33, "learning_rate": 1.5719109334976002e-05, "loss": 21.8955, "step": 30250 }, { "epoch": 0.33, "learning_rate": 1.5716236766193267e-05, "loss": 21.4088, "step": 30260 }, { "epoch": 0.33, "learning_rate": 1.5713363496628403e-05, "loss": 21.1088, "step": 30270 }, { "epoch": 0.33, "learning_rate": 1.5710489526633663e-05, "loss": 21.1624, "step": 30280 }, { "epoch": 0.33, "learning_rate": 1.570761485656138e-05, "loss": 21.9974, "step": 30290 }, { "epoch": 0.33, "learning_rate": 1.570473948676398e-05, "loss": 22.0061, "step": 30300 }, { "epoch": 0.33, "learning_rate": 1.570186341759396e-05, "loss": 20.7595, "step": 30310 }, { "epoch": 0.33, "learning_rate": 1.569898664940391e-05, "loss": 21.9825, "step": 30320 }, { "epoch": 0.33, "learning_rate": 1.569610918254652e-05, "loss": 21.6508, "step": 30330 }, { "epoch": 0.33, "learning_rate": 1.5693231017374545e-05, "loss": 21.7464, "step": 30340 }, { "epoch": 0.33, "learning_rate": 1.5690352154240834e-05, "loss": 20.9642, "step": 30350 }, { "epoch": 0.33, "learning_rate": 1.5687472593498322e-05, "loss": 21.6337, "step": 30360 }, { "epoch": 0.33, "learning_rate": 1.5684592335500027e-05, "loss": 21.3202, "step": 30370 }, { "epoch": 0.33, "learning_rate": 1.568171138059906e-05, "loss": 21.528, "step": 30380 }, { "epoch": 0.33, "learning_rate": 1.5678829729148606e-05, "loss": 21.2095, "step": 30390 }, { "epoch": 0.33, "learning_rate": 1.567594738150194e-05, "loss": 21.703, "step": 30400 }, { "epoch": 0.33, "learning_rate": 1.567306433801243e-05, "loss": 21.3029, "step": 30410 }, { "epoch": 0.33, "learning_rate": 1.5670180599033518e-05, "loss": 22.5646, "step": 30420 }, { "epoch": 0.33, "learning_rate": 1.566729616491874e-05, "loss": 21.1597, "step": 30430 }, { "epoch": 0.33, "learning_rate": 1.56644110360217e-05, "loss": 20.6929, "step": 30440 }, { "epoch": 0.33, "learning_rate": 1.566152521269612e-05, "loss": 21.4081, "step": 30450 }, { "epoch": 0.33, "learning_rate": 1.5658638695295777e-05, "loss": 21.2308, "step": 30460 }, { "epoch": 0.33, "learning_rate": 1.5655751484174545e-05, "loss": 20.8839, "step": 30470 }, { "epoch": 0.33, "learning_rate": 1.565286357968638e-05, "loss": 20.8899, "step": 30480 }, { "epoch": 0.33, "learning_rate": 1.5649974982185324e-05, "loss": 21.7449, "step": 30490 }, { "epoch": 0.33, "learning_rate": 1.564708569202551e-05, "loss": 21.4733, "step": 30500 }, { "epoch": 0.33, "learning_rate": 1.5644195709561148e-05, "loss": 21.4741, "step": 30510 }, { "epoch": 0.33, "learning_rate": 1.5641305035146537e-05, "loss": 21.5757, "step": 30520 }, { "epoch": 0.33, "learning_rate": 1.5638413669136053e-05, "loss": 21.3113, "step": 30530 }, { "epoch": 0.33, "learning_rate": 1.563552161188417e-05, "loss": 21.4777, "step": 30540 }, { "epoch": 0.33, "learning_rate": 1.5632628863745436e-05, "loss": 21.0778, "step": 30550 }, { "epoch": 0.33, "learning_rate": 1.562973542507449e-05, "loss": 20.912, "step": 30560 }, { "epoch": 0.33, "learning_rate": 1.5626841296226046e-05, "loss": 20.9893, "step": 30570 }, { "epoch": 0.33, "learning_rate": 1.5623946477554923e-05, "loss": 21.8335, "step": 30580 }, { "epoch": 0.33, "learning_rate": 1.5621050969416e-05, "loss": 21.7372, "step": 30590 }, { "epoch": 0.33, "learning_rate": 1.5618154772164257e-05, "loss": 21.658, "step": 30600 }, { "epoch": 0.33, "learning_rate": 1.561525788615475e-05, "loss": 21.9068, "step": 30610 }, { "epoch": 0.33, "learning_rate": 1.5612360311742626e-05, "loss": 21.9026, "step": 30620 }, { "epoch": 0.33, "learning_rate": 1.5609462049283114e-05, "loss": 21.197, "step": 30630 }, { "epoch": 0.33, "learning_rate": 1.5606563099131525e-05, "loss": 20.3435, "step": 30640 }, { "epoch": 0.33, "learning_rate": 1.560366346164325e-05, "loss": 21.2285, "step": 30650 }, { "epoch": 0.33, "learning_rate": 1.560076313717378e-05, "loss": 21.0208, "step": 30660 }, { "epoch": 0.33, "learning_rate": 1.5597862126078674e-05, "loss": 21.7297, "step": 30670 }, { "epoch": 0.33, "learning_rate": 1.5594960428713583e-05, "loss": 21.8695, "step": 30680 }, { "epoch": 0.33, "learning_rate": 1.5592058045434245e-05, "loss": 22.1348, "step": 30690 }, { "epoch": 0.33, "learning_rate": 1.558915497659647e-05, "loss": 21.2889, "step": 30700 }, { "epoch": 0.33, "learning_rate": 1.558625122255616e-05, "loss": 21.2185, "step": 30710 }, { "epoch": 0.33, "learning_rate": 1.5583346783669312e-05, "loss": 20.4222, "step": 30720 }, { "epoch": 0.33, "learning_rate": 1.558044166029198e-05, "loss": 21.0578, "step": 30730 }, { "epoch": 0.33, "learning_rate": 1.5577535852780334e-05, "loss": 21.0245, "step": 30740 }, { "epoch": 0.33, "learning_rate": 1.5574629361490593e-05, "loss": 21.391, "step": 30750 }, { "epoch": 0.33, "learning_rate": 1.5571722186779095e-05, "loss": 21.2763, "step": 30760 }, { "epoch": 0.33, "learning_rate": 1.5568814329002238e-05, "loss": 20.7812, "step": 30770 }, { "epoch": 0.33, "learning_rate": 1.556590578851651e-05, "loss": 21.9478, "step": 30780 }, { "epoch": 0.33, "learning_rate": 1.5562996565678484e-05, "loss": 20.9183, "step": 30790 }, { "epoch": 0.33, "learning_rate": 1.556008666084482e-05, "loss": 21.9718, "step": 30800 }, { "epoch": 0.33, "learning_rate": 1.5557176074372252e-05, "loss": 21.9404, "step": 30810 }, { "epoch": 0.33, "learning_rate": 1.555426480661761e-05, "loss": 21.9347, "step": 30820 }, { "epoch": 0.33, "learning_rate": 1.5551352857937795e-05, "loss": 21.0377, "step": 30830 }, { "epoch": 0.33, "learning_rate": 1.55484402286898e-05, "loss": 20.757, "step": 30840 }, { "epoch": 0.33, "learning_rate": 1.55455269192307e-05, "loss": 20.8507, "step": 30850 }, { "epoch": 0.33, "learning_rate": 1.5542612929917647e-05, "loss": 21.3238, "step": 30860 }, { "epoch": 0.33, "learning_rate": 1.5539698261107885e-05, "loss": 21.6945, "step": 30870 }, { "epoch": 0.33, "learning_rate": 1.5536782913158744e-05, "loss": 21.4312, "step": 30880 }, { "epoch": 0.33, "learning_rate": 1.5533866886427617e-05, "loss": 21.3794, "step": 30890 }, { "epoch": 0.33, "learning_rate": 1.5530950181272007e-05, "loss": 21.4835, "step": 30900 }, { "epoch": 0.33, "learning_rate": 1.5528032798049485e-05, "loss": 22.111, "step": 30910 }, { "epoch": 0.33, "learning_rate": 1.5525114737117703e-05, "loss": 21.3164, "step": 30920 }, { "epoch": 0.33, "learning_rate": 1.5522195998834406e-05, "loss": 21.3954, "step": 30930 }, { "epoch": 0.33, "learning_rate": 1.5519276583557413e-05, "loss": 21.5046, "step": 30940 }, { "epoch": 0.33, "learning_rate": 1.551635649164463e-05, "loss": 21.4675, "step": 30950 }, { "epoch": 0.33, "learning_rate": 1.5513435723454047e-05, "loss": 21.606, "step": 30960 }, { "epoch": 0.33, "learning_rate": 1.5510514279343736e-05, "loss": 21.3626, "step": 30970 }, { "epoch": 0.33, "learning_rate": 1.550759215967185e-05, "loss": 21.049, "step": 30980 }, { "epoch": 0.34, "learning_rate": 1.5504669364796625e-05, "loss": 21.8954, "step": 30990 }, { "epoch": 0.34, "learning_rate": 1.5501745895076386e-05, "loss": 21.5282, "step": 31000 }, { "epoch": 0.34, "learning_rate": 1.5498821750869533e-05, "loss": 20.8371, "step": 31010 }, { "epoch": 0.34, "learning_rate": 1.5495896932534548e-05, "loss": 21.4487, "step": 31020 }, { "epoch": 0.34, "learning_rate": 1.5492971440430007e-05, "loss": 21.5427, "step": 31030 }, { "epoch": 0.34, "learning_rate": 1.5490045274914557e-05, "loss": 21.2094, "step": 31040 }, { "epoch": 0.34, "learning_rate": 1.5487118436346928e-05, "loss": 21.6507, "step": 31050 }, { "epoch": 0.34, "learning_rate": 1.5484190925085935e-05, "loss": 20.4593, "step": 31060 }, { "epoch": 0.34, "learning_rate": 1.5481262741490487e-05, "loss": 21.9865, "step": 31070 }, { "epoch": 0.34, "learning_rate": 1.5478333885919553e-05, "loss": 21.4145, "step": 31080 }, { "epoch": 0.34, "learning_rate": 1.54754043587322e-05, "loss": 20.9127, "step": 31090 }, { "epoch": 0.34, "learning_rate": 1.5472474160287575e-05, "loss": 21.6524, "step": 31100 }, { "epoch": 0.34, "learning_rate": 1.5469543290944903e-05, "loss": 20.6656, "step": 31110 }, { "epoch": 0.34, "learning_rate": 1.5466611751063503e-05, "loss": 21.6238, "step": 31120 }, { "epoch": 0.34, "learning_rate": 1.5463679541002754e-05, "loss": 21.8668, "step": 31130 }, { "epoch": 0.34, "learning_rate": 1.5460746661122136e-05, "loss": 21.1966, "step": 31140 }, { "epoch": 0.34, "learning_rate": 1.5457813111781205e-05, "loss": 21.3178, "step": 31150 }, { "epoch": 0.34, "learning_rate": 1.54548788933396e-05, "loss": 20.6896, "step": 31160 }, { "epoch": 0.34, "learning_rate": 1.5451944006157046e-05, "loss": 21.7939, "step": 31170 }, { "epoch": 0.34, "learning_rate": 1.5449008450593338e-05, "loss": 21.4454, "step": 31180 }, { "epoch": 0.34, "learning_rate": 1.544607222700836e-05, "loss": 21.295, "step": 31190 }, { "epoch": 0.34, "learning_rate": 1.544313533576209e-05, "loss": 20.9288, "step": 31200 }, { "epoch": 0.34, "learning_rate": 1.5440197777214563e-05, "loss": 20.9178, "step": 31210 }, { "epoch": 0.34, "learning_rate": 1.5437259551725915e-05, "loss": 20.9856, "step": 31220 }, { "epoch": 0.34, "learning_rate": 1.5434320659656358e-05, "loss": 21.6692, "step": 31230 }, { "epoch": 0.34, "learning_rate": 1.5431381101366185e-05, "loss": 21.0103, "step": 31240 }, { "epoch": 0.34, "learning_rate": 1.542844087721577e-05, "loss": 22.0543, "step": 31250 }, { "epoch": 0.34, "learning_rate": 1.542549998756557e-05, "loss": 21.3209, "step": 31260 }, { "epoch": 0.34, "learning_rate": 1.5422558432776125e-05, "loss": 20.9889, "step": 31270 }, { "epoch": 0.34, "learning_rate": 1.5419616213208057e-05, "loss": 21.6919, "step": 31280 }, { "epoch": 0.34, "learning_rate": 1.541667332922206e-05, "loss": 21.3985, "step": 31290 }, { "epoch": 0.34, "learning_rate": 1.541372978117892e-05, "loss": 21.8912, "step": 31300 }, { "epoch": 0.34, "learning_rate": 1.5410785569439505e-05, "loss": 21.7553, "step": 31310 }, { "epoch": 0.34, "learning_rate": 1.540784069436476e-05, "loss": 21.6459, "step": 31320 }, { "epoch": 0.34, "learning_rate": 1.5404895156315707e-05, "loss": 21.1566, "step": 31330 }, { "epoch": 0.34, "learning_rate": 1.540194895565346e-05, "loss": 21.3851, "step": 31340 }, { "epoch": 0.34, "learning_rate": 1.5399002092739206e-05, "loss": 21.6226, "step": 31350 }, { "epoch": 0.34, "learning_rate": 1.5396054567934216e-05, "loss": 20.9989, "step": 31360 }, { "epoch": 0.34, "learning_rate": 1.5393106381599842e-05, "loss": 21.0559, "step": 31370 }, { "epoch": 0.34, "learning_rate": 1.5390157534097515e-05, "loss": 20.7063, "step": 31380 }, { "epoch": 0.34, "learning_rate": 1.538720802578875e-05, "loss": 21.5835, "step": 31390 }, { "epoch": 0.34, "learning_rate": 1.5384257857035146e-05, "loss": 20.5817, "step": 31400 }, { "epoch": 0.34, "learning_rate": 1.5381307028198368e-05, "loss": 21.1177, "step": 31410 }, { "epoch": 0.34, "learning_rate": 1.537835553964019e-05, "loss": 21.73, "step": 31420 }, { "epoch": 0.34, "learning_rate": 1.5375403391722438e-05, "loss": 21.3004, "step": 31430 }, { "epoch": 0.34, "learning_rate": 1.537245058480703e-05, "loss": 21.2269, "step": 31440 }, { "epoch": 0.34, "learning_rate": 1.536949711925597e-05, "loss": 20.87, "step": 31450 }, { "epoch": 0.34, "learning_rate": 1.536654299543133e-05, "loss": 21.44, "step": 31460 }, { "epoch": 0.34, "learning_rate": 1.5363588213695286e-05, "loss": 20.7006, "step": 31470 }, { "epoch": 0.34, "learning_rate": 1.5360632774410068e-05, "loss": 21.3418, "step": 31480 }, { "epoch": 0.34, "learning_rate": 1.5357676677938e-05, "loss": 21.5614, "step": 31490 }, { "epoch": 0.34, "learning_rate": 1.5354719924641486e-05, "loss": 20.7353, "step": 31500 }, { "epoch": 0.34, "learning_rate": 1.5351762514883008e-05, "loss": 20.6867, "step": 31510 }, { "epoch": 0.34, "learning_rate": 1.5348804449025134e-05, "loss": 21.7377, "step": 31520 }, { "epoch": 0.34, "learning_rate": 1.53458457274305e-05, "loss": 20.72, "step": 31530 }, { "epoch": 0.34, "learning_rate": 1.5342886350461837e-05, "loss": 21.9838, "step": 31540 }, { "epoch": 0.34, "learning_rate": 1.5339926318481952e-05, "loss": 21.674, "step": 31550 }, { "epoch": 0.34, "learning_rate": 1.533696563185372e-05, "loss": 21.9265, "step": 31560 }, { "epoch": 0.34, "learning_rate": 1.5334004290940117e-05, "loss": 21.5964, "step": 31570 }, { "epoch": 0.34, "learning_rate": 1.5331042296104183e-05, "loss": 21.4754, "step": 31580 }, { "epoch": 0.34, "learning_rate": 1.532807964770904e-05, "loss": 21.9382, "step": 31590 }, { "epoch": 0.34, "learning_rate": 1.5325116346117907e-05, "loss": 22.3557, "step": 31600 }, { "epoch": 0.34, "learning_rate": 1.5322152391694058e-05, "loss": 20.7925, "step": 31610 }, { "epoch": 0.34, "learning_rate": 1.5319187784800866e-05, "loss": 20.7016, "step": 31620 }, { "epoch": 0.34, "learning_rate": 1.531622252580177e-05, "loss": 21.6221, "step": 31630 }, { "epoch": 0.34, "learning_rate": 1.53132566150603e-05, "loss": 22.145, "step": 31640 }, { "epoch": 0.34, "learning_rate": 1.5310290052940065e-05, "loss": 21.0328, "step": 31650 }, { "epoch": 0.34, "learning_rate": 1.5307322839804743e-05, "loss": 21.2037, "step": 31660 }, { "epoch": 0.34, "learning_rate": 1.5304354976018108e-05, "loss": 22.2117, "step": 31670 }, { "epoch": 0.34, "learning_rate": 1.5301386461944e-05, "loss": 21.9857, "step": 31680 }, { "epoch": 0.34, "learning_rate": 1.529841729794635e-05, "loss": 21.3027, "step": 31690 }, { "epoch": 0.34, "learning_rate": 1.529544748438915e-05, "loss": 21.2872, "step": 31700 }, { "epoch": 0.34, "learning_rate": 1.5292477021636498e-05, "loss": 21.7709, "step": 31710 }, { "epoch": 0.34, "learning_rate": 1.528950591005255e-05, "loss": 20.951, "step": 31720 }, { "epoch": 0.34, "learning_rate": 1.5286534150001552e-05, "loss": 21.7401, "step": 31730 }, { "epoch": 0.34, "learning_rate": 1.5283561741847827e-05, "loss": 21.7343, "step": 31740 }, { "epoch": 0.34, "learning_rate": 1.528058868595578e-05, "loss": 21.5696, "step": 31750 }, { "epoch": 0.34, "learning_rate": 1.5277614982689884e-05, "loss": 21.5308, "step": 31760 }, { "epoch": 0.34, "learning_rate": 1.527464063241471e-05, "loss": 21.4456, "step": 31770 }, { "epoch": 0.34, "learning_rate": 1.5271665635494897e-05, "loss": 21.3593, "step": 31780 }, { "epoch": 0.34, "learning_rate": 1.526868999229516e-05, "loss": 21.4474, "step": 31790 }, { "epoch": 0.34, "learning_rate": 1.52657137031803e-05, "loss": 21.7654, "step": 31800 }, { "epoch": 0.34, "learning_rate": 1.5262736768515196e-05, "loss": 20.7034, "step": 31810 }, { "epoch": 0.34, "learning_rate": 1.5259759188664805e-05, "loss": 21.7083, "step": 31820 }, { "epoch": 0.34, "learning_rate": 1.5256780963994167e-05, "loss": 21.1428, "step": 31830 }, { "epoch": 0.34, "learning_rate": 1.5253802094868388e-05, "loss": 21.6167, "step": 31840 }, { "epoch": 0.34, "learning_rate": 1.5250822581652673e-05, "loss": 22.0441, "step": 31850 }, { "epoch": 0.34, "learning_rate": 1.524784242471229e-05, "loss": 21.4737, "step": 31860 }, { "epoch": 0.34, "learning_rate": 1.5244861624412592e-05, "loss": 22.0275, "step": 31870 }, { "epoch": 0.34, "learning_rate": 1.5241880181119011e-05, "loss": 21.5001, "step": 31880 }, { "epoch": 0.34, "learning_rate": 1.5238898095197057e-05, "loss": 21.4726, "step": 31890 }, { "epoch": 0.34, "learning_rate": 1.5235915367012317e-05, "loss": 21.8483, "step": 31900 }, { "epoch": 0.34, "learning_rate": 1.5232931996930463e-05, "loss": 21.09, "step": 31910 }, { "epoch": 0.35, "learning_rate": 1.5229947985317235e-05, "loss": 21.367, "step": 31920 }, { "epoch": 0.35, "learning_rate": 1.5226963332538464e-05, "loss": 21.2002, "step": 31930 }, { "epoch": 0.35, "learning_rate": 1.5223978038960053e-05, "loss": 21.4288, "step": 31940 }, { "epoch": 0.35, "learning_rate": 1.5220992104947975e-05, "loss": 20.9051, "step": 31950 }, { "epoch": 0.35, "learning_rate": 1.5218005530868306e-05, "loss": 21.1446, "step": 31960 }, { "epoch": 0.35, "learning_rate": 1.5215018317087168e-05, "loss": 21.1247, "step": 31970 }, { "epoch": 0.35, "learning_rate": 1.5212030463970796e-05, "loss": 21.3292, "step": 31980 }, { "epoch": 0.35, "learning_rate": 1.5209041971885475e-05, "loss": 21.6417, "step": 31990 }, { "epoch": 0.35, "learning_rate": 1.5206052841197578e-05, "loss": 21.681, "step": 32000 }, { "epoch": 0.35, "learning_rate": 1.5203063072273563e-05, "loss": 21.6737, "step": 32010 }, { "epoch": 0.35, "learning_rate": 1.5200072665479958e-05, "loss": 21.8954, "step": 32020 }, { "epoch": 0.35, "learning_rate": 1.5197081621183374e-05, "loss": 22.0224, "step": 32030 }, { "epoch": 0.35, "learning_rate": 1.5194089939750497e-05, "loss": 21.5556, "step": 32040 }, { "epoch": 0.35, "learning_rate": 1.519109762154809e-05, "loss": 21.6781, "step": 32050 }, { "epoch": 0.35, "learning_rate": 1.5188104666943e-05, "loss": 20.7375, "step": 32060 }, { "epoch": 0.35, "learning_rate": 1.5185111076302146e-05, "loss": 20.4573, "step": 32070 }, { "epoch": 0.35, "learning_rate": 1.5182116849992528e-05, "loss": 20.8532, "step": 32080 }, { "epoch": 0.35, "learning_rate": 1.5179121988381224e-05, "loss": 21.4042, "step": 32090 }, { "epoch": 0.35, "learning_rate": 1.5176126491835388e-05, "loss": 21.2719, "step": 32100 }, { "epoch": 0.35, "learning_rate": 1.517313036072225e-05, "loss": 21.652, "step": 32110 }, { "epoch": 0.35, "learning_rate": 1.517013359540913e-05, "loss": 21.1211, "step": 32120 }, { "epoch": 0.35, "learning_rate": 1.5167136196263405e-05, "loss": 21.6817, "step": 32130 }, { "epoch": 0.35, "learning_rate": 1.516413816365255e-05, "loss": 21.2994, "step": 32140 }, { "epoch": 0.35, "learning_rate": 1.5161139497944105e-05, "loss": 21.0308, "step": 32150 }, { "epoch": 0.35, "learning_rate": 1.5158140199505691e-05, "loss": 20.5991, "step": 32160 }, { "epoch": 0.35, "learning_rate": 1.5155140268705007e-05, "loss": 21.0714, "step": 32170 }, { "epoch": 0.35, "learning_rate": 1.515213970590983e-05, "loss": 21.6197, "step": 32180 }, { "epoch": 0.35, "learning_rate": 1.5149138511488017e-05, "loss": 21.5894, "step": 32190 }, { "epoch": 0.35, "learning_rate": 1.5146136685807497e-05, "loss": 21.2283, "step": 32200 }, { "epoch": 0.35, "learning_rate": 1.5143134229236278e-05, "loss": 21.1571, "step": 32210 }, { "epoch": 0.35, "learning_rate": 1.5140131142142446e-05, "loss": 21.0615, "step": 32220 }, { "epoch": 0.35, "learning_rate": 1.5137127424894168e-05, "loss": 20.761, "step": 32230 }, { "epoch": 0.35, "learning_rate": 1.513412307785968e-05, "loss": 20.8702, "step": 32240 }, { "epoch": 0.35, "learning_rate": 1.5131118101407302e-05, "loss": 20.5344, "step": 32250 }, { "epoch": 0.35, "learning_rate": 1.5128112495905432e-05, "loss": 21.5449, "step": 32260 }, { "epoch": 0.35, "learning_rate": 1.5125106261722537e-05, "loss": 21.3211, "step": 32270 }, { "epoch": 0.35, "learning_rate": 1.512209939922717e-05, "loss": 21.7958, "step": 32280 }, { "epoch": 0.35, "learning_rate": 1.5119091908787957e-05, "loss": 21.3847, "step": 32290 }, { "epoch": 0.35, "learning_rate": 1.5116083790773601e-05, "loss": 21.5541, "step": 32300 }, { "epoch": 0.35, "learning_rate": 1.5113075045552882e-05, "loss": 21.3525, "step": 32310 }, { "epoch": 0.35, "learning_rate": 1.5110065673494655e-05, "loss": 21.5421, "step": 32320 }, { "epoch": 0.35, "learning_rate": 1.5107055674967858e-05, "loss": 21.6282, "step": 32330 }, { "epoch": 0.35, "learning_rate": 1.51040450503415e-05, "loss": 21.3401, "step": 32340 }, { "epoch": 0.35, "learning_rate": 1.5101033799984668e-05, "loss": 21.0626, "step": 32350 }, { "epoch": 0.35, "learning_rate": 1.5098021924266525e-05, "loss": 21.5959, "step": 32360 }, { "epoch": 0.35, "learning_rate": 1.5095009423556318e-05, "loss": 21.5975, "step": 32370 }, { "epoch": 0.35, "learning_rate": 1.5091996298223355e-05, "loss": 21.3762, "step": 32380 }, { "epoch": 0.35, "learning_rate": 1.5088982548637041e-05, "loss": 21.5366, "step": 32390 }, { "epoch": 0.35, "learning_rate": 1.5085968175166837e-05, "loss": 21.5233, "step": 32400 }, { "epoch": 0.35, "learning_rate": 1.5082953178182296e-05, "loss": 21.3339, "step": 32410 }, { "epoch": 0.35, "learning_rate": 1.5079937558053042e-05, "loss": 21.1918, "step": 32420 }, { "epoch": 0.35, "learning_rate": 1.5076921315148768e-05, "loss": 21.4505, "step": 32430 }, { "epoch": 0.35, "learning_rate": 1.5073904449839258e-05, "loss": 21.1646, "step": 32440 }, { "epoch": 0.35, "learning_rate": 1.507088696249436e-05, "loss": 21.823, "step": 32450 }, { "epoch": 0.35, "learning_rate": 1.5067868853484004e-05, "loss": 21.9622, "step": 32460 }, { "epoch": 0.35, "learning_rate": 1.5064850123178203e-05, "loss": 21.6514, "step": 32470 }, { "epoch": 0.35, "learning_rate": 1.5061830771947023e-05, "loss": 21.4154, "step": 32480 }, { "epoch": 0.35, "learning_rate": 1.5058810800160632e-05, "loss": 21.5179, "step": 32490 }, { "epoch": 0.35, "learning_rate": 1.5055790208189262e-05, "loss": 21.5951, "step": 32500 }, { "epoch": 0.35, "learning_rate": 1.5052768996403221e-05, "loss": 21.4449, "step": 32510 }, { "epoch": 0.35, "learning_rate": 1.5049747165172898e-05, "loss": 20.8752, "step": 32520 }, { "epoch": 0.35, "learning_rate": 1.5046724714868745e-05, "loss": 21.8628, "step": 32530 }, { "epoch": 0.35, "learning_rate": 1.504370164586131e-05, "loss": 20.4868, "step": 32540 }, { "epoch": 0.35, "learning_rate": 1.5040677958521204e-05, "loss": 21.8831, "step": 32550 }, { "epoch": 0.35, "learning_rate": 1.5037653653219112e-05, "loss": 20.7495, "step": 32560 }, { "epoch": 0.35, "learning_rate": 1.50346287303258e-05, "loss": 21.6119, "step": 32570 }, { "epoch": 0.35, "learning_rate": 1.5031603190212107e-05, "loss": 22.0439, "step": 32580 }, { "epoch": 0.35, "learning_rate": 1.5028577033248954e-05, "loss": 21.2679, "step": 32590 }, { "epoch": 0.35, "learning_rate": 1.5025550259807333e-05, "loss": 21.9444, "step": 32600 }, { "epoch": 0.35, "learning_rate": 1.5022522870258302e-05, "loss": 21.251, "step": 32610 }, { "epoch": 0.35, "learning_rate": 1.5019494864973015e-05, "loss": 22.0518, "step": 32620 }, { "epoch": 0.35, "learning_rate": 1.5016466244322682e-05, "loss": 21.3359, "step": 32630 }, { "epoch": 0.35, "learning_rate": 1.5013437008678607e-05, "loss": 21.3925, "step": 32640 }, { "epoch": 0.35, "learning_rate": 1.5010407158412146e-05, "loss": 21.5336, "step": 32650 }, { "epoch": 0.35, "learning_rate": 1.5007376693894753e-05, "loss": 20.9505, "step": 32660 }, { "epoch": 0.35, "learning_rate": 1.5004345615497946e-05, "loss": 21.2036, "step": 32670 }, { "epoch": 0.35, "learning_rate": 1.5001313923593315e-05, "loss": 21.24, "step": 32680 }, { "epoch": 0.35, "learning_rate": 1.4998281618552537e-05, "loss": 21.5692, "step": 32690 }, { "epoch": 0.35, "learning_rate": 1.4995248700747355e-05, "loss": 21.233, "step": 32700 }, { "epoch": 0.35, "learning_rate": 1.499221517054959e-05, "loss": 21.1804, "step": 32710 }, { "epoch": 0.35, "learning_rate": 1.4989181028331136e-05, "loss": 21.029, "step": 32720 }, { "epoch": 0.35, "learning_rate": 1.4986146274463967e-05, "loss": 21.0666, "step": 32730 }, { "epoch": 0.35, "learning_rate": 1.4983110909320124e-05, "loss": 21.7252, "step": 32740 }, { "epoch": 0.35, "learning_rate": 1.4980074933271733e-05, "loss": 21.8432, "step": 32750 }, { "epoch": 0.35, "learning_rate": 1.4977038346690985e-05, "loss": 20.9971, "step": 32760 }, { "epoch": 0.35, "learning_rate": 1.4974001149950153e-05, "loss": 21.8612, "step": 32770 }, { "epoch": 0.35, "learning_rate": 1.4970963343421578e-05, "loss": 20.7655, "step": 32780 }, { "epoch": 0.35, "learning_rate": 1.4967924927477686e-05, "loss": 20.7539, "step": 32790 }, { "epoch": 0.35, "learning_rate": 1.496488590249097e-05, "loss": 20.6455, "step": 32800 }, { "epoch": 0.35, "learning_rate": 1.4961846268833992e-05, "loss": 20.8759, "step": 32810 }, { "epoch": 0.35, "learning_rate": 1.4958806026879411e-05, "loss": 21.3632, "step": 32820 }, { "epoch": 0.35, "learning_rate": 1.495576517699993e-05, "loss": 21.0256, "step": 32830 }, { "epoch": 0.36, "learning_rate": 1.4952723719568353e-05, "loss": 20.7133, "step": 32840 }, { "epoch": 0.36, "learning_rate": 1.494968165495754e-05, "loss": 21.4927, "step": 32850 }, { "epoch": 0.36, "learning_rate": 1.4946638983540434e-05, "loss": 21.4827, "step": 32860 }, { "epoch": 0.36, "learning_rate": 1.4943595705690059e-05, "loss": 21.4508, "step": 32870 }, { "epoch": 0.36, "learning_rate": 1.4940551821779498e-05, "loss": 21.0473, "step": 32880 }, { "epoch": 0.36, "learning_rate": 1.4937507332181915e-05, "loss": 21.4386, "step": 32890 }, { "epoch": 0.36, "learning_rate": 1.4934462237270558e-05, "loss": 20.8251, "step": 32900 }, { "epoch": 0.36, "learning_rate": 1.4931416537418733e-05, "loss": 21.8035, "step": 32910 }, { "epoch": 0.36, "learning_rate": 1.4928370232999825e-05, "loss": 21.0694, "step": 32920 }, { "epoch": 0.36, "learning_rate": 1.4925323324387307e-05, "loss": 21.278, "step": 32930 }, { "epoch": 0.36, "learning_rate": 1.49222758119547e-05, "loss": 21.2951, "step": 32940 }, { "epoch": 0.36, "learning_rate": 1.4919227696075628e-05, "loss": 21.0382, "step": 32950 }, { "epoch": 0.36, "learning_rate": 1.4916178977123768e-05, "loss": 22.0148, "step": 32960 }, { "epoch": 0.36, "learning_rate": 1.4913129655472876e-05, "loss": 21.078, "step": 32970 }, { "epoch": 0.36, "learning_rate": 1.491007973149679e-05, "loss": 20.658, "step": 32980 }, { "epoch": 0.36, "learning_rate": 1.4907029205569405e-05, "loss": 21.1342, "step": 32990 }, { "epoch": 0.36, "learning_rate": 1.4903978078064711e-05, "loss": 21.7622, "step": 33000 }, { "epoch": 0.36, "learning_rate": 1.490092634935676e-05, "loss": 20.869, "step": 33010 }, { "epoch": 0.36, "learning_rate": 1.4897874019819667e-05, "loss": 21.6627, "step": 33020 }, { "epoch": 0.36, "learning_rate": 1.4894821089827648e-05, "loss": 21.9046, "step": 33030 }, { "epoch": 0.36, "learning_rate": 1.4891767559754966e-05, "loss": 20.5896, "step": 33040 }, { "epoch": 0.36, "learning_rate": 1.4888713429975971e-05, "loss": 21.098, "step": 33050 }, { "epoch": 0.36, "learning_rate": 1.4885658700865092e-05, "loss": 20.9201, "step": 33060 }, { "epoch": 0.36, "learning_rate": 1.4882603372796812e-05, "loss": 21.0266, "step": 33070 }, { "epoch": 0.36, "learning_rate": 1.4879547446145703e-05, "loss": 21.3879, "step": 33080 }, { "epoch": 0.36, "learning_rate": 1.487649092128641e-05, "loss": 21.6931, "step": 33090 }, { "epoch": 0.36, "learning_rate": 1.4873433798593646e-05, "loss": 21.482, "step": 33100 }, { "epoch": 0.36, "learning_rate": 1.4870376078442198e-05, "loss": 21.2843, "step": 33110 }, { "epoch": 0.36, "learning_rate": 1.4867317761206925e-05, "loss": 21.7568, "step": 33120 }, { "epoch": 0.36, "learning_rate": 1.4864258847262765e-05, "loss": 21.2755, "step": 33130 }, { "epoch": 0.36, "learning_rate": 1.4861199336984724e-05, "loss": 22.117, "step": 33140 }, { "epoch": 0.36, "learning_rate": 1.4858139230747883e-05, "loss": 21.4456, "step": 33150 }, { "epoch": 0.36, "learning_rate": 1.4855078528927396e-05, "loss": 20.3511, "step": 33160 }, { "epoch": 0.36, "learning_rate": 1.485201723189849e-05, "loss": 21.0661, "step": 33170 }, { "epoch": 0.36, "learning_rate": 1.4848955340036464e-05, "loss": 21.1159, "step": 33180 }, { "epoch": 0.36, "learning_rate": 1.4845892853716692e-05, "loss": 20.7096, "step": 33190 }, { "epoch": 0.36, "learning_rate": 1.4842829773314618e-05, "loss": 21.6132, "step": 33200 }, { "epoch": 0.36, "learning_rate": 1.4839766099205761e-05, "loss": 21.4665, "step": 33210 }, { "epoch": 0.36, "learning_rate": 1.4836701831765711e-05, "loss": 20.8333, "step": 33220 }, { "epoch": 0.36, "learning_rate": 1.4833636971370133e-05, "loss": 21.2521, "step": 33230 }, { "epoch": 0.36, "learning_rate": 1.4830571518394767e-05, "loss": 21.6158, "step": 33240 }, { "epoch": 0.36, "learning_rate": 1.4827505473215415e-05, "loss": 21.4558, "step": 33250 }, { "epoch": 0.36, "learning_rate": 1.4824438836207967e-05, "loss": 21.1133, "step": 33260 }, { "epoch": 0.36, "learning_rate": 1.4821371607748366e-05, "loss": 21.1915, "step": 33270 }, { "epoch": 0.36, "learning_rate": 1.4818303788212655e-05, "loss": 21.4772, "step": 33280 }, { "epoch": 0.36, "learning_rate": 1.481523537797692e-05, "loss": 21.4384, "step": 33290 }, { "epoch": 0.36, "learning_rate": 1.4812166377417336e-05, "loss": 21.6937, "step": 33300 }, { "epoch": 0.36, "learning_rate": 1.4809096786910152e-05, "loss": 21.1075, "step": 33310 }, { "epoch": 0.36, "learning_rate": 1.4806026606831676e-05, "loss": 21.7746, "step": 33320 }, { "epoch": 0.36, "learning_rate": 1.4802955837558308e-05, "loss": 21.3845, "step": 33330 }, { "epoch": 0.36, "learning_rate": 1.4799884479466498e-05, "loss": 21.4943, "step": 33340 }, { "epoch": 0.36, "learning_rate": 1.4796812532932783e-05, "loss": 21.0406, "step": 33350 }, { "epoch": 0.36, "learning_rate": 1.4793739998333774e-05, "loss": 20.9933, "step": 33360 }, { "epoch": 0.36, "learning_rate": 1.479066687604614e-05, "loss": 21.3139, "step": 33370 }, { "epoch": 0.36, "learning_rate": 1.4787593166446636e-05, "loss": 21.5668, "step": 33380 }, { "epoch": 0.36, "learning_rate": 1.4784518869912081e-05, "loss": 21.7323, "step": 33390 }, { "epoch": 0.36, "learning_rate": 1.4781443986819369e-05, "loss": 20.9675, "step": 33400 }, { "epoch": 0.36, "learning_rate": 1.4778368517545465e-05, "loss": 21.7949, "step": 33410 }, { "epoch": 0.36, "learning_rate": 1.4775292462467406e-05, "loss": 21.6814, "step": 33420 }, { "epoch": 0.36, "learning_rate": 1.4772215821962302e-05, "loss": 21.7424, "step": 33430 }, { "epoch": 0.36, "learning_rate": 1.4769138596407336e-05, "loss": 21.2667, "step": 33440 }, { "epoch": 0.36, "learning_rate": 1.4766060786179752e-05, "loss": 21.2683, "step": 33450 }, { "epoch": 0.36, "learning_rate": 1.4762982391656886e-05, "loss": 21.9482, "step": 33460 }, { "epoch": 0.36, "learning_rate": 1.4759903413216123e-05, "loss": 22.2254, "step": 33470 }, { "epoch": 0.36, "learning_rate": 1.4756823851234937e-05, "loss": 21.1439, "step": 33480 }, { "epoch": 0.36, "learning_rate": 1.4753743706090871e-05, "loss": 21.1551, "step": 33490 }, { "epoch": 0.36, "learning_rate": 1.475066297816152e-05, "loss": 21.6087, "step": 33500 }, { "epoch": 0.36, "learning_rate": 1.4747581667824581e-05, "loss": 21.7554, "step": 33510 }, { "epoch": 0.36, "learning_rate": 1.47444997754578e-05, "loss": 21.801, "step": 33520 }, { "epoch": 0.36, "learning_rate": 1.4741417301439004e-05, "loss": 21.26, "step": 33530 }, { "epoch": 0.36, "learning_rate": 1.4738334246146091e-05, "loss": 21.5877, "step": 33540 }, { "epoch": 0.36, "learning_rate": 1.4735250609957024e-05, "loss": 21.5943, "step": 33550 }, { "epoch": 0.36, "learning_rate": 1.473216639324984e-05, "loss": 21.7748, "step": 33560 }, { "epoch": 0.36, "learning_rate": 1.4729081596402655e-05, "loss": 21.4059, "step": 33570 }, { "epoch": 0.36, "learning_rate": 1.4725996219793645e-05, "loss": 20.7783, "step": 33580 }, { "epoch": 0.36, "learning_rate": 1.4722910263801064e-05, "loss": 21.1901, "step": 33590 }, { "epoch": 0.36, "learning_rate": 1.4719823728803233e-05, "loss": 21.3185, "step": 33600 }, { "epoch": 0.36, "learning_rate": 1.4716736615178547e-05, "loss": 21.7452, "step": 33610 }, { "epoch": 0.36, "learning_rate": 1.471364892330547e-05, "loss": 21.1968, "step": 33620 }, { "epoch": 0.36, "learning_rate": 1.4710560653562538e-05, "loss": 20.773, "step": 33630 }, { "epoch": 0.36, "learning_rate": 1.4707471806328359e-05, "loss": 21.4922, "step": 33640 }, { "epoch": 0.36, "learning_rate": 1.4704382381981608e-05, "loss": 21.8992, "step": 33650 }, { "epoch": 0.36, "learning_rate": 1.4701292380901034e-05, "loss": 21.84, "step": 33660 }, { "epoch": 0.36, "learning_rate": 1.4698201803465456e-05, "loss": 20.7969, "step": 33670 }, { "epoch": 0.36, "learning_rate": 1.4695110650053762e-05, "loss": 21.6708, "step": 33680 }, { "epoch": 0.36, "learning_rate": 1.4692018921044913e-05, "loss": 21.1685, "step": 33690 }, { "epoch": 0.36, "learning_rate": 1.468892661681794e-05, "loss": 20.9559, "step": 33700 }, { "epoch": 0.36, "learning_rate": 1.4685833737751942e-05, "loss": 21.7526, "step": 33710 }, { "epoch": 0.36, "learning_rate": 1.4682740284226093e-05, "loss": 21.3514, "step": 33720 }, { "epoch": 0.36, "learning_rate": 1.4679646256619634e-05, "loss": 21.0037, "step": 33730 }, { "epoch": 0.36, "learning_rate": 1.4676551655311882e-05, "loss": 21.8607, "step": 33740 }, { "epoch": 0.36, "learning_rate": 1.467345648068221e-05, "loss": 21.2053, "step": 33750 }, { "epoch": 0.36, "learning_rate": 1.4670360733110079e-05, "loss": 21.3173, "step": 33760 }, { "epoch": 0.37, "learning_rate": 1.4667264412975007e-05, "loss": 21.4801, "step": 33770 }, { "epoch": 0.37, "learning_rate": 1.466416752065659e-05, "loss": 21.3724, "step": 33780 }, { "epoch": 0.37, "learning_rate": 1.4661070056534493e-05, "loss": 20.7321, "step": 33790 }, { "epoch": 0.37, "learning_rate": 1.4657972020988447e-05, "loss": 20.9142, "step": 33800 }, { "epoch": 0.37, "learning_rate": 1.4654873414398256e-05, "loss": 21.7343, "step": 33810 }, { "epoch": 0.37, "learning_rate": 1.4651774237143794e-05, "loss": 20.8217, "step": 33820 }, { "epoch": 0.37, "learning_rate": 1.4648674489605006e-05, "loss": 21.1798, "step": 33830 }, { "epoch": 0.37, "learning_rate": 1.4645574172161908e-05, "loss": 21.524, "step": 33840 }, { "epoch": 0.37, "learning_rate": 1.4642473285194576e-05, "loss": 20.4598, "step": 33850 }, { "epoch": 0.37, "learning_rate": 1.4639371829083167e-05, "loss": 21.7451, "step": 33860 }, { "epoch": 0.37, "learning_rate": 1.4636269804207906e-05, "loss": 21.1445, "step": 33870 }, { "epoch": 0.37, "learning_rate": 1.4633167210949082e-05, "loss": 21.6447, "step": 33880 }, { "epoch": 0.37, "learning_rate": 1.4630064049687063e-05, "loss": 21.8392, "step": 33890 }, { "epoch": 0.37, "learning_rate": 1.462696032080228e-05, "loss": 21.8956, "step": 33900 }, { "epoch": 0.37, "learning_rate": 1.4623856024675227e-05, "loss": 21.1042, "step": 33910 }, { "epoch": 0.37, "learning_rate": 1.4620751161686484e-05, "loss": 21.1176, "step": 33920 }, { "epoch": 0.37, "learning_rate": 1.4617645732216686e-05, "loss": 20.6308, "step": 33930 }, { "epoch": 0.37, "learning_rate": 1.4614539736646547e-05, "loss": 21.6251, "step": 33940 }, { "epoch": 0.37, "learning_rate": 1.4611433175356848e-05, "loss": 21.5329, "step": 33950 }, { "epoch": 0.37, "learning_rate": 1.460832604872843e-05, "loss": 21.0004, "step": 33960 }, { "epoch": 0.37, "learning_rate": 1.460521835714222e-05, "loss": 21.5771, "step": 33970 }, { "epoch": 0.37, "learning_rate": 1.4602110100979198e-05, "loss": 21.6235, "step": 33980 }, { "epoch": 0.37, "learning_rate": 1.4599001280620428e-05, "loss": 21.5603, "step": 33990 }, { "epoch": 0.37, "learning_rate": 1.4595891896447034e-05, "loss": 20.9244, "step": 34000 }, { "epoch": 0.37, "learning_rate": 1.4592781948840204e-05, "loss": 21.3671, "step": 34010 }, { "epoch": 0.37, "learning_rate": 1.4589671438181212e-05, "loss": 21.3463, "step": 34020 }, { "epoch": 0.37, "learning_rate": 1.4586560364851386e-05, "loss": 21.6761, "step": 34030 }, { "epoch": 0.37, "learning_rate": 1.4583448729232128e-05, "loss": 21.7516, "step": 34040 }, { "epoch": 0.37, "learning_rate": 1.4580336531704909e-05, "loss": 21.3671, "step": 34050 }, { "epoch": 0.37, "learning_rate": 1.457722377265127e-05, "loss": 20.7787, "step": 34060 }, { "epoch": 0.37, "learning_rate": 1.4574110452452819e-05, "loss": 21.4909, "step": 34070 }, { "epoch": 0.37, "learning_rate": 1.4570996571491236e-05, "loss": 21.4239, "step": 34080 }, { "epoch": 0.37, "learning_rate": 1.4567882130148263e-05, "loss": 22.2645, "step": 34090 }, { "epoch": 0.37, "learning_rate": 1.4564767128805716e-05, "loss": 21.2225, "step": 34100 }, { "epoch": 0.37, "learning_rate": 1.4561651567845483e-05, "loss": 21.5216, "step": 34110 }, { "epoch": 0.37, "learning_rate": 1.4558535447649512e-05, "loss": 20.9423, "step": 34120 }, { "epoch": 0.37, "learning_rate": 1.4555418768599823e-05, "loss": 21.5943, "step": 34130 }, { "epoch": 0.37, "learning_rate": 1.4552301531078508e-05, "loss": 21.1272, "step": 34140 }, { "epoch": 0.37, "learning_rate": 1.4549183735467725e-05, "loss": 20.9877, "step": 34150 }, { "epoch": 0.37, "learning_rate": 1.4546065382149697e-05, "loss": 21.0884, "step": 34160 }, { "epoch": 0.37, "learning_rate": 1.4542946471506723e-05, "loss": 21.9883, "step": 34170 }, { "epoch": 0.37, "learning_rate": 1.4539827003921161e-05, "loss": 21.6225, "step": 34180 }, { "epoch": 0.37, "learning_rate": 1.4536706979775445e-05, "loss": 22.3655, "step": 34190 }, { "epoch": 0.37, "learning_rate": 1.4533586399452077e-05, "loss": 20.7671, "step": 34200 }, { "epoch": 0.37, "learning_rate": 1.4530465263333619e-05, "loss": 21.7048, "step": 34210 }, { "epoch": 0.37, "learning_rate": 1.452734357180271e-05, "loss": 21.4407, "step": 34220 }, { "epoch": 0.37, "learning_rate": 1.4524221325242054e-05, "loss": 21.2512, "step": 34230 }, { "epoch": 0.37, "learning_rate": 1.4521098524034417e-05, "loss": 20.8208, "step": 34240 }, { "epoch": 0.37, "learning_rate": 1.4517975168562652e-05, "loss": 21.0485, "step": 34250 }, { "epoch": 0.37, "learning_rate": 1.4514851259209658e-05, "loss": 21.4701, "step": 34260 }, { "epoch": 0.37, "learning_rate": 1.4511726796358408e-05, "loss": 21.5802, "step": 34270 }, { "epoch": 0.37, "learning_rate": 1.4508601780391949e-05, "loss": 21.0936, "step": 34280 }, { "epoch": 0.37, "learning_rate": 1.450547621169339e-05, "loss": 21.7015, "step": 34290 }, { "epoch": 0.37, "learning_rate": 1.4502350090645919e-05, "loss": 20.8067, "step": 34300 }, { "epoch": 0.37, "learning_rate": 1.4499223417632772e-05, "loss": 21.4118, "step": 34310 }, { "epoch": 0.37, "learning_rate": 1.4496096193037268e-05, "loss": 21.8745, "step": 34320 }, { "epoch": 0.37, "learning_rate": 1.4492968417242793e-05, "loss": 20.7336, "step": 34330 }, { "epoch": 0.37, "learning_rate": 1.4489840090632787e-05, "loss": 20.0058, "step": 34340 }, { "epoch": 0.37, "learning_rate": 1.4486711213590779e-05, "loss": 21.1765, "step": 34350 }, { "epoch": 0.37, "learning_rate": 1.4483581786500342e-05, "loss": 21.8135, "step": 34360 }, { "epoch": 0.37, "learning_rate": 1.4480451809745138e-05, "loss": 21.5908, "step": 34370 }, { "epoch": 0.37, "learning_rate": 1.447732128370888e-05, "loss": 20.9713, "step": 34380 }, { "epoch": 0.37, "learning_rate": 1.4474190208775358e-05, "loss": 21.2202, "step": 34390 }, { "epoch": 0.37, "learning_rate": 1.4471058585328426e-05, "loss": 21.565, "step": 34400 }, { "epoch": 0.37, "learning_rate": 1.4467926413752007e-05, "loss": 21.2798, "step": 34410 }, { "epoch": 0.37, "learning_rate": 1.4464793694430084e-05, "loss": 21.5375, "step": 34420 }, { "epoch": 0.37, "learning_rate": 1.4461660427746717e-05, "loss": 20.0121, "step": 34430 }, { "epoch": 0.37, "learning_rate": 1.4458526614086029e-05, "loss": 21.2963, "step": 34440 }, { "epoch": 0.37, "learning_rate": 1.4455392253832208e-05, "loss": 21.6159, "step": 34450 }, { "epoch": 0.37, "learning_rate": 1.4452257347369516e-05, "loss": 21.0983, "step": 34460 }, { "epoch": 0.37, "learning_rate": 1.4449121895082268e-05, "loss": 21.6905, "step": 34470 }, { "epoch": 0.37, "learning_rate": 1.4445985897354862e-05, "loss": 20.8333, "step": 34480 }, { "epoch": 0.37, "learning_rate": 1.4442849354571753e-05, "loss": 21.2926, "step": 34490 }, { "epoch": 0.37, "learning_rate": 1.4439712267117467e-05, "loss": 21.1327, "step": 34500 }, { "epoch": 0.37, "learning_rate": 1.4436574635376594e-05, "loss": 21.4857, "step": 34510 }, { "epoch": 0.37, "learning_rate": 1.443343645973379e-05, "loss": 21.9807, "step": 34520 }, { "epoch": 0.37, "learning_rate": 1.4430297740573784e-05, "loss": 21.1605, "step": 34530 }, { "epoch": 0.37, "learning_rate": 1.4427158478281365e-05, "loss": 21.7695, "step": 34540 }, { "epoch": 0.37, "learning_rate": 1.442401867324139e-05, "loss": 21.2887, "step": 34550 }, { "epoch": 0.37, "learning_rate": 1.4420878325838788e-05, "loss": 21.7259, "step": 34560 }, { "epoch": 0.37, "learning_rate": 1.4417737436458543e-05, "loss": 22.2204, "step": 34570 }, { "epoch": 0.37, "learning_rate": 1.4414596005485717e-05, "loss": 21.465, "step": 34580 }, { "epoch": 0.37, "learning_rate": 1.4411454033305434e-05, "loss": 21.3442, "step": 34590 }, { "epoch": 0.37, "learning_rate": 1.440831152030288e-05, "loss": 20.1003, "step": 34600 }, { "epoch": 0.37, "learning_rate": 1.4405168466863315e-05, "loss": 21.6209, "step": 34610 }, { "epoch": 0.37, "learning_rate": 1.4402024873372063e-05, "loss": 21.0275, "step": 34620 }, { "epoch": 0.37, "learning_rate": 1.4398880740214509e-05, "loss": 21.4959, "step": 34630 }, { "epoch": 0.37, "learning_rate": 1.4395736067776112e-05, "loss": 21.7487, "step": 34640 }, { "epoch": 0.37, "learning_rate": 1.4392590856442388e-05, "loss": 20.8762, "step": 34650 }, { "epoch": 0.37, "learning_rate": 1.438944510659893e-05, "loss": 21.1041, "step": 34660 }, { "epoch": 0.37, "learning_rate": 1.4386298818631388e-05, "loss": 21.3924, "step": 34670 }, { "epoch": 0.37, "learning_rate": 1.438315199292548e-05, "loss": 21.3592, "step": 34680 }, { "epoch": 0.38, "learning_rate": 1.4380004629866993e-05, "loss": 21.3324, "step": 34690 }, { "epoch": 0.38, "learning_rate": 1.437685672984178e-05, "loss": 22.2567, "step": 34700 }, { "epoch": 0.38, "learning_rate": 1.4373708293235753e-05, "loss": 21.383, "step": 34710 }, { "epoch": 0.38, "learning_rate": 1.4370559320434899e-05, "loss": 21.8395, "step": 34720 }, { "epoch": 0.38, "learning_rate": 1.4367409811825264e-05, "loss": 21.4659, "step": 34730 }, { "epoch": 0.38, "learning_rate": 1.4364259767792963e-05, "loss": 21.383, "step": 34740 }, { "epoch": 0.38, "learning_rate": 1.4361109188724174e-05, "loss": 21.1815, "step": 34750 }, { "epoch": 0.38, "learning_rate": 1.4357958075005147e-05, "loss": 21.2465, "step": 34760 }, { "epoch": 0.38, "learning_rate": 1.4354806427022187e-05, "loss": 20.8452, "step": 34770 }, { "epoch": 0.38, "learning_rate": 1.4351654245161675e-05, "loss": 21.7178, "step": 34780 }, { "epoch": 0.38, "learning_rate": 1.4348501529810048e-05, "loss": 21.1135, "step": 34790 }, { "epoch": 0.38, "learning_rate": 1.4345348281353814e-05, "loss": 21.4315, "step": 34800 }, { "epoch": 0.38, "learning_rate": 1.4342194500179554e-05, "loss": 21.4609, "step": 34810 }, { "epoch": 0.38, "learning_rate": 1.4339040186673895e-05, "loss": 21.5505, "step": 34820 }, { "epoch": 0.38, "learning_rate": 1.4335885341223543e-05, "loss": 21.2583, "step": 34830 }, { "epoch": 0.38, "learning_rate": 1.4332729964215273e-05, "loss": 21.6472, "step": 34840 }, { "epoch": 0.38, "learning_rate": 1.4329574056035908e-05, "loss": 21.505, "step": 34850 }, { "epoch": 0.38, "learning_rate": 1.4326417617072354e-05, "loss": 20.5836, "step": 34860 }, { "epoch": 0.38, "learning_rate": 1.4323260647711574e-05, "loss": 21.7205, "step": 34870 }, { "epoch": 0.38, "learning_rate": 1.4320103148340592e-05, "loss": 21.0495, "step": 34880 }, { "epoch": 0.38, "learning_rate": 1.4316945119346505e-05, "loss": 20.8459, "step": 34890 }, { "epoch": 0.38, "learning_rate": 1.4313786561116475e-05, "loss": 19.8367, "step": 34900 }, { "epoch": 0.38, "learning_rate": 1.4310627474037717e-05, "loss": 20.6907, "step": 34910 }, { "epoch": 0.38, "learning_rate": 1.4307467858497531e-05, "loss": 21.0939, "step": 34920 }, { "epoch": 0.38, "learning_rate": 1.4304307714883255e-05, "loss": 21.6963, "step": 34930 }, { "epoch": 0.38, "learning_rate": 1.430114704358232e-05, "loss": 21.6539, "step": 34940 }, { "epoch": 0.38, "learning_rate": 1.42979858449822e-05, "loss": 21.8401, "step": 34950 }, { "epoch": 0.38, "learning_rate": 1.4294824119470451e-05, "loss": 21.3907, "step": 34960 }, { "epoch": 0.38, "learning_rate": 1.4291661867434678e-05, "loss": 21.2248, "step": 34970 }, { "epoch": 0.38, "learning_rate": 1.4288499089262557e-05, "loss": 21.3075, "step": 34980 }, { "epoch": 0.38, "learning_rate": 1.4285335785341834e-05, "loss": 21.6618, "step": 34990 }, { "epoch": 0.38, "learning_rate": 1.4282171956060308e-05, "loss": 21.2137, "step": 35000 }, { "epoch": 0.38, "learning_rate": 1.4279007601805854e-05, "loss": 21.6487, "step": 35010 }, { "epoch": 0.38, "learning_rate": 1.4275842722966405e-05, "loss": 21.8418, "step": 35020 }, { "epoch": 0.38, "learning_rate": 1.4272677319929955e-05, "loss": 21.7158, "step": 35030 }, { "epoch": 0.38, "learning_rate": 1.4269511393084572e-05, "loss": 21.6248, "step": 35040 }, { "epoch": 0.38, "learning_rate": 1.4266344942818382e-05, "loss": 21.4521, "step": 35050 }, { "epoch": 0.38, "learning_rate": 1.4263177969519571e-05, "loss": 20.8755, "step": 35060 }, { "epoch": 0.38, "learning_rate": 1.42600104735764e-05, "loss": 21.6756, "step": 35070 }, { "epoch": 0.38, "learning_rate": 1.4256842455377186e-05, "loss": 21.1886, "step": 35080 }, { "epoch": 0.38, "learning_rate": 1.4253673915310313e-05, "loss": 21.7147, "step": 35090 }, { "epoch": 0.38, "learning_rate": 1.425050485376423e-05, "loss": 21.5506, "step": 35100 }, { "epoch": 0.38, "learning_rate": 1.4247335271127441e-05, "loss": 20.5076, "step": 35110 }, { "epoch": 0.38, "learning_rate": 1.4244165167788527e-05, "loss": 21.479, "step": 35120 }, { "epoch": 0.38, "learning_rate": 1.4240994544136127e-05, "loss": 21.2509, "step": 35130 }, { "epoch": 0.38, "learning_rate": 1.4237823400558939e-05, "loss": 21.0062, "step": 35140 }, { "epoch": 0.38, "learning_rate": 1.4234651737445738e-05, "loss": 20.8996, "step": 35150 }, { "epoch": 0.38, "learning_rate": 1.4231479555185343e-05, "loss": 21.0531, "step": 35160 }, { "epoch": 0.38, "learning_rate": 1.4228306854166656e-05, "loss": 21.9514, "step": 35170 }, { "epoch": 0.38, "learning_rate": 1.422513363477863e-05, "loss": 20.9747, "step": 35180 }, { "epoch": 0.38, "learning_rate": 1.4221959897410291e-05, "loss": 21.0204, "step": 35190 }, { "epoch": 0.38, "learning_rate": 1.4218785642450718e-05, "loss": 21.2738, "step": 35200 }, { "epoch": 0.38, "learning_rate": 1.421561087028906e-05, "loss": 21.2987, "step": 35210 }, { "epoch": 0.38, "learning_rate": 1.4212435581314533e-05, "loss": 21.7243, "step": 35220 }, { "epoch": 0.38, "learning_rate": 1.4209259775916402e-05, "loss": 21.1322, "step": 35230 }, { "epoch": 0.38, "learning_rate": 1.4206083454484016e-05, "loss": 21.1199, "step": 35240 }, { "epoch": 0.38, "learning_rate": 1.4202906617406768e-05, "loss": 21.4387, "step": 35250 }, { "epoch": 0.38, "learning_rate": 1.4199729265074124e-05, "loss": 21.8315, "step": 35260 }, { "epoch": 0.38, "learning_rate": 1.4196551397875617e-05, "loss": 21.2638, "step": 35270 }, { "epoch": 0.38, "learning_rate": 1.4193373016200828e-05, "loss": 21.9488, "step": 35280 }, { "epoch": 0.38, "learning_rate": 1.419019412043942e-05, "loss": 21.1275, "step": 35290 }, { "epoch": 0.38, "learning_rate": 1.4187014710981106e-05, "loss": 21.4525, "step": 35300 }, { "epoch": 0.38, "learning_rate": 1.4183834788215663e-05, "loss": 21.3088, "step": 35310 }, { "epoch": 0.38, "learning_rate": 1.4180654352532938e-05, "loss": 21.5528, "step": 35320 }, { "epoch": 0.38, "learning_rate": 1.4177473404322836e-05, "loss": 21.5545, "step": 35330 }, { "epoch": 0.38, "learning_rate": 1.417429194397532e-05, "loss": 20.6543, "step": 35340 }, { "epoch": 0.38, "learning_rate": 1.417110997188043e-05, "loss": 21.3112, "step": 35350 }, { "epoch": 0.38, "learning_rate": 1.4167927488428253e-05, "loss": 21.6122, "step": 35360 }, { "epoch": 0.38, "learning_rate": 1.4164744494008948e-05, "loss": 21.3514, "step": 35370 }, { "epoch": 0.38, "learning_rate": 1.4161560989012738e-05, "loss": 21.1417, "step": 35380 }, { "epoch": 0.38, "learning_rate": 1.4158376973829894e-05, "loss": 21.9787, "step": 35390 }, { "epoch": 0.38, "learning_rate": 1.4155192448850774e-05, "loss": 21.4064, "step": 35400 }, { "epoch": 0.38, "learning_rate": 1.4152007414465771e-05, "loss": 20.8739, "step": 35410 }, { "epoch": 0.38, "learning_rate": 1.4148821871065367e-05, "loss": 21.9028, "step": 35420 }, { "epoch": 0.38, "learning_rate": 1.4145635819040089e-05, "loss": 21.4645, "step": 35430 }, { "epoch": 0.38, "learning_rate": 1.4142449258780527e-05, "loss": 21.0454, "step": 35440 }, { "epoch": 0.38, "learning_rate": 1.4139262190677343e-05, "loss": 21.2242, "step": 35450 }, { "epoch": 0.38, "learning_rate": 1.4136074615121253e-05, "loss": 21.3242, "step": 35460 }, { "epoch": 0.38, "learning_rate": 1.4132886532503039e-05, "loss": 21.0412, "step": 35470 }, { "epoch": 0.38, "learning_rate": 1.4129697943213545e-05, "loss": 21.4789, "step": 35480 }, { "epoch": 0.38, "learning_rate": 1.412650884764367e-05, "loss": 21.1413, "step": 35490 }, { "epoch": 0.38, "learning_rate": 1.4123319246184388e-05, "loss": 21.4304, "step": 35500 }, { "epoch": 0.38, "learning_rate": 1.4120129139226727e-05, "loss": 21.7277, "step": 35510 }, { "epoch": 0.38, "learning_rate": 1.4116938527161776e-05, "loss": 21.888, "step": 35520 }, { "epoch": 0.38, "learning_rate": 1.4113747410380692e-05, "loss": 21.7764, "step": 35530 }, { "epoch": 0.38, "learning_rate": 1.4110555789274684e-05, "loss": 20.9758, "step": 35540 }, { "epoch": 0.38, "learning_rate": 1.4107363664235035e-05, "loss": 21.7323, "step": 35550 }, { "epoch": 0.38, "learning_rate": 1.4104171035653077e-05, "loss": 21.3814, "step": 35560 }, { "epoch": 0.38, "learning_rate": 1.4100977903920217e-05, "loss": 20.9296, "step": 35570 }, { "epoch": 0.38, "learning_rate": 1.4097784269427915e-05, "loss": 21.8279, "step": 35580 }, { "epoch": 0.38, "learning_rate": 1.4094590132567692e-05, "loss": 20.8267, "step": 35590 }, { "epoch": 0.38, "learning_rate": 1.4091395493731134e-05, "loss": 21.0298, "step": 35600 }, { "epoch": 0.38, "learning_rate": 1.4088200353309894e-05, "loss": 20.8502, "step": 35610 }, { "epoch": 0.39, "learning_rate": 1.408500471169567e-05, "loss": 21.5368, "step": 35620 }, { "epoch": 0.39, "learning_rate": 1.408180856928024e-05, "loss": 21.9958, "step": 35630 }, { "epoch": 0.39, "learning_rate": 1.4078611926455428e-05, "loss": 21.5616, "step": 35640 }, { "epoch": 0.39, "learning_rate": 1.4075414783613135e-05, "loss": 20.6728, "step": 35650 }, { "epoch": 0.39, "learning_rate": 1.4072217141145308e-05, "loss": 21.7007, "step": 35660 }, { "epoch": 0.39, "learning_rate": 1.4069018999443964e-05, "loss": 21.1708, "step": 35670 }, { "epoch": 0.39, "learning_rate": 1.4065820358901182e-05, "loss": 21.3457, "step": 35680 }, { "epoch": 0.39, "learning_rate": 1.4062621219909091e-05, "loss": 21.0754, "step": 35690 }, { "epoch": 0.39, "learning_rate": 1.4059421582859902e-05, "loss": 20.589, "step": 35700 }, { "epoch": 0.39, "learning_rate": 1.4056221448145866e-05, "loss": 20.9562, "step": 35710 }, { "epoch": 0.39, "learning_rate": 1.4053020816159303e-05, "loss": 21.6626, "step": 35720 }, { "epoch": 0.39, "learning_rate": 1.40498196872926e-05, "loss": 21.9056, "step": 35730 }, { "epoch": 0.39, "learning_rate": 1.4046618061938193e-05, "loss": 21.6216, "step": 35740 }, { "epoch": 0.39, "learning_rate": 1.4043415940488594e-05, "loss": 21.2153, "step": 35750 }, { "epoch": 0.39, "learning_rate": 1.4040213323336361e-05, "loss": 21.5484, "step": 35760 }, { "epoch": 0.39, "learning_rate": 1.4037010210874114e-05, "loss": 21.0042, "step": 35770 }, { "epoch": 0.39, "learning_rate": 1.403380660349455e-05, "loss": 21.2531, "step": 35780 }, { "epoch": 0.39, "learning_rate": 1.4030602501590407e-05, "loss": 21.5866, "step": 35790 }, { "epoch": 0.39, "learning_rate": 1.4027397905554497e-05, "loss": 21.692, "step": 35800 }, { "epoch": 0.39, "learning_rate": 1.4024192815779683e-05, "loss": 20.8253, "step": 35810 }, { "epoch": 0.39, "learning_rate": 1.4020987232658896e-05, "loss": 21.5601, "step": 35820 }, { "epoch": 0.39, "learning_rate": 1.4017781156585124e-05, "loss": 21.1521, "step": 35830 }, { "epoch": 0.39, "learning_rate": 1.4014574587951414e-05, "loss": 21.6704, "step": 35840 }, { "epoch": 0.39, "learning_rate": 1.4011367527150876e-05, "loss": 21.3363, "step": 35850 }, { "epoch": 0.39, "learning_rate": 1.4008159974576685e-05, "loss": 21.0636, "step": 35860 }, { "epoch": 0.39, "learning_rate": 1.4004951930622061e-05, "loss": 21.2501, "step": 35870 }, { "epoch": 0.39, "learning_rate": 1.4001743395680306e-05, "loss": 21.551, "step": 35880 }, { "epoch": 0.39, "learning_rate": 1.3998534370144758e-05, "loss": 21.6603, "step": 35890 }, { "epoch": 0.39, "learning_rate": 1.3995324854408836e-05, "loss": 21.3401, "step": 35900 }, { "epoch": 0.39, "learning_rate": 1.3992114848866009e-05, "loss": 21.181, "step": 35910 }, { "epoch": 0.39, "learning_rate": 1.3988904353909807e-05, "loss": 20.8352, "step": 35920 }, { "epoch": 0.39, "learning_rate": 1.398569336993382e-05, "loss": 21.2376, "step": 35930 }, { "epoch": 0.39, "learning_rate": 1.3982481897331698e-05, "loss": 21.1323, "step": 35940 }, { "epoch": 0.39, "learning_rate": 1.3979269936497155e-05, "loss": 20.8176, "step": 35950 }, { "epoch": 0.39, "learning_rate": 1.397605748782396e-05, "loss": 21.9652, "step": 35960 }, { "epoch": 0.39, "learning_rate": 1.397284455170594e-05, "loss": 20.9293, "step": 35970 }, { "epoch": 0.39, "learning_rate": 1.3969631128536986e-05, "loss": 21.1269, "step": 35980 }, { "epoch": 0.39, "learning_rate": 1.3966417218711053e-05, "loss": 21.6995, "step": 35990 }, { "epoch": 0.39, "learning_rate": 1.3963202822622145e-05, "loss": 22.3265, "step": 36000 }, { "epoch": 0.39, "learning_rate": 1.3959987940664328e-05, "loss": 20.7602, "step": 36010 }, { "epoch": 0.39, "learning_rate": 1.3956772573231737e-05, "loss": 21.5811, "step": 36020 }, { "epoch": 0.39, "learning_rate": 1.395355672071856e-05, "loss": 20.8455, "step": 36030 }, { "epoch": 0.39, "learning_rate": 1.3950340383519041e-05, "loss": 21.2874, "step": 36040 }, { "epoch": 0.39, "learning_rate": 1.394712356202749e-05, "loss": 20.8436, "step": 36050 }, { "epoch": 0.39, "learning_rate": 1.3943906256638266e-05, "loss": 20.6552, "step": 36060 }, { "epoch": 0.39, "learning_rate": 1.3940688467745804e-05, "loss": 21.2529, "step": 36070 }, { "epoch": 0.39, "learning_rate": 1.3937470195744584e-05, "loss": 21.6799, "step": 36080 }, { "epoch": 0.39, "learning_rate": 1.3934251441029152e-05, "loss": 21.4219, "step": 36090 }, { "epoch": 0.39, "learning_rate": 1.3931032203994108e-05, "loss": 20.7553, "step": 36100 }, { "epoch": 0.39, "learning_rate": 1.3927812485034119e-05, "loss": 20.3159, "step": 36110 }, { "epoch": 0.39, "learning_rate": 1.3924592284543904e-05, "loss": 21.005, "step": 36120 }, { "epoch": 0.39, "learning_rate": 1.3921371602918239e-05, "loss": 21.0935, "step": 36130 }, { "epoch": 0.39, "learning_rate": 1.3918150440551971e-05, "loss": 21.804, "step": 36140 }, { "epoch": 0.39, "learning_rate": 1.3914928797839996e-05, "loss": 21.0853, "step": 36150 }, { "epoch": 0.39, "learning_rate": 1.3911706675177273e-05, "loss": 21.1952, "step": 36160 }, { "epoch": 0.39, "learning_rate": 1.3908484072958814e-05, "loss": 21.2925, "step": 36170 }, { "epoch": 0.39, "learning_rate": 1.3905260991579697e-05, "loss": 21.1481, "step": 36180 }, { "epoch": 0.39, "learning_rate": 1.3902037431435054e-05, "loss": 21.6943, "step": 36190 }, { "epoch": 0.39, "learning_rate": 1.3898813392920074e-05, "loss": 21.7501, "step": 36200 }, { "epoch": 0.39, "learning_rate": 1.389558887643002e-05, "loss": 20.7856, "step": 36210 }, { "epoch": 0.39, "learning_rate": 1.3892363882360189e-05, "loss": 21.1075, "step": 36220 }, { "epoch": 0.39, "learning_rate": 1.3889138411105953e-05, "loss": 21.8163, "step": 36230 }, { "epoch": 0.39, "learning_rate": 1.3885912463062744e-05, "loss": 20.4891, "step": 36240 }, { "epoch": 0.39, "learning_rate": 1.388268603862604e-05, "loss": 21.1215, "step": 36250 }, { "epoch": 0.39, "learning_rate": 1.3879459138191388e-05, "loss": 20.7893, "step": 36260 }, { "epoch": 0.39, "learning_rate": 1.387623176215439e-05, "loss": 21.099, "step": 36270 }, { "epoch": 0.39, "learning_rate": 1.3873003910910704e-05, "loss": 22.1323, "step": 36280 }, { "epoch": 0.39, "learning_rate": 1.3869775584856054e-05, "loss": 21.5152, "step": 36290 }, { "epoch": 0.39, "learning_rate": 1.3866546784386208e-05, "loss": 21.2515, "step": 36300 }, { "epoch": 0.39, "learning_rate": 1.3863317509897007e-05, "loss": 21.9391, "step": 36310 }, { "epoch": 0.39, "learning_rate": 1.3860087761784344e-05, "loss": 21.6154, "step": 36320 }, { "epoch": 0.39, "learning_rate": 1.3856857540444166e-05, "loss": 21.211, "step": 36330 }, { "epoch": 0.39, "learning_rate": 1.3853626846272486e-05, "loss": 21.373, "step": 36340 }, { "epoch": 0.39, "learning_rate": 1.385039567966537e-05, "loss": 21.821, "step": 36350 }, { "epoch": 0.39, "learning_rate": 1.3847164041018941e-05, "loss": 21.1318, "step": 36360 }, { "epoch": 0.39, "learning_rate": 1.3843931930729387e-05, "loss": 21.2648, "step": 36370 }, { "epoch": 0.39, "learning_rate": 1.384069934919294e-05, "loss": 21.3104, "step": 36380 }, { "epoch": 0.39, "learning_rate": 1.3837466296805904e-05, "loss": 21.4551, "step": 36390 }, { "epoch": 0.39, "learning_rate": 1.3834232773964636e-05, "loss": 21.2201, "step": 36400 }, { "epoch": 0.39, "learning_rate": 1.3830998781065545e-05, "loss": 21.6827, "step": 36410 }, { "epoch": 0.39, "learning_rate": 1.3827764318505108e-05, "loss": 20.812, "step": 36420 }, { "epoch": 0.39, "learning_rate": 1.3824529386679853e-05, "loss": 21.3637, "step": 36430 }, { "epoch": 0.39, "learning_rate": 1.3821293985986363e-05, "loss": 21.2393, "step": 36440 }, { "epoch": 0.39, "learning_rate": 1.3818058116821282e-05, "loss": 21.6456, "step": 36450 }, { "epoch": 0.39, "learning_rate": 1.3814821779581318e-05, "loss": 20.9225, "step": 36460 }, { "epoch": 0.39, "learning_rate": 1.381158497466322e-05, "loss": 21.2887, "step": 36470 }, { "epoch": 0.39, "learning_rate": 1.3808347702463813e-05, "loss": 20.6327, "step": 36480 }, { "epoch": 0.39, "learning_rate": 1.3805109963379967e-05, "loss": 20.8868, "step": 36490 }, { "epoch": 0.39, "learning_rate": 1.3801871757808612e-05, "loss": 20.9635, "step": 36500 }, { "epoch": 0.39, "learning_rate": 1.3798633086146736e-05, "loss": 21.0455, "step": 36510 }, { "epoch": 0.39, "learning_rate": 1.3795393948791382e-05, "loss": 21.1336, "step": 36520 }, { "epoch": 0.39, "learning_rate": 1.3792154346139657e-05, "loss": 21.1081, "step": 36530 }, { "epoch": 0.4, "learning_rate": 1.3788914278588719e-05, "loss": 21.9311, "step": 36540 }, { "epoch": 0.4, "learning_rate": 1.378567374653578e-05, "loss": 21.16, "step": 36550 }, { "epoch": 0.4, "learning_rate": 1.3782432750378117e-05, "loss": 21.2553, "step": 36560 }, { "epoch": 0.4, "learning_rate": 1.3779191290513057e-05, "loss": 21.3089, "step": 36570 }, { "epoch": 0.4, "learning_rate": 1.3775949367337988e-05, "loss": 20.8622, "step": 36580 }, { "epoch": 0.4, "learning_rate": 1.3772706981250357e-05, "loss": 21.6832, "step": 36590 }, { "epoch": 0.4, "learning_rate": 1.3769464132647659e-05, "loss": 20.8205, "step": 36600 }, { "epoch": 0.4, "learning_rate": 1.3766220821927453e-05, "loss": 21.7955, "step": 36610 }, { "epoch": 0.4, "learning_rate": 1.3762977049487357e-05, "loss": 21.2354, "step": 36620 }, { "epoch": 0.4, "learning_rate": 1.3759732815725035e-05, "loss": 21.7288, "step": 36630 }, { "epoch": 0.4, "learning_rate": 1.3756488121038216e-05, "loss": 21.1888, "step": 36640 }, { "epoch": 0.4, "learning_rate": 1.3753242965824687e-05, "loss": 21.0926, "step": 36650 }, { "epoch": 0.4, "learning_rate": 1.374999735048228e-05, "loss": 21.8438, "step": 36660 }, { "epoch": 0.4, "learning_rate": 1.37467512754089e-05, "loss": 21.5407, "step": 36670 }, { "epoch": 0.4, "learning_rate": 1.3743504741002495e-05, "loss": 20.8154, "step": 36680 }, { "epoch": 0.4, "learning_rate": 1.374025774766107e-05, "loss": 21.1559, "step": 36690 }, { "epoch": 0.4, "learning_rate": 1.3737010295782702e-05, "loss": 21.5061, "step": 36700 }, { "epoch": 0.4, "learning_rate": 1.37337623857655e-05, "loss": 21.7917, "step": 36710 }, { "epoch": 0.4, "learning_rate": 1.373051401800765e-05, "loss": 21.8021, "step": 36720 }, { "epoch": 0.4, "learning_rate": 1.372726519290738e-05, "loss": 22.3536, "step": 36730 }, { "epoch": 0.4, "learning_rate": 1.3724015910862982e-05, "loss": 21.9233, "step": 36740 }, { "epoch": 0.4, "learning_rate": 1.3720766172272804e-05, "loss": 21.2794, "step": 36750 }, { "epoch": 0.4, "learning_rate": 1.3717515977535244e-05, "loss": 20.5255, "step": 36760 }, { "epoch": 0.4, "learning_rate": 1.371426532704876e-05, "loss": 20.918, "step": 36770 }, { "epoch": 0.4, "learning_rate": 1.3711014221211871e-05, "loss": 21.3836, "step": 36780 }, { "epoch": 0.4, "learning_rate": 1.3707762660423138e-05, "loss": 20.5418, "step": 36790 }, { "epoch": 0.4, "learning_rate": 1.3704510645081195e-05, "loss": 21.0181, "step": 36800 }, { "epoch": 0.4, "learning_rate": 1.3701258175584713e-05, "loss": 21.819, "step": 36810 }, { "epoch": 0.4, "learning_rate": 1.3698005252332435e-05, "loss": 21.1403, "step": 36820 }, { "epoch": 0.4, "learning_rate": 1.3694751875723155e-05, "loss": 21.1866, "step": 36830 }, { "epoch": 0.4, "learning_rate": 1.3691498046155715e-05, "loss": 21.4949, "step": 36840 }, { "epoch": 0.4, "learning_rate": 1.3688243764029024e-05, "loss": 21.0712, "step": 36850 }, { "epoch": 0.4, "learning_rate": 1.3684989029742032e-05, "loss": 21.5034, "step": 36860 }, { "epoch": 0.4, "learning_rate": 1.3681733843693766e-05, "loss": 21.1266, "step": 36870 }, { "epoch": 0.4, "learning_rate": 1.3678478206283283e-05, "loss": 21.0178, "step": 36880 }, { "epoch": 0.4, "learning_rate": 1.3675222117909716e-05, "loss": 21.0412, "step": 36890 }, { "epoch": 0.4, "learning_rate": 1.3671965578972244e-05, "loss": 21.7277, "step": 36900 }, { "epoch": 0.4, "learning_rate": 1.36687085898701e-05, "loss": 21.4726, "step": 36910 }, { "epoch": 0.4, "learning_rate": 1.3665451151002574e-05, "loss": 21.8562, "step": 36920 }, { "epoch": 0.4, "learning_rate": 1.3662193262769014e-05, "loss": 20.7965, "step": 36930 }, { "epoch": 0.4, "learning_rate": 1.3658934925568823e-05, "loss": 21.5026, "step": 36940 }, { "epoch": 0.4, "learning_rate": 1.3655676139801451e-05, "loss": 20.9165, "step": 36950 }, { "epoch": 0.4, "learning_rate": 1.3652416905866414e-05, "loss": 21.4897, "step": 36960 }, { "epoch": 0.4, "learning_rate": 1.3649157224163277e-05, "loss": 20.517, "step": 36970 }, { "epoch": 0.4, "learning_rate": 1.3645897095091655e-05, "loss": 21.7329, "step": 36980 }, { "epoch": 0.4, "learning_rate": 1.3642636519051232e-05, "loss": 21.4756, "step": 36990 }, { "epoch": 0.4, "learning_rate": 1.3639375496441733e-05, "loss": 21.4406, "step": 37000 }, { "epoch": 0.4, "learning_rate": 1.3636114027662947e-05, "loss": 20.8184, "step": 37010 }, { "epoch": 0.4, "learning_rate": 1.363285211311471e-05, "loss": 20.7085, "step": 37020 }, { "epoch": 0.4, "learning_rate": 1.3629589753196917e-05, "loss": 22.0433, "step": 37030 }, { "epoch": 0.4, "learning_rate": 1.362632694830952e-05, "loss": 21.3004, "step": 37040 }, { "epoch": 0.4, "learning_rate": 1.3623063698852521e-05, "loss": 21.6924, "step": 37050 }, { "epoch": 0.4, "learning_rate": 1.3619800005225976e-05, "loss": 20.9645, "step": 37060 }, { "epoch": 0.4, "learning_rate": 1.3616535867829998e-05, "loss": 21.2424, "step": 37070 }, { "epoch": 0.4, "learning_rate": 1.3613271287064758e-05, "loss": 21.2973, "step": 37080 }, { "epoch": 0.4, "learning_rate": 1.3610006263330475e-05, "loss": 21.7246, "step": 37090 }, { "epoch": 0.4, "learning_rate": 1.3606740797027423e-05, "loss": 21.9421, "step": 37100 }, { "epoch": 0.4, "learning_rate": 1.3603474888555932e-05, "loss": 21.3392, "step": 37110 }, { "epoch": 0.4, "learning_rate": 1.3600208538316386e-05, "loss": 22.1001, "step": 37120 }, { "epoch": 0.4, "learning_rate": 1.3596941746709229e-05, "loss": 21.5798, "step": 37130 }, { "epoch": 0.4, "learning_rate": 1.3593674514134947e-05, "loss": 20.8153, "step": 37140 }, { "epoch": 0.4, "learning_rate": 1.3590406840994088e-05, "loss": 21.5814, "step": 37150 }, { "epoch": 0.4, "learning_rate": 1.3587138727687253e-05, "loss": 20.3914, "step": 37160 }, { "epoch": 0.4, "learning_rate": 1.3583870174615092e-05, "loss": 21.7447, "step": 37170 }, { "epoch": 0.4, "learning_rate": 1.3580601182178323e-05, "loss": 21.3598, "step": 37180 }, { "epoch": 0.4, "learning_rate": 1.3577331750777703e-05, "loss": 20.8759, "step": 37190 }, { "epoch": 0.4, "learning_rate": 1.3574061880814042e-05, "loss": 20.7861, "step": 37200 }, { "epoch": 0.4, "learning_rate": 1.357079157268822e-05, "loss": 21.3529, "step": 37210 }, { "epoch": 0.4, "learning_rate": 1.3567520826801153e-05, "loss": 21.426, "step": 37220 }, { "epoch": 0.4, "learning_rate": 1.3564249643553823e-05, "loss": 21.143, "step": 37230 }, { "epoch": 0.4, "learning_rate": 1.356097802334726e-05, "loss": 21.3933, "step": 37240 }, { "epoch": 0.4, "learning_rate": 1.3557705966582541e-05, "loss": 21.6713, "step": 37250 }, { "epoch": 0.4, "learning_rate": 1.3554433473660818e-05, "loss": 21.1898, "step": 37260 }, { "epoch": 0.4, "learning_rate": 1.3551160544983265e-05, "loss": 21.7705, "step": 37270 }, { "epoch": 0.4, "learning_rate": 1.3547887180951143e-05, "loss": 21.3032, "step": 37280 }, { "epoch": 0.4, "learning_rate": 1.3544613381965743e-05, "loss": 21.2115, "step": 37290 }, { "epoch": 0.4, "learning_rate": 1.3541339148428411e-05, "loss": 20.9928, "step": 37300 }, { "epoch": 0.4, "learning_rate": 1.3538064480740563e-05, "loss": 21.2776, "step": 37310 }, { "epoch": 0.4, "learning_rate": 1.3534789379303647e-05, "loss": 21.3796, "step": 37320 }, { "epoch": 0.4, "learning_rate": 1.353151384451918e-05, "loss": 21.5717, "step": 37330 }, { "epoch": 0.4, "learning_rate": 1.3528237876788728e-05, "loss": 21.1576, "step": 37340 }, { "epoch": 0.4, "learning_rate": 1.3524961476513899e-05, "loss": 21.7849, "step": 37350 }, { "epoch": 0.4, "learning_rate": 1.352168464409637e-05, "loss": 21.3009, "step": 37360 }, { "epoch": 0.4, "learning_rate": 1.3518407379937863e-05, "loss": 21.7398, "step": 37370 }, { "epoch": 0.4, "learning_rate": 1.3515129684440158e-05, "loss": 20.8021, "step": 37380 }, { "epoch": 0.4, "learning_rate": 1.3511851558005078e-05, "loss": 21.152, "step": 37390 }, { "epoch": 0.4, "learning_rate": 1.3508573001034508e-05, "loss": 22.1949, "step": 37400 }, { "epoch": 0.4, "learning_rate": 1.3505294013930383e-05, "loss": 21.6833, "step": 37410 }, { "epoch": 0.4, "learning_rate": 1.350201459709469e-05, "loss": 21.8582, "step": 37420 }, { "epoch": 0.4, "learning_rate": 1.349873475092947e-05, "loss": 21.2098, "step": 37430 }, { "epoch": 0.4, "learning_rate": 1.3495454475836813e-05, "loss": 20.9828, "step": 37440 }, { "epoch": 0.4, "learning_rate": 1.3492173772218866e-05, "loss": 21.46, "step": 37450 }, { "epoch": 0.4, "learning_rate": 1.348889264047783e-05, "loss": 21.9479, "step": 37460 }, { "epoch": 0.41, "learning_rate": 1.3485611081015949e-05, "loss": 21.718, "step": 37470 }, { "epoch": 0.41, "learning_rate": 1.3482329094235531e-05, "loss": 21.4783, "step": 37480 }, { "epoch": 0.41, "learning_rate": 1.347904668053893e-05, "loss": 20.8174, "step": 37490 }, { "epoch": 0.41, "learning_rate": 1.347576384032855e-05, "loss": 21.1477, "step": 37500 }, { "epoch": 0.41, "learning_rate": 1.347248057400686e-05, "loss": 21.0785, "step": 37510 }, { "epoch": 0.41, "learning_rate": 1.346919688197636e-05, "loss": 21.8303, "step": 37520 }, { "epoch": 0.41, "learning_rate": 1.3465912764639624e-05, "loss": 21.4011, "step": 37530 }, { "epoch": 0.41, "learning_rate": 1.3462628222399263e-05, "loss": 21.1129, "step": 37540 }, { "epoch": 0.41, "learning_rate": 1.3459343255657946e-05, "loss": 21.3497, "step": 37550 }, { "epoch": 0.41, "learning_rate": 1.34560578648184e-05, "loss": 21.5243, "step": 37560 }, { "epoch": 0.41, "learning_rate": 1.3452772050283387e-05, "loss": 21.2922, "step": 37570 }, { "epoch": 0.41, "learning_rate": 1.3449485812455735e-05, "loss": 21.9105, "step": 37580 }, { "epoch": 0.41, "learning_rate": 1.344619915173833e-05, "loss": 21.8582, "step": 37590 }, { "epoch": 0.41, "learning_rate": 1.3442912068534087e-05, "loss": 20.7648, "step": 37600 }, { "epoch": 0.41, "learning_rate": 1.3439624563245995e-05, "loss": 21.6403, "step": 37610 }, { "epoch": 0.41, "learning_rate": 1.3436336636277078e-05, "loss": 21.659, "step": 37620 }, { "epoch": 0.41, "learning_rate": 1.3433048288030424e-05, "loss": 20.9649, "step": 37630 }, { "epoch": 0.41, "learning_rate": 1.342975951890917e-05, "loss": 21.7083, "step": 37640 }, { "epoch": 0.41, "learning_rate": 1.3426470329316497e-05, "loss": 21.6075, "step": 37650 }, { "epoch": 0.41, "learning_rate": 1.3423180719655649e-05, "loss": 21.6727, "step": 37660 }, { "epoch": 0.41, "learning_rate": 1.3419890690329915e-05, "loss": 21.8834, "step": 37670 }, { "epoch": 0.41, "learning_rate": 1.341660024174263e-05, "loss": 21.3389, "step": 37680 }, { "epoch": 0.41, "learning_rate": 1.3413309374297197e-05, "loss": 20.4465, "step": 37690 }, { "epoch": 0.41, "learning_rate": 1.3410018088397047e-05, "loss": 21.6095, "step": 37700 }, { "epoch": 0.41, "learning_rate": 1.3406726384445687e-05, "loss": 21.2334, "step": 37710 }, { "epoch": 0.41, "learning_rate": 1.3403434262846662e-05, "loss": 21.143, "step": 37720 }, { "epoch": 0.41, "learning_rate": 1.340014172400356e-05, "loss": 20.94, "step": 37730 }, { "epoch": 0.41, "learning_rate": 1.3396848768320039e-05, "loss": 21.8623, "step": 37740 }, { "epoch": 0.41, "learning_rate": 1.3393555396199799e-05, "loss": 21.6356, "step": 37750 }, { "epoch": 0.41, "learning_rate": 1.3390261608046582e-05, "loss": 20.6121, "step": 37760 }, { "epoch": 0.41, "learning_rate": 1.3386967404264201e-05, "loss": 21.303, "step": 37770 }, { "epoch": 0.41, "learning_rate": 1.33836727852565e-05, "loss": 21.7506, "step": 37780 }, { "epoch": 0.41, "learning_rate": 1.3380377751427392e-05, "loss": 21.2122, "step": 37790 }, { "epoch": 0.41, "learning_rate": 1.3377082303180826e-05, "loss": 20.5145, "step": 37800 }, { "epoch": 0.41, "learning_rate": 1.3373786440920806e-05, "loss": 20.7127, "step": 37810 }, { "epoch": 0.41, "learning_rate": 1.3370490165051393e-05, "loss": 21.6765, "step": 37820 }, { "epoch": 0.41, "learning_rate": 1.3367193475976689e-05, "loss": 21.8454, "step": 37830 }, { "epoch": 0.41, "learning_rate": 1.3363896374100858e-05, "loss": 20.9521, "step": 37840 }, { "epoch": 0.41, "learning_rate": 1.3360598859828105e-05, "loss": 21.5275, "step": 37850 }, { "epoch": 0.41, "learning_rate": 1.3357300933562682e-05, "loss": 21.4269, "step": 37860 }, { "epoch": 0.41, "learning_rate": 1.3354002595708909e-05, "loss": 21.1079, "step": 37870 }, { "epoch": 0.41, "learning_rate": 1.335070384667114e-05, "loss": 21.4369, "step": 37880 }, { "epoch": 0.41, "learning_rate": 1.3347404686853789e-05, "loss": 21.4515, "step": 37890 }, { "epoch": 0.41, "learning_rate": 1.3344105116661313e-05, "loss": 21.2952, "step": 37900 }, { "epoch": 0.41, "learning_rate": 1.3340805136498222e-05, "loss": 21.4797, "step": 37910 }, { "epoch": 0.41, "learning_rate": 1.3337504746769081e-05, "loss": 21.1108, "step": 37920 }, { "epoch": 0.41, "learning_rate": 1.33342039478785e-05, "loss": 21.1677, "step": 37930 }, { "epoch": 0.41, "learning_rate": 1.3330902740231137e-05, "loss": 21.6814, "step": 37940 }, { "epoch": 0.41, "learning_rate": 1.332760112423171e-05, "loss": 21.3942, "step": 37950 }, { "epoch": 0.41, "learning_rate": 1.3324299100284973e-05, "loss": 20.3068, "step": 37960 }, { "epoch": 0.41, "learning_rate": 1.3320996668795747e-05, "loss": 21.4316, "step": 37970 }, { "epoch": 0.41, "learning_rate": 1.3317693830168886e-05, "loss": 21.4168, "step": 37980 }, { "epoch": 0.41, "learning_rate": 1.3314390584809304e-05, "loss": 21.2671, "step": 37990 }, { "epoch": 0.41, "learning_rate": 1.3311086933121961e-05, "loss": 21.0558, "step": 38000 }, { "epoch": 0.41, "learning_rate": 1.330778287551187e-05, "loss": 20.9657, "step": 38010 }, { "epoch": 0.41, "learning_rate": 1.3304478412384097e-05, "loss": 21.2537, "step": 38020 }, { "epoch": 0.41, "learning_rate": 1.3301173544143742e-05, "loss": 21.5307, "step": 38030 }, { "epoch": 0.41, "learning_rate": 1.3297868271195973e-05, "loss": 20.8342, "step": 38040 }, { "epoch": 0.41, "learning_rate": 1.3294562593945997e-05, "loss": 21.2124, "step": 38050 }, { "epoch": 0.41, "learning_rate": 1.3291256512799071e-05, "loss": 21.2362, "step": 38060 }, { "epoch": 0.41, "learning_rate": 1.3287950028160512e-05, "loss": 21.5948, "step": 38070 }, { "epoch": 0.41, "learning_rate": 1.3284643140435671e-05, "loss": 20.9739, "step": 38080 }, { "epoch": 0.41, "learning_rate": 1.328133585002996e-05, "loss": 20.4482, "step": 38090 }, { "epoch": 0.41, "learning_rate": 1.3278028157348837e-05, "loss": 20.8839, "step": 38100 }, { "epoch": 0.41, "learning_rate": 1.3274720062797801e-05, "loss": 21.22, "step": 38110 }, { "epoch": 0.41, "learning_rate": 1.327141156678242e-05, "loss": 22.5368, "step": 38120 }, { "epoch": 0.41, "learning_rate": 1.3268102669708292e-05, "loss": 21.8541, "step": 38130 }, { "epoch": 0.41, "learning_rate": 1.3264793371981066e-05, "loss": 21.0746, "step": 38140 }, { "epoch": 0.41, "learning_rate": 1.326148367400646e-05, "loss": 22.0282, "step": 38150 }, { "epoch": 0.41, "learning_rate": 1.3258173576190209e-05, "loss": 21.2936, "step": 38160 }, { "epoch": 0.41, "learning_rate": 1.3254863078938129e-05, "loss": 20.8277, "step": 38170 }, { "epoch": 0.41, "learning_rate": 1.3251552182656066e-05, "loss": 22.1128, "step": 38180 }, { "epoch": 0.41, "learning_rate": 1.3248240887749913e-05, "loss": 21.2258, "step": 38190 }, { "epoch": 0.41, "learning_rate": 1.3244929194625627e-05, "loss": 21.2001, "step": 38200 }, { "epoch": 0.41, "learning_rate": 1.32416171036892e-05, "loss": 21.2737, "step": 38210 }, { "epoch": 0.41, "learning_rate": 1.323830461534668e-05, "loss": 21.5478, "step": 38220 }, { "epoch": 0.41, "learning_rate": 1.3234991730004163e-05, "loss": 21.688, "step": 38230 }, { "epoch": 0.41, "learning_rate": 1.3231678448067789e-05, "loss": 21.1628, "step": 38240 }, { "epoch": 0.41, "learning_rate": 1.3228364769943749e-05, "loss": 21.0453, "step": 38250 }, { "epoch": 0.41, "learning_rate": 1.3225050696038286e-05, "loss": 22.7574, "step": 38260 }, { "epoch": 0.41, "learning_rate": 1.322173622675769e-05, "loss": 21.3282, "step": 38270 }, { "epoch": 0.41, "learning_rate": 1.3218421362508297e-05, "loss": 21.2898, "step": 38280 }, { "epoch": 0.41, "learning_rate": 1.321510610369649e-05, "loss": 21.8581, "step": 38290 }, { "epoch": 0.41, "learning_rate": 1.3211790450728707e-05, "loss": 21.3344, "step": 38300 }, { "epoch": 0.41, "learning_rate": 1.3208474404011429e-05, "loss": 21.2439, "step": 38310 }, { "epoch": 0.41, "learning_rate": 1.3205157963951188e-05, "loss": 21.5681, "step": 38320 }, { "epoch": 0.41, "learning_rate": 1.3201841130954563e-05, "loss": 21.355, "step": 38330 }, { "epoch": 0.41, "learning_rate": 1.3198523905428178e-05, "loss": 21.1416, "step": 38340 }, { "epoch": 0.41, "learning_rate": 1.3195206287778712e-05, "loss": 21.7534, "step": 38350 }, { "epoch": 0.41, "learning_rate": 1.3191888278412886e-05, "loss": 21.7948, "step": 38360 }, { "epoch": 0.41, "learning_rate": 1.3188569877737474e-05, "loss": 21.0281, "step": 38370 }, { "epoch": 0.41, "learning_rate": 1.3185251086159292e-05, "loss": 21.522, "step": 38380 }, { "epoch": 0.42, "learning_rate": 1.318193190408521e-05, "loss": 21.825, "step": 38390 }, { "epoch": 0.42, "learning_rate": 1.3178612331922143e-05, "loss": 21.4967, "step": 38400 }, { "epoch": 0.42, "learning_rate": 1.317529237007705e-05, "loss": 21.7434, "step": 38410 }, { "epoch": 0.42, "learning_rate": 1.3171972018956948e-05, "loss": 20.9388, "step": 38420 }, { "epoch": 0.42, "learning_rate": 1.316865127896889e-05, "loss": 21.6253, "step": 38430 }, { "epoch": 0.42, "learning_rate": 1.316533015051999e-05, "loss": 21.3691, "step": 38440 }, { "epoch": 0.42, "learning_rate": 1.316200863401739e-05, "loss": 21.6935, "step": 38450 }, { "epoch": 0.42, "learning_rate": 1.3158686729868304e-05, "loss": 21.4182, "step": 38460 }, { "epoch": 0.42, "learning_rate": 1.3155364438479969e-05, "loss": 21.3836, "step": 38470 }, { "epoch": 0.42, "learning_rate": 1.3152041760259691e-05, "loss": 21.4933, "step": 38480 }, { "epoch": 0.42, "learning_rate": 1.3148718695614808e-05, "loss": 21.3255, "step": 38490 }, { "epoch": 0.42, "learning_rate": 1.3145395244952712e-05, "loss": 20.8277, "step": 38500 }, { "epoch": 0.42, "learning_rate": 1.3142071408680845e-05, "loss": 22.3681, "step": 38510 }, { "epoch": 0.42, "learning_rate": 1.3138747187206686e-05, "loss": 21.1811, "step": 38520 }, { "epoch": 0.42, "learning_rate": 1.3135422580937777e-05, "loss": 20.4909, "step": 38530 }, { "epoch": 0.42, "learning_rate": 1.3132097590281692e-05, "loss": 21.2939, "step": 38540 }, { "epoch": 0.42, "learning_rate": 1.3128772215646058e-05, "loss": 21.3409, "step": 38550 }, { "epoch": 0.42, "learning_rate": 1.3125446457438553e-05, "loss": 20.9308, "step": 38560 }, { "epoch": 0.42, "learning_rate": 1.3122120316066896e-05, "loss": 21.7677, "step": 38570 }, { "epoch": 0.42, "learning_rate": 1.3118793791938856e-05, "loss": 22.4843, "step": 38580 }, { "epoch": 0.42, "learning_rate": 1.3115466885462246e-05, "loss": 21.4681, "step": 38590 }, { "epoch": 0.42, "learning_rate": 1.3112139597044928e-05, "loss": 21.3759, "step": 38600 }, { "epoch": 0.42, "learning_rate": 1.310881192709482e-05, "loss": 20.967, "step": 38610 }, { "epoch": 0.42, "learning_rate": 1.3105483876019865e-05, "loss": 21.5025, "step": 38620 }, { "epoch": 0.42, "learning_rate": 1.3102155444228072e-05, "loss": 20.3812, "step": 38630 }, { "epoch": 0.42, "learning_rate": 1.3098826632127495e-05, "loss": 20.8746, "step": 38640 }, { "epoch": 0.42, "learning_rate": 1.3095497440126217e-05, "loss": 20.9567, "step": 38650 }, { "epoch": 0.42, "learning_rate": 1.3092167868632392e-05, "loss": 22.1854, "step": 38660 }, { "epoch": 0.42, "learning_rate": 1.3088837918054202e-05, "loss": 21.6014, "step": 38670 }, { "epoch": 0.42, "learning_rate": 1.3085507588799886e-05, "loss": 21.2234, "step": 38680 }, { "epoch": 0.42, "learning_rate": 1.3082176881277726e-05, "loss": 21.4272, "step": 38690 }, { "epoch": 0.42, "learning_rate": 1.3078845795896044e-05, "loss": 21.0838, "step": 38700 }, { "epoch": 0.42, "learning_rate": 1.3075514333063221e-05, "loss": 21.3791, "step": 38710 }, { "epoch": 0.42, "learning_rate": 1.3072182493187677e-05, "loss": 21.3101, "step": 38720 }, { "epoch": 0.42, "learning_rate": 1.306885027667788e-05, "loss": 20.6627, "step": 38730 }, { "epoch": 0.42, "learning_rate": 1.3065517683942339e-05, "loss": 21.7709, "step": 38740 }, { "epoch": 0.42, "learning_rate": 1.3062184715389612e-05, "loss": 21.8192, "step": 38750 }, { "epoch": 0.42, "learning_rate": 1.3058851371428312e-05, "loss": 21.7772, "step": 38760 }, { "epoch": 0.42, "learning_rate": 1.3055517652467083e-05, "loss": 20.6774, "step": 38770 }, { "epoch": 0.42, "learning_rate": 1.3052183558914626e-05, "loss": 21.3858, "step": 38780 }, { "epoch": 0.42, "learning_rate": 1.3048849091179685e-05, "loss": 21.3949, "step": 38790 }, { "epoch": 0.42, "learning_rate": 1.3045514249671046e-05, "loss": 21.3499, "step": 38800 }, { "epoch": 0.42, "learning_rate": 1.3042179034797544e-05, "loss": 21.3323, "step": 38810 }, { "epoch": 0.42, "learning_rate": 1.3038843446968064e-05, "loss": 21.4113, "step": 38820 }, { "epoch": 0.42, "learning_rate": 1.3035507486591527e-05, "loss": 20.433, "step": 38830 }, { "epoch": 0.42, "learning_rate": 1.3032171154076909e-05, "loss": 21.7003, "step": 38840 }, { "epoch": 0.42, "learning_rate": 1.3028834449833228e-05, "loss": 21.2066, "step": 38850 }, { "epoch": 0.42, "learning_rate": 1.3025497374269542e-05, "loss": 21.3324, "step": 38860 }, { "epoch": 0.42, "learning_rate": 1.3022159927794969e-05, "loss": 21.013, "step": 38870 }, { "epoch": 0.42, "learning_rate": 1.3018822110818654e-05, "loss": 21.2987, "step": 38880 }, { "epoch": 0.42, "learning_rate": 1.3015483923749802e-05, "loss": 21.1619, "step": 38890 }, { "epoch": 0.42, "learning_rate": 1.3012145366997655e-05, "loss": 21.5253, "step": 38900 }, { "epoch": 0.42, "learning_rate": 1.3008806440971506e-05, "loss": 21.0636, "step": 38910 }, { "epoch": 0.42, "learning_rate": 1.300546714608069e-05, "loss": 22.1499, "step": 38920 }, { "epoch": 0.42, "learning_rate": 1.3002127482734588e-05, "loss": 21.4276, "step": 38930 }, { "epoch": 0.42, "learning_rate": 1.2998787451342625e-05, "loss": 22.2916, "step": 38940 }, { "epoch": 0.42, "learning_rate": 1.2995447052314272e-05, "loss": 21.224, "step": 38950 }, { "epoch": 0.42, "learning_rate": 1.2992106286059047e-05, "loss": 21.263, "step": 38960 }, { "epoch": 0.42, "learning_rate": 1.2988765152986513e-05, "loss": 21.3005, "step": 38970 }, { "epoch": 0.42, "learning_rate": 1.2985423653506269e-05, "loss": 20.5258, "step": 38980 }, { "epoch": 0.42, "learning_rate": 1.2982081788027975e-05, "loss": 20.8138, "step": 38990 }, { "epoch": 0.42, "learning_rate": 1.2978739556961322e-05, "loss": 21.7663, "step": 39000 }, { "epoch": 0.42, "learning_rate": 1.2975396960716051e-05, "loss": 21.2998, "step": 39010 }, { "epoch": 0.42, "learning_rate": 1.297205399970195e-05, "loss": 21.6158, "step": 39020 }, { "epoch": 0.42, "learning_rate": 1.2968710674328846e-05, "loss": 20.9274, "step": 39030 }, { "epoch": 0.42, "learning_rate": 1.2965366985006618e-05, "loss": 20.9673, "step": 39040 }, { "epoch": 0.42, "learning_rate": 1.2962022932145182e-05, "loss": 21.571, "step": 39050 }, { "epoch": 0.42, "learning_rate": 1.2958678516154502e-05, "loss": 20.8661, "step": 39060 }, { "epoch": 0.42, "learning_rate": 1.2955333737444592e-05, "loss": 20.7788, "step": 39070 }, { "epoch": 0.42, "learning_rate": 1.2951988596425498e-05, "loss": 21.5105, "step": 39080 }, { "epoch": 0.42, "learning_rate": 1.2948643093507326e-05, "loss": 21.3875, "step": 39090 }, { "epoch": 0.42, "learning_rate": 1.294529722910021e-05, "loss": 21.2266, "step": 39100 }, { "epoch": 0.42, "learning_rate": 1.2941951003614337e-05, "loss": 21.5863, "step": 39110 }, { "epoch": 0.42, "learning_rate": 1.2938604417459945e-05, "loss": 21.9278, "step": 39120 }, { "epoch": 0.42, "learning_rate": 1.29352574710473e-05, "loss": 21.1404, "step": 39130 }, { "epoch": 0.42, "learning_rate": 1.2931910164786726e-05, "loss": 21.1534, "step": 39140 }, { "epoch": 0.42, "learning_rate": 1.2928562499088587e-05, "loss": 21.5023, "step": 39150 }, { "epoch": 0.42, "learning_rate": 1.2925214474363283e-05, "loss": 21.6048, "step": 39160 }, { "epoch": 0.42, "learning_rate": 1.2921866091021276e-05, "loss": 21.8077, "step": 39170 }, { "epoch": 0.42, "learning_rate": 1.291851734947305e-05, "loss": 22.3039, "step": 39180 }, { "epoch": 0.42, "learning_rate": 1.2915168250129152e-05, "loss": 21.6205, "step": 39190 }, { "epoch": 0.42, "learning_rate": 1.2911818793400164e-05, "loss": 21.1204, "step": 39200 }, { "epoch": 0.42, "learning_rate": 1.2908468979696707e-05, "loss": 21.5095, "step": 39210 }, { "epoch": 0.42, "learning_rate": 1.2905118809429455e-05, "loss": 21.2037, "step": 39220 }, { "epoch": 0.42, "learning_rate": 1.2901768283009127e-05, "loss": 21.6346, "step": 39230 }, { "epoch": 0.42, "learning_rate": 1.289841740084647e-05, "loss": 21.2899, "step": 39240 }, { "epoch": 0.42, "learning_rate": 1.2895066163352296e-05, "loss": 21.5116, "step": 39250 }, { "epoch": 0.42, "learning_rate": 1.2891714570937446e-05, "loss": 20.8601, "step": 39260 }, { "epoch": 0.42, "learning_rate": 1.2888362624012807e-05, "loss": 20.7133, "step": 39270 }, { "epoch": 0.42, "learning_rate": 1.2885010322989311e-05, "loss": 21.2673, "step": 39280 }, { "epoch": 0.42, "learning_rate": 1.2881657668277936e-05, "loss": 21.1595, "step": 39290 }, { "epoch": 0.42, "learning_rate": 1.2878304660289698e-05, "loss": 21.4439, "step": 39300 }, { "epoch": 0.42, "learning_rate": 1.2874951299435663e-05, "loss": 21.6153, "step": 39310 }, { "epoch": 0.43, "learning_rate": 1.2871597586126932e-05, "loss": 21.2061, "step": 39320 }, { "epoch": 0.43, "learning_rate": 1.2868243520774654e-05, "loss": 21.2966, "step": 39330 }, { "epoch": 0.43, "learning_rate": 1.2864889103790024e-05, "loss": 21.9294, "step": 39340 }, { "epoch": 0.43, "learning_rate": 1.2861534335584274e-05, "loss": 21.533, "step": 39350 }, { "epoch": 0.43, "learning_rate": 1.2858179216568682e-05, "loss": 21.0947, "step": 39360 }, { "epoch": 0.43, "learning_rate": 1.285482374715457e-05, "loss": 22.2089, "step": 39370 }, { "epoch": 0.43, "learning_rate": 1.28514679277533e-05, "loss": 21.7586, "step": 39380 }, { "epoch": 0.43, "learning_rate": 1.2848111758776283e-05, "loss": 20.8855, "step": 39390 }, { "epoch": 0.43, "learning_rate": 1.2844755240634964e-05, "loss": 21.6492, "step": 39400 }, { "epoch": 0.43, "learning_rate": 1.2841398373740835e-05, "loss": 21.3194, "step": 39410 }, { "epoch": 0.43, "learning_rate": 1.2838041158505437e-05, "loss": 21.5142, "step": 39420 }, { "epoch": 0.43, "learning_rate": 1.283468359534034e-05, "loss": 21.6899, "step": 39430 }, { "epoch": 0.43, "learning_rate": 1.283132568465717e-05, "loss": 21.2262, "step": 39440 }, { "epoch": 0.43, "learning_rate": 1.2827967426867591e-05, "loss": 20.4106, "step": 39450 }, { "epoch": 0.43, "learning_rate": 1.2824608822383304e-05, "loss": 21.8307, "step": 39460 }, { "epoch": 0.43, "learning_rate": 1.282124987161606e-05, "loss": 21.7357, "step": 39470 }, { "epoch": 0.43, "learning_rate": 1.2817890574977648e-05, "loss": 21.3218, "step": 39480 }, { "epoch": 0.43, "learning_rate": 1.2814530932879899e-05, "loss": 21.8133, "step": 39490 }, { "epoch": 0.43, "learning_rate": 1.2811170945734696e-05, "loss": 20.8588, "step": 39500 }, { "epoch": 0.43, "learning_rate": 1.2807810613953953e-05, "loss": 21.2721, "step": 39510 }, { "epoch": 0.43, "learning_rate": 1.2804449937949626e-05, "loss": 21.2708, "step": 39520 }, { "epoch": 0.43, "learning_rate": 1.280108891813372e-05, "loss": 20.6195, "step": 39530 }, { "epoch": 0.43, "learning_rate": 1.2797727554918277e-05, "loss": 21.4353, "step": 39540 }, { "epoch": 0.43, "learning_rate": 1.2794365848715393e-05, "loss": 20.9086, "step": 39550 }, { "epoch": 0.43, "learning_rate": 1.2791003799937185e-05, "loss": 21.1186, "step": 39560 }, { "epoch": 0.43, "learning_rate": 1.2787641408995825e-05, "loss": 21.7268, "step": 39570 }, { "epoch": 0.43, "learning_rate": 1.2784278676303532e-05, "loss": 21.1793, "step": 39580 }, { "epoch": 0.43, "learning_rate": 1.2780915602272554e-05, "loss": 21.3805, "step": 39590 }, { "epoch": 0.43, "learning_rate": 1.277755218731519e-05, "loss": 21.8044, "step": 39600 }, { "epoch": 0.43, "learning_rate": 1.277418843184378e-05, "loss": 21.3268, "step": 39610 }, { "epoch": 0.43, "learning_rate": 1.2770824336270695e-05, "loss": 21.4199, "step": 39620 }, { "epoch": 0.43, "learning_rate": 1.2767459901008367e-05, "loss": 21.5143, "step": 39630 }, { "epoch": 0.43, "learning_rate": 1.2764095126469251e-05, "loss": 20.7156, "step": 39640 }, { "epoch": 0.43, "learning_rate": 1.2760730013065856e-05, "loss": 21.0907, "step": 39650 }, { "epoch": 0.43, "learning_rate": 1.275736456121073e-05, "loss": 20.8103, "step": 39660 }, { "epoch": 0.43, "learning_rate": 1.2753998771316453e-05, "loss": 20.8888, "step": 39670 }, { "epoch": 0.43, "learning_rate": 1.2750632643795659e-05, "loss": 21.0968, "step": 39680 }, { "epoch": 0.43, "learning_rate": 1.274726617906102e-05, "loss": 21.7395, "step": 39690 }, { "epoch": 0.43, "learning_rate": 1.2743899377525243e-05, "loss": 21.4695, "step": 39700 }, { "epoch": 0.43, "learning_rate": 1.2740532239601091e-05, "loss": 21.3237, "step": 39710 }, { "epoch": 0.43, "learning_rate": 1.2737164765701344e-05, "loss": 21.6089, "step": 39720 }, { "epoch": 0.43, "learning_rate": 1.2733796956238846e-05, "loss": 21.0429, "step": 39730 }, { "epoch": 0.43, "learning_rate": 1.2730428811626475e-05, "loss": 21.2263, "step": 39740 }, { "epoch": 0.43, "learning_rate": 1.2727060332277143e-05, "loss": 21.1939, "step": 39750 }, { "epoch": 0.43, "learning_rate": 1.2723691518603813e-05, "loss": 21.315, "step": 39760 }, { "epoch": 0.43, "learning_rate": 1.2720322371019485e-05, "loss": 21.6785, "step": 39770 }, { "epoch": 0.43, "learning_rate": 1.2716952889937195e-05, "loss": 20.7549, "step": 39780 }, { "epoch": 0.43, "learning_rate": 1.2713583075770031e-05, "loss": 21.1023, "step": 39790 }, { "epoch": 0.43, "learning_rate": 1.2710212928931111e-05, "loss": 21.652, "step": 39800 }, { "epoch": 0.43, "learning_rate": 1.2706842449833601e-05, "loss": 20.9383, "step": 39810 }, { "epoch": 0.43, "learning_rate": 1.2703471638890701e-05, "loss": 21.5922, "step": 39820 }, { "epoch": 0.43, "learning_rate": 1.2700100496515659e-05, "loss": 21.086, "step": 39830 }, { "epoch": 0.43, "learning_rate": 1.269672902312176e-05, "loss": 21.5124, "step": 39840 }, { "epoch": 0.43, "learning_rate": 1.2693357219122331e-05, "loss": 20.9852, "step": 39850 }, { "epoch": 0.43, "learning_rate": 1.2689985084930734e-05, "loss": 21.1063, "step": 39860 }, { "epoch": 0.43, "learning_rate": 1.2686612620960376e-05, "loss": 21.4694, "step": 39870 }, { "epoch": 0.43, "learning_rate": 1.2683239827624711e-05, "loss": 21.4461, "step": 39880 }, { "epoch": 0.43, "learning_rate": 1.2679866705337221e-05, "loss": 21.1255, "step": 39890 }, { "epoch": 0.43, "learning_rate": 1.2676493254511434e-05, "loss": 21.3887, "step": 39900 }, { "epoch": 0.43, "learning_rate": 1.267311947556092e-05, "loss": 21.1185, "step": 39910 }, { "epoch": 0.43, "learning_rate": 1.2669745368899284e-05, "loss": 20.8085, "step": 39920 }, { "epoch": 0.43, "learning_rate": 1.2666370934940184e-05, "loss": 21.2466, "step": 39930 }, { "epoch": 0.43, "learning_rate": 1.26629961740973e-05, "loss": 21.1039, "step": 39940 }, { "epoch": 0.43, "learning_rate": 1.2659621086784359e-05, "loss": 21.0722, "step": 39950 }, { "epoch": 0.43, "learning_rate": 1.265624567341514e-05, "loss": 20.7882, "step": 39960 }, { "epoch": 0.43, "learning_rate": 1.2652869934403443e-05, "loss": 21.1107, "step": 39970 }, { "epoch": 0.43, "learning_rate": 1.264949387016312e-05, "loss": 21.4219, "step": 39980 }, { "epoch": 0.43, "learning_rate": 1.264611748110806e-05, "loss": 20.8985, "step": 39990 }, { "epoch": 0.43, "learning_rate": 1.2642740767652189e-05, "loss": 21.1523, "step": 40000 }, { "epoch": 0.43, "learning_rate": 1.2639363730209479e-05, "loss": 21.6251, "step": 40010 }, { "epoch": 0.43, "learning_rate": 1.2635986369193934e-05, "loss": 21.3536, "step": 40020 }, { "epoch": 0.43, "learning_rate": 1.2632608685019605e-05, "loss": 21.5121, "step": 40030 }, { "epoch": 0.43, "learning_rate": 1.2629230678100579e-05, "loss": 21.5462, "step": 40040 }, { "epoch": 0.43, "learning_rate": 1.262585234885098e-05, "loss": 21.0867, "step": 40050 }, { "epoch": 0.43, "learning_rate": 1.2622473697684978e-05, "loss": 20.7955, "step": 40060 }, { "epoch": 0.43, "learning_rate": 1.2619094725016773e-05, "loss": 20.7949, "step": 40070 }, { "epoch": 0.43, "learning_rate": 1.2615715431260618e-05, "loss": 20.9988, "step": 40080 }, { "epoch": 0.43, "learning_rate": 1.2612335816830793e-05, "loss": 20.9118, "step": 40090 }, { "epoch": 0.43, "learning_rate": 1.260895588214162e-05, "loss": 21.3323, "step": 40100 }, { "epoch": 0.43, "learning_rate": 1.2605575627607465e-05, "loss": 21.5012, "step": 40110 }, { "epoch": 0.43, "learning_rate": 1.2602195053642731e-05, "loss": 20.7789, "step": 40120 }, { "epoch": 0.43, "learning_rate": 1.2598814160661859e-05, "loss": 21.3344, "step": 40130 }, { "epoch": 0.43, "learning_rate": 1.2595432949079329e-05, "loss": 20.9485, "step": 40140 }, { "epoch": 0.43, "learning_rate": 1.259205141930966e-05, "loss": 21.8961, "step": 40150 }, { "epoch": 0.43, "learning_rate": 1.258866957176741e-05, "loss": 21.8109, "step": 40160 }, { "epoch": 0.43, "learning_rate": 1.2585287406867181e-05, "loss": 21.474, "step": 40170 }, { "epoch": 0.43, "learning_rate": 1.2581904925023602e-05, "loss": 21.7279, "step": 40180 }, { "epoch": 0.43, "learning_rate": 1.2578522126651358e-05, "loss": 21.4464, "step": 40190 }, { "epoch": 0.43, "learning_rate": 1.2575139012165156e-05, "loss": 21.3715, "step": 40200 }, { "epoch": 0.43, "learning_rate": 1.2571755581979752e-05, "loss": 21.4034, "step": 40210 }, { "epoch": 0.43, "learning_rate": 1.2568371836509936e-05, "loss": 21.5877, "step": 40220 }, { "epoch": 0.43, "learning_rate": 1.256498777617054e-05, "loss": 21.594, "step": 40230 }, { "epoch": 0.44, "learning_rate": 1.2561603401376432e-05, "loss": 21.4029, "step": 40240 }, { "epoch": 0.44, "learning_rate": 1.255821871254252e-05, "loss": 21.3477, "step": 40250 }, { "epoch": 0.44, "learning_rate": 1.2554833710083746e-05, "loss": 21.936, "step": 40260 }, { "epoch": 0.44, "learning_rate": 1.2551448394415103e-05, "loss": 21.2215, "step": 40270 }, { "epoch": 0.44, "learning_rate": 1.2548062765951608e-05, "loss": 21.5664, "step": 40280 }, { "epoch": 0.44, "learning_rate": 1.2544676825108319e-05, "loss": 20.7595, "step": 40290 }, { "epoch": 0.44, "learning_rate": 1.2541290572300344e-05, "loss": 21.6629, "step": 40300 }, { "epoch": 0.44, "learning_rate": 1.2537904007942814e-05, "loss": 21.4685, "step": 40310 }, { "epoch": 0.44, "learning_rate": 1.2534517132450908e-05, "loss": 21.3121, "step": 40320 }, { "epoch": 0.44, "learning_rate": 1.253112994623984e-05, "loss": 21.7438, "step": 40330 }, { "epoch": 0.44, "learning_rate": 1.2527742449724857e-05, "loss": 22.0385, "step": 40340 }, { "epoch": 0.44, "learning_rate": 1.2524354643321257e-05, "loss": 20.6011, "step": 40350 }, { "epoch": 0.44, "learning_rate": 1.2520966527444365e-05, "loss": 21.6979, "step": 40360 }, { "epoch": 0.44, "learning_rate": 1.2517578102509545e-05, "loss": 21.1729, "step": 40370 }, { "epoch": 0.44, "learning_rate": 1.2514189368932201e-05, "loss": 20.6752, "step": 40380 }, { "epoch": 0.44, "learning_rate": 1.251080032712778e-05, "loss": 21.7365, "step": 40390 }, { "epoch": 0.44, "learning_rate": 1.2507410977511758e-05, "loss": 21.3262, "step": 40400 }, { "epoch": 0.44, "learning_rate": 1.250402132049965e-05, "loss": 20.9567, "step": 40410 }, { "epoch": 0.44, "learning_rate": 1.2500631356507018e-05, "loss": 21.1393, "step": 40420 }, { "epoch": 0.44, "learning_rate": 1.2497241085949445e-05, "loss": 21.0615, "step": 40430 }, { "epoch": 0.44, "learning_rate": 1.2493850509242571e-05, "loss": 21.9197, "step": 40440 }, { "epoch": 0.44, "learning_rate": 1.2490459626802056e-05, "loss": 21.4995, "step": 40450 }, { "epoch": 0.44, "learning_rate": 1.2487068439043608e-05, "loss": 21.7086, "step": 40460 }, { "epoch": 0.44, "learning_rate": 1.2483676946382976e-05, "loss": 20.9577, "step": 40470 }, { "epoch": 0.44, "learning_rate": 1.2480285149235928e-05, "loss": 21.1373, "step": 40480 }, { "epoch": 0.44, "learning_rate": 1.2476893048018293e-05, "loss": 20.8434, "step": 40490 }, { "epoch": 0.44, "learning_rate": 1.2473500643145917e-05, "loss": 21.1723, "step": 40500 }, { "epoch": 0.44, "learning_rate": 1.2470107935034697e-05, "loss": 21.873, "step": 40510 }, { "epoch": 0.44, "learning_rate": 1.246671492410056e-05, "loss": 21.5412, "step": 40520 }, { "epoch": 0.44, "learning_rate": 1.2463321610759472e-05, "loss": 21.2209, "step": 40530 }, { "epoch": 0.44, "learning_rate": 1.2459927995427439e-05, "loss": 20.9775, "step": 40540 }, { "epoch": 0.44, "learning_rate": 1.24565340785205e-05, "loss": 21.2931, "step": 40550 }, { "epoch": 0.44, "learning_rate": 1.2453139860454728e-05, "loss": 21.1865, "step": 40560 }, { "epoch": 0.44, "learning_rate": 1.2449745341646242e-05, "loss": 21.0351, "step": 40570 }, { "epoch": 0.44, "learning_rate": 1.2446350522511193e-05, "loss": 20.4533, "step": 40580 }, { "epoch": 0.44, "learning_rate": 1.2442955403465768e-05, "loss": 21.178, "step": 40590 }, { "epoch": 0.44, "learning_rate": 1.2439559984926196e-05, "loss": 21.3289, "step": 40600 }, { "epoch": 0.44, "learning_rate": 1.2436164267308725e-05, "loss": 21.0351, "step": 40610 }, { "epoch": 0.44, "learning_rate": 1.2432768251029667e-05, "loss": 20.454, "step": 40620 }, { "epoch": 0.44, "learning_rate": 1.242937193650535e-05, "loss": 21.2001, "step": 40630 }, { "epoch": 0.44, "learning_rate": 1.2425975324152149e-05, "loss": 20.7288, "step": 40640 }, { "epoch": 0.44, "learning_rate": 1.2422578414386468e-05, "loss": 21.5619, "step": 40650 }, { "epoch": 0.44, "learning_rate": 1.2419181207624753e-05, "loss": 20.8854, "step": 40660 }, { "epoch": 0.44, "learning_rate": 1.2415783704283487e-05, "loss": 20.953, "step": 40670 }, { "epoch": 0.44, "learning_rate": 1.241238590477918e-05, "loss": 20.5247, "step": 40680 }, { "epoch": 0.44, "learning_rate": 1.2408987809528392e-05, "loss": 21.4737, "step": 40690 }, { "epoch": 0.44, "learning_rate": 1.240558941894771e-05, "loss": 21.4318, "step": 40700 }, { "epoch": 0.44, "learning_rate": 1.2402190733453761e-05, "loss": 21.175, "step": 40710 }, { "epoch": 0.44, "learning_rate": 1.2398791753463204e-05, "loss": 21.8893, "step": 40720 }, { "epoch": 0.44, "learning_rate": 1.2395392479392738e-05, "loss": 20.9275, "step": 40730 }, { "epoch": 0.44, "learning_rate": 1.23919929116591e-05, "loss": 21.0199, "step": 40740 }, { "epoch": 0.44, "learning_rate": 1.2388593050679058e-05, "loss": 21.206, "step": 40750 }, { "epoch": 0.44, "learning_rate": 1.2385192896869418e-05, "loss": 20.9844, "step": 40760 }, { "epoch": 0.44, "learning_rate": 1.238179245064702e-05, "loss": 21.7805, "step": 40770 }, { "epoch": 0.44, "learning_rate": 1.2378391712428746e-05, "loss": 21.3807, "step": 40780 }, { "epoch": 0.44, "learning_rate": 1.2374990682631505e-05, "loss": 21.2982, "step": 40790 }, { "epoch": 0.44, "learning_rate": 1.2371589361672249e-05, "loss": 20.9623, "step": 40800 }, { "epoch": 0.44, "learning_rate": 1.2368187749967961e-05, "loss": 21.0271, "step": 40810 }, { "epoch": 0.44, "learning_rate": 1.2364785847935665e-05, "loss": 21.372, "step": 40820 }, { "epoch": 0.44, "learning_rate": 1.2361383655992416e-05, "loss": 21.2601, "step": 40830 }, { "epoch": 0.44, "learning_rate": 1.2357981174555305e-05, "loss": 21.914, "step": 40840 }, { "epoch": 0.44, "learning_rate": 1.2354578404041457e-05, "loss": 21.3906, "step": 40850 }, { "epoch": 0.44, "learning_rate": 1.2351175344868038e-05, "loss": 21.5011, "step": 40860 }, { "epoch": 0.44, "learning_rate": 1.2347771997452248e-05, "loss": 21.3811, "step": 40870 }, { "epoch": 0.44, "learning_rate": 1.2344368362211315e-05, "loss": 20.5624, "step": 40880 }, { "epoch": 0.44, "learning_rate": 1.2340964439562506e-05, "loss": 21.9685, "step": 40890 }, { "epoch": 0.44, "learning_rate": 1.2337560229923135e-05, "loss": 21.2153, "step": 40900 }, { "epoch": 0.44, "learning_rate": 1.2334155733710535e-05, "loss": 21.21, "step": 40910 }, { "epoch": 0.44, "learning_rate": 1.2330750951342077e-05, "loss": 20.9481, "step": 40920 }, { "epoch": 0.44, "learning_rate": 1.2327345883235177e-05, "loss": 20.8109, "step": 40930 }, { "epoch": 0.44, "learning_rate": 1.2323940529807274e-05, "loss": 21.5736, "step": 40940 }, { "epoch": 0.44, "learning_rate": 1.2320534891475854e-05, "loss": 20.918, "step": 40950 }, { "epoch": 0.44, "learning_rate": 1.2317128968658424e-05, "loss": 21.9101, "step": 40960 }, { "epoch": 0.44, "learning_rate": 1.2313722761772536e-05, "loss": 20.7479, "step": 40970 }, { "epoch": 0.44, "learning_rate": 1.2310316271235774e-05, "loss": 21.4757, "step": 40980 }, { "epoch": 0.44, "learning_rate": 1.2306909497465755e-05, "loss": 21.0824, "step": 40990 }, { "epoch": 0.44, "learning_rate": 1.2303502440880135e-05, "loss": 21.4075, "step": 41000 }, { "epoch": 0.44, "learning_rate": 1.2300095101896606e-05, "loss": 21.874, "step": 41010 }, { "epoch": 0.44, "learning_rate": 1.2296687480932881e-05, "loss": 21.7997, "step": 41020 }, { "epoch": 0.44, "learning_rate": 1.2293279578406727e-05, "loss": 21.2635, "step": 41030 }, { "epoch": 0.44, "learning_rate": 1.2289871394735927e-05, "loss": 21.3634, "step": 41040 }, { "epoch": 0.44, "learning_rate": 1.2286462930338312e-05, "loss": 20.9444, "step": 41050 }, { "epoch": 0.44, "learning_rate": 1.2283054185631746e-05, "loss": 21.4112, "step": 41060 }, { "epoch": 0.44, "learning_rate": 1.2279645161034118e-05, "loss": 21.5124, "step": 41070 }, { "epoch": 0.44, "learning_rate": 1.2276235856963358e-05, "loss": 21.5258, "step": 41080 }, { "epoch": 0.44, "learning_rate": 1.2272826273837436e-05, "loss": 21.7826, "step": 41090 }, { "epoch": 0.44, "learning_rate": 1.2269416412074341e-05, "loss": 21.124, "step": 41100 }, { "epoch": 0.44, "learning_rate": 1.2266006272092115e-05, "loss": 20.9231, "step": 41110 }, { "epoch": 0.44, "learning_rate": 1.2262595854308814e-05, "loss": 21.3451, "step": 41120 }, { "epoch": 0.44, "learning_rate": 1.2259185159142546e-05, "loss": 21.4946, "step": 41130 }, { "epoch": 0.44, "learning_rate": 1.225577418701144e-05, "loss": 21.5815, "step": 41140 }, { "epoch": 0.44, "learning_rate": 1.2252362938333669e-05, "loss": 21.7131, "step": 41150 }, { "epoch": 0.44, "learning_rate": 1.224895141352743e-05, "loss": 21.3079, "step": 41160 }, { "epoch": 0.45, "learning_rate": 1.2245539613010961e-05, "loss": 20.9118, "step": 41170 }, { "epoch": 0.45, "learning_rate": 1.2242127537202535e-05, "loss": 21.3325, "step": 41180 }, { "epoch": 0.45, "learning_rate": 1.223871518652045e-05, "loss": 22.024, "step": 41190 }, { "epoch": 0.45, "learning_rate": 1.2235302561383046e-05, "loss": 21.7576, "step": 41200 }, { "epoch": 0.45, "learning_rate": 1.2231889662208695e-05, "loss": 21.2486, "step": 41210 }, { "epoch": 0.45, "learning_rate": 1.2228476489415799e-05, "loss": 21.5209, "step": 41220 }, { "epoch": 0.45, "learning_rate": 1.2225063043422798e-05, "loss": 21.4149, "step": 41230 }, { "epoch": 0.45, "learning_rate": 1.2221649324648161e-05, "loss": 22.0653, "step": 41240 }, { "epoch": 0.45, "learning_rate": 1.2218235333510395e-05, "loss": 21.7017, "step": 41250 }, { "epoch": 0.45, "learning_rate": 1.2214821070428038e-05, "loss": 21.4423, "step": 41260 }, { "epoch": 0.45, "learning_rate": 1.221140653581966e-05, "loss": 20.141, "step": 41270 }, { "epoch": 0.45, "learning_rate": 1.220799173010387e-05, "loss": 21.2066, "step": 41280 }, { "epoch": 0.45, "learning_rate": 1.2204576653699301e-05, "loss": 22.0888, "step": 41290 }, { "epoch": 0.45, "learning_rate": 1.2201161307024626e-05, "loss": 20.7815, "step": 41300 }, { "epoch": 0.45, "learning_rate": 1.2197745690498553e-05, "loss": 21.7471, "step": 41310 }, { "epoch": 0.45, "learning_rate": 1.2194329804539815e-05, "loss": 21.8436, "step": 41320 }, { "epoch": 0.45, "learning_rate": 1.2190913649567185e-05, "loss": 21.1819, "step": 41330 }, { "epoch": 0.45, "learning_rate": 1.2187497225999463e-05, "loss": 21.8432, "step": 41340 }, { "epoch": 0.45, "learning_rate": 1.2184080534255489e-05, "loss": 20.8984, "step": 41350 }, { "epoch": 0.45, "learning_rate": 1.2180663574754134e-05, "loss": 20.8135, "step": 41360 }, { "epoch": 0.45, "learning_rate": 1.2177246347914297e-05, "loss": 21.4414, "step": 41370 }, { "epoch": 0.45, "learning_rate": 1.2173828854154914e-05, "loss": 21.2722, "step": 41380 }, { "epoch": 0.45, "learning_rate": 1.2170411093894954e-05, "loss": 21.3492, "step": 41390 }, { "epoch": 0.45, "learning_rate": 1.2166993067553412e-05, "loss": 21.057, "step": 41400 }, { "epoch": 0.45, "learning_rate": 1.216357477554933e-05, "loss": 21.3891, "step": 41410 }, { "epoch": 0.45, "learning_rate": 1.2160156218301763e-05, "loss": 21.4296, "step": 41420 }, { "epoch": 0.45, "learning_rate": 1.2156737396229817e-05, "loss": 22.1144, "step": 41430 }, { "epoch": 0.45, "learning_rate": 1.2153318309752622e-05, "loss": 21.0605, "step": 41440 }, { "epoch": 0.45, "learning_rate": 1.2149898959289338e-05, "loss": 21.0424, "step": 41450 }, { "epoch": 0.45, "learning_rate": 1.2146479345259161e-05, "loss": 21.3844, "step": 41460 }, { "epoch": 0.45, "learning_rate": 1.214305946808132e-05, "loss": 21.3874, "step": 41470 }, { "epoch": 0.45, "learning_rate": 1.213963932817507e-05, "loss": 21.9787, "step": 41480 }, { "epoch": 0.45, "learning_rate": 1.2136218925959713e-05, "loss": 20.9127, "step": 41490 }, { "epoch": 0.45, "learning_rate": 1.2132798261854562e-05, "loss": 21.0576, "step": 41500 }, { "epoch": 0.45, "learning_rate": 1.212937733627898e-05, "loss": 20.855, "step": 41510 }, { "epoch": 0.45, "learning_rate": 1.2125956149652356e-05, "loss": 20.7885, "step": 41520 }, { "epoch": 0.45, "learning_rate": 1.2122534702394104e-05, "loss": 20.9274, "step": 41530 }, { "epoch": 0.45, "learning_rate": 1.2119112994923685e-05, "loss": 20.7295, "step": 41540 }, { "epoch": 0.45, "learning_rate": 1.211569102766058e-05, "loss": 21.2461, "step": 41550 }, { "epoch": 0.45, "learning_rate": 1.2112268801024301e-05, "loss": 21.8685, "step": 41560 }, { "epoch": 0.45, "learning_rate": 1.2108846315434401e-05, "loss": 20.56, "step": 41570 }, { "epoch": 0.45, "learning_rate": 1.2105423571310456e-05, "loss": 21.7406, "step": 41580 }, { "epoch": 0.45, "learning_rate": 1.2102000569072081e-05, "loss": 22.0155, "step": 41590 }, { "epoch": 0.45, "learning_rate": 1.2098577309138916e-05, "loss": 20.6569, "step": 41600 }, { "epoch": 0.45, "learning_rate": 1.2095153791930639e-05, "loss": 20.8548, "step": 41610 }, { "epoch": 0.45, "learning_rate": 1.2091730017866952e-05, "loss": 21.5192, "step": 41620 }, { "epoch": 0.45, "learning_rate": 1.2088305987367592e-05, "loss": 20.6219, "step": 41630 }, { "epoch": 0.45, "learning_rate": 1.2084881700852335e-05, "loss": 21.5655, "step": 41640 }, { "epoch": 0.45, "learning_rate": 1.2081457158740974e-05, "loss": 21.0394, "step": 41650 }, { "epoch": 0.45, "learning_rate": 1.2078032361453347e-05, "loss": 20.8628, "step": 41660 }, { "epoch": 0.45, "learning_rate": 1.2074607309409311e-05, "loss": 21.7695, "step": 41670 }, { "epoch": 0.45, "learning_rate": 1.2071182003028766e-05, "loss": 21.6193, "step": 41680 }, { "epoch": 0.45, "learning_rate": 1.2067756442731632e-05, "loss": 21.504, "step": 41690 }, { "epoch": 0.45, "learning_rate": 1.206433062893787e-05, "loss": 21.1021, "step": 41700 }, { "epoch": 0.45, "learning_rate": 1.2060904562067466e-05, "loss": 20.9887, "step": 41710 }, { "epoch": 0.45, "learning_rate": 1.2057478242540436e-05, "loss": 21.6305, "step": 41720 }, { "epoch": 0.45, "learning_rate": 1.2054051670776836e-05, "loss": 20.9488, "step": 41730 }, { "epoch": 0.45, "learning_rate": 1.2050624847196742e-05, "loss": 21.2392, "step": 41740 }, { "epoch": 0.45, "learning_rate": 1.2047197772220267e-05, "loss": 21.2237, "step": 41750 }, { "epoch": 0.45, "learning_rate": 1.2043770446267551e-05, "loss": 21.2914, "step": 41760 }, { "epoch": 0.45, "learning_rate": 1.204034286975877e-05, "loss": 21.3134, "step": 41770 }, { "epoch": 0.45, "learning_rate": 1.2036915043114125e-05, "loss": 21.021, "step": 41780 }, { "epoch": 0.45, "learning_rate": 1.2033486966753856e-05, "loss": 21.2491, "step": 41790 }, { "epoch": 0.45, "learning_rate": 1.2030058641098222e-05, "loss": 21.3448, "step": 41800 }, { "epoch": 0.45, "learning_rate": 1.202663006656752e-05, "loss": 21.0308, "step": 41810 }, { "epoch": 0.45, "learning_rate": 1.202320124358208e-05, "loss": 21.2179, "step": 41820 }, { "epoch": 0.45, "learning_rate": 1.201977217256225e-05, "loss": 21.5319, "step": 41830 }, { "epoch": 0.45, "learning_rate": 1.2016342853928426e-05, "loss": 20.5858, "step": 41840 }, { "epoch": 0.45, "learning_rate": 1.2012913288101022e-05, "loss": 21.1643, "step": 41850 }, { "epoch": 0.45, "learning_rate": 1.2009483475500486e-05, "loss": 22.3803, "step": 41860 }, { "epoch": 0.45, "learning_rate": 1.2006053416547296e-05, "loss": 21.7486, "step": 41870 }, { "epoch": 0.45, "learning_rate": 1.200262311166196e-05, "loss": 20.9844, "step": 41880 }, { "epoch": 0.45, "learning_rate": 1.1999192561265012e-05, "loss": 20.7652, "step": 41890 }, { "epoch": 0.45, "learning_rate": 1.1995761765777027e-05, "loss": 20.7613, "step": 41900 }, { "epoch": 0.45, "learning_rate": 1.19923307256186e-05, "loss": 21.1324, "step": 41910 }, { "epoch": 0.45, "learning_rate": 1.1988899441210362e-05, "loss": 21.1249, "step": 41920 }, { "epoch": 0.45, "learning_rate": 1.198546791297297e-05, "loss": 21.4235, "step": 41930 }, { "epoch": 0.45, "learning_rate": 1.1982036141327107e-05, "loss": 21.5857, "step": 41940 }, { "epoch": 0.45, "learning_rate": 1.19786041266935e-05, "loss": 21.9368, "step": 41950 }, { "epoch": 0.45, "learning_rate": 1.1975171869492889e-05, "loss": 20.6464, "step": 41960 }, { "epoch": 0.45, "learning_rate": 1.197173937014606e-05, "loss": 20.4585, "step": 41970 }, { "epoch": 0.45, "learning_rate": 1.1968306629073816e-05, "loss": 20.8267, "step": 41980 }, { "epoch": 0.45, "learning_rate": 1.1964873646696988e-05, "loss": 20.6849, "step": 41990 }, { "epoch": 0.45, "learning_rate": 1.1961440423436454e-05, "loss": 21.5114, "step": 42000 }, { "epoch": 0.45, "learning_rate": 1.19580069597131e-05, "loss": 21.8186, "step": 42010 }, { "epoch": 0.45, "learning_rate": 1.1954573255947856e-05, "loss": 20.9844, "step": 42020 }, { "epoch": 0.45, "learning_rate": 1.1951139312561681e-05, "loss": 20.8407, "step": 42030 }, { "epoch": 0.45, "learning_rate": 1.194770512997555e-05, "loss": 21.9007, "step": 42040 }, { "epoch": 0.45, "learning_rate": 1.1944270708610484e-05, "loss": 20.8657, "step": 42050 }, { "epoch": 0.45, "learning_rate": 1.1940836048887522e-05, "loss": 21.7353, "step": 42060 }, { "epoch": 0.45, "learning_rate": 1.193740115122774e-05, "loss": 20.8857, "step": 42070 }, { "epoch": 0.45, "learning_rate": 1.1933966016052238e-05, "loss": 20.7047, "step": 42080 }, { "epoch": 0.46, "learning_rate": 1.1930530643782144e-05, "loss": 21.0988, "step": 42090 }, { "epoch": 0.46, "learning_rate": 1.1927095034838615e-05, "loss": 20.6281, "step": 42100 }, { "epoch": 0.46, "learning_rate": 1.1923659189642849e-05, "loss": 21.8821, "step": 42110 }, { "epoch": 0.46, "learning_rate": 1.1920223108616056e-05, "loss": 21.6254, "step": 42120 }, { "epoch": 0.46, "learning_rate": 1.1916786792179487e-05, "loss": 21.8059, "step": 42130 }, { "epoch": 0.46, "learning_rate": 1.191335024075441e-05, "loss": 21.0793, "step": 42140 }, { "epoch": 0.46, "learning_rate": 1.1909913454762138e-05, "loss": 21.2363, "step": 42150 }, { "epoch": 0.46, "learning_rate": 1.1906476434623997e-05, "loss": 21.4129, "step": 42160 }, { "epoch": 0.46, "learning_rate": 1.1903039180761353e-05, "loss": 21.6863, "step": 42170 }, { "epoch": 0.46, "learning_rate": 1.1899601693595593e-05, "loss": 21.9549, "step": 42180 }, { "epoch": 0.46, "learning_rate": 1.1896163973548138e-05, "loss": 21.9228, "step": 42190 }, { "epoch": 0.46, "learning_rate": 1.1892726021040432e-05, "loss": 21.2291, "step": 42200 }, { "epoch": 0.46, "learning_rate": 1.1889287836493958e-05, "loss": 20.8371, "step": 42210 }, { "epoch": 0.46, "learning_rate": 1.1885849420330211e-05, "loss": 21.8423, "step": 42220 }, { "epoch": 0.46, "learning_rate": 1.188241077297073e-05, "loss": 20.9377, "step": 42230 }, { "epoch": 0.46, "learning_rate": 1.1878971894837073e-05, "loss": 21.0525, "step": 42240 }, { "epoch": 0.46, "learning_rate": 1.1875532786350834e-05, "loss": 20.3068, "step": 42250 }, { "epoch": 0.46, "learning_rate": 1.1872093447933627e-05, "loss": 21.468, "step": 42260 }, { "epoch": 0.46, "learning_rate": 1.1868653880007095e-05, "loss": 22.0553, "step": 42270 }, { "epoch": 0.46, "learning_rate": 1.1865214082992914e-05, "loss": 20.5632, "step": 42280 }, { "epoch": 0.46, "learning_rate": 1.1861774057312786e-05, "loss": 21.3044, "step": 42290 }, { "epoch": 0.46, "learning_rate": 1.1858333803388446e-05, "loss": 21.0278, "step": 42300 }, { "epoch": 0.46, "learning_rate": 1.1854893321641647e-05, "loss": 20.7134, "step": 42310 }, { "epoch": 0.46, "learning_rate": 1.1851452612494171e-05, "loss": 21.0073, "step": 42320 }, { "epoch": 0.46, "learning_rate": 1.1848011676367844e-05, "loss": 21.6731, "step": 42330 }, { "epoch": 0.46, "learning_rate": 1.1844570513684493e-05, "loss": 20.6887, "step": 42340 }, { "epoch": 0.46, "learning_rate": 1.1841129124865999e-05, "loss": 21.2787, "step": 42350 }, { "epoch": 0.46, "learning_rate": 1.1837687510334252e-05, "loss": 21.2528, "step": 42360 }, { "epoch": 0.46, "learning_rate": 1.1834245670511177e-05, "loss": 20.7925, "step": 42370 }, { "epoch": 0.46, "learning_rate": 1.1830803605818735e-05, "loss": 20.7302, "step": 42380 }, { "epoch": 0.46, "learning_rate": 1.1827361316678893e-05, "loss": 21.3851, "step": 42390 }, { "epoch": 0.46, "learning_rate": 1.182391880351367e-05, "loss": 21.3336, "step": 42400 }, { "epoch": 0.46, "learning_rate": 1.1820476066745098e-05, "loss": 21.0568, "step": 42410 }, { "epoch": 0.46, "learning_rate": 1.1817033106795231e-05, "loss": 21.2918, "step": 42420 }, { "epoch": 0.46, "learning_rate": 1.1813589924086169e-05, "loss": 21.3465, "step": 42430 }, { "epoch": 0.46, "learning_rate": 1.1810146519040023e-05, "loss": 21.7048, "step": 42440 }, { "epoch": 0.46, "learning_rate": 1.1806702892078939e-05, "loss": 21.1832, "step": 42450 }, { "epoch": 0.46, "learning_rate": 1.1803259043625092e-05, "loss": 21.3199, "step": 42460 }, { "epoch": 0.46, "learning_rate": 1.1799814974100676e-05, "loss": 21.5309, "step": 42470 }, { "epoch": 0.46, "learning_rate": 1.1796370683927918e-05, "loss": 21.6517, "step": 42480 }, { "epoch": 0.46, "learning_rate": 1.1792926173529071e-05, "loss": 20.7918, "step": 42490 }, { "epoch": 0.46, "learning_rate": 1.1789481443326415e-05, "loss": 22.0224, "step": 42500 }, { "epoch": 0.46, "learning_rate": 1.1786036493742261e-05, "loss": 20.6775, "step": 42510 }, { "epoch": 0.46, "learning_rate": 1.1782591325198934e-05, "loss": 20.6656, "step": 42520 }, { "epoch": 0.46, "learning_rate": 1.17791459381188e-05, "loss": 21.2779, "step": 42530 }, { "epoch": 0.46, "learning_rate": 1.1775700332924243e-05, "loss": 21.0926, "step": 42540 }, { "epoch": 0.46, "learning_rate": 1.1772254510037682e-05, "loss": 21.7377, "step": 42550 }, { "epoch": 0.46, "learning_rate": 1.1768808469881555e-05, "loss": 21.9767, "step": 42560 }, { "epoch": 0.46, "learning_rate": 1.1765362212878326e-05, "loss": 21.5259, "step": 42570 }, { "epoch": 0.46, "learning_rate": 1.1761915739450494e-05, "loss": 21.3866, "step": 42580 }, { "epoch": 0.46, "learning_rate": 1.1758469050020578e-05, "loss": 20.8999, "step": 42590 }, { "epoch": 0.46, "learning_rate": 1.1755022145011123e-05, "loss": 21.2173, "step": 42600 }, { "epoch": 0.46, "learning_rate": 1.1751575024844706e-05, "loss": 21.4719, "step": 42610 }, { "epoch": 0.46, "learning_rate": 1.1748127689943925e-05, "loss": 21.0679, "step": 42620 }, { "epoch": 0.46, "learning_rate": 1.1744680140731404e-05, "loss": 21.1668, "step": 42630 }, { "epoch": 0.46, "learning_rate": 1.1741232377629796e-05, "loss": 21.0865, "step": 42640 }, { "epoch": 0.46, "learning_rate": 1.1737784401061782e-05, "loss": 21.6906, "step": 42650 }, { "epoch": 0.46, "learning_rate": 1.1734336211450067e-05, "loss": 21.6609, "step": 42660 }, { "epoch": 0.46, "learning_rate": 1.1730887809217377e-05, "loss": 21.8539, "step": 42670 }, { "epoch": 0.46, "learning_rate": 1.1727439194786474e-05, "loss": 21.6634, "step": 42680 }, { "epoch": 0.46, "learning_rate": 1.1723990368580138e-05, "loss": 21.7981, "step": 42690 }, { "epoch": 0.46, "learning_rate": 1.172054133102118e-05, "loss": 21.6944, "step": 42700 }, { "epoch": 0.46, "learning_rate": 1.1717092082532434e-05, "loss": 21.2278, "step": 42710 }, { "epoch": 0.46, "learning_rate": 1.1713642623536759e-05, "loss": 21.3936, "step": 42720 }, { "epoch": 0.46, "learning_rate": 1.1710192954457045e-05, "loss": 21.4784, "step": 42730 }, { "epoch": 0.46, "learning_rate": 1.17067430757162e-05, "loss": 22.073, "step": 42740 }, { "epoch": 0.46, "learning_rate": 1.1703292987737163e-05, "loss": 21.315, "step": 42750 }, { "epoch": 0.46, "learning_rate": 1.1699842690942903e-05, "loss": 21.9921, "step": 42760 }, { "epoch": 0.46, "learning_rate": 1.16963921857564e-05, "loss": 21.034, "step": 42770 }, { "epoch": 0.46, "learning_rate": 1.1692941472600676e-05, "loss": 20.8267, "step": 42780 }, { "epoch": 0.46, "learning_rate": 1.168949055189877e-05, "loss": 21.1511, "step": 42790 }, { "epoch": 0.46, "learning_rate": 1.1686039424073741e-05, "loss": 20.6438, "step": 42800 }, { "epoch": 0.46, "learning_rate": 1.1682588089548692e-05, "loss": 20.7156, "step": 42810 }, { "epoch": 0.46, "learning_rate": 1.167913654874673e-05, "loss": 20.4426, "step": 42820 }, { "epoch": 0.46, "learning_rate": 1.1675684802090999e-05, "loss": 21.5295, "step": 42830 }, { "epoch": 0.46, "learning_rate": 1.167223285000467e-05, "loss": 20.9206, "step": 42840 }, { "epoch": 0.46, "learning_rate": 1.1668780692910926e-05, "loss": 21.5829, "step": 42850 }, { "epoch": 0.46, "learning_rate": 1.1665328331232995e-05, "loss": 20.9516, "step": 42860 }, { "epoch": 0.46, "learning_rate": 1.1661875765394114e-05, "loss": 21.005, "step": 42870 }, { "epoch": 0.46, "learning_rate": 1.1658422995817544e-05, "loss": 21.1078, "step": 42880 }, { "epoch": 0.46, "learning_rate": 1.1654970022926592e-05, "loss": 20.8596, "step": 42890 }, { "epoch": 0.46, "learning_rate": 1.1651516847144561e-05, "loss": 21.1257, "step": 42900 }, { "epoch": 0.46, "learning_rate": 1.1648063468894803e-05, "loss": 21.7194, "step": 42910 }, { "epoch": 0.46, "learning_rate": 1.1644609888600682e-05, "loss": 21.5149, "step": 42920 }, { "epoch": 0.46, "learning_rate": 1.1641156106685584e-05, "loss": 21.5986, "step": 42930 }, { "epoch": 0.46, "learning_rate": 1.1637702123572936e-05, "loss": 22.0591, "step": 42940 }, { "epoch": 0.46, "learning_rate": 1.163424793968617e-05, "loss": 21.0204, "step": 42950 }, { "epoch": 0.46, "learning_rate": 1.1630793555448756e-05, "loss": 20.8627, "step": 42960 }, { "epoch": 0.46, "learning_rate": 1.1627338971284189e-05, "loss": 21.4006, "step": 42970 }, { "epoch": 0.46, "learning_rate": 1.162388418761597e-05, "loss": 20.8906, "step": 42980 }, { "epoch": 0.46, "learning_rate": 1.162042920486765e-05, "loss": 20.3725, "step": 42990 }, { "epoch": 0.46, "learning_rate": 1.1616974023462789e-05, "loss": 22.0646, "step": 43000 }, { "epoch": 0.46, "learning_rate": 1.1613518643824975e-05, "loss": 21.1449, "step": 43010 }, { "epoch": 0.47, "learning_rate": 1.1610063066377821e-05, "loss": 21.9224, "step": 43020 }, { "epoch": 0.47, "learning_rate": 1.1606607291544962e-05, "loss": 20.6522, "step": 43030 }, { "epoch": 0.47, "learning_rate": 1.1603151319750064e-05, "loss": 20.901, "step": 43040 }, { "epoch": 0.47, "learning_rate": 1.1599695151416804e-05, "loss": 20.8194, "step": 43050 }, { "epoch": 0.47, "learning_rate": 1.1596238786968894e-05, "loss": 21.0008, "step": 43060 }, { "epoch": 0.47, "learning_rate": 1.1592782226830071e-05, "loss": 20.8676, "step": 43070 }, { "epoch": 0.47, "learning_rate": 1.1589325471424087e-05, "loss": 21.5957, "step": 43080 }, { "epoch": 0.47, "learning_rate": 1.1585868521174723e-05, "loss": 21.5749, "step": 43090 }, { "epoch": 0.47, "learning_rate": 1.1582411376505789e-05, "loss": 21.2076, "step": 43100 }, { "epoch": 0.47, "learning_rate": 1.157895403784111e-05, "loss": 21.2466, "step": 43110 }, { "epoch": 0.47, "learning_rate": 1.1575496505604537e-05, "loss": 21.9405, "step": 43120 }, { "epoch": 0.47, "learning_rate": 1.157203878021995e-05, "loss": 21.8633, "step": 43130 }, { "epoch": 0.47, "learning_rate": 1.1568580862111247e-05, "loss": 20.9039, "step": 43140 }, { "epoch": 0.47, "learning_rate": 1.1565122751702351e-05, "loss": 21.2841, "step": 43150 }, { "epoch": 0.47, "learning_rate": 1.156166444941721e-05, "loss": 21.1107, "step": 43160 }, { "epoch": 0.47, "learning_rate": 1.1558205955679792e-05, "loss": 21.3796, "step": 43170 }, { "epoch": 0.47, "learning_rate": 1.1554747270914098e-05, "loss": 21.6641, "step": 43180 }, { "epoch": 0.47, "learning_rate": 1.1551288395544135e-05, "loss": 21.2929, "step": 43190 }, { "epoch": 0.47, "learning_rate": 1.1547829329993954e-05, "loss": 20.6251, "step": 43200 }, { "epoch": 0.47, "learning_rate": 1.1544370074687612e-05, "loss": 20.9039, "step": 43210 }, { "epoch": 0.47, "learning_rate": 1.1540910630049202e-05, "loss": 21.1707, "step": 43220 }, { "epoch": 0.47, "learning_rate": 1.153745099650283e-05, "loss": 21.1303, "step": 43230 }, { "epoch": 0.47, "learning_rate": 1.1533991174472635e-05, "loss": 21.3802, "step": 43240 }, { "epoch": 0.47, "learning_rate": 1.1530531164382768e-05, "loss": 21.1985, "step": 43250 }, { "epoch": 0.47, "learning_rate": 1.152707096665741e-05, "loss": 21.9592, "step": 43260 }, { "epoch": 0.47, "learning_rate": 1.152361058172077e-05, "loss": 20.9866, "step": 43270 }, { "epoch": 0.47, "learning_rate": 1.1520150009997066e-05, "loss": 21.4595, "step": 43280 }, { "epoch": 0.47, "learning_rate": 1.151668925191055e-05, "loss": 21.5137, "step": 43290 }, { "epoch": 0.47, "learning_rate": 1.15132283078855e-05, "loss": 20.8291, "step": 43300 }, { "epoch": 0.47, "learning_rate": 1.1509767178346198e-05, "loss": 21.992, "step": 43310 }, { "epoch": 0.47, "learning_rate": 1.1506305863716973e-05, "loss": 20.6903, "step": 43320 }, { "epoch": 0.47, "learning_rate": 1.150284436442216e-05, "loss": 20.9332, "step": 43330 }, { "epoch": 0.47, "learning_rate": 1.1499382680886116e-05, "loss": 21.7621, "step": 43340 }, { "epoch": 0.47, "learning_rate": 1.1495920813533234e-05, "loss": 21.0873, "step": 43350 }, { "epoch": 0.47, "learning_rate": 1.149245876278792e-05, "loss": 20.8767, "step": 43360 }, { "epoch": 0.47, "learning_rate": 1.1488996529074602e-05, "loss": 22.1592, "step": 43370 }, { "epoch": 0.47, "learning_rate": 1.1485534112817738e-05, "loss": 21.2159, "step": 43380 }, { "epoch": 0.47, "learning_rate": 1.1482071514441793e-05, "loss": 21.1407, "step": 43390 }, { "epoch": 0.47, "learning_rate": 1.1478608734371278e-05, "loss": 20.6153, "step": 43400 }, { "epoch": 0.47, "learning_rate": 1.1475145773030695e-05, "loss": 20.0208, "step": 43410 }, { "epoch": 0.47, "learning_rate": 1.14716826308446e-05, "loss": 22.3524, "step": 43420 }, { "epoch": 0.47, "learning_rate": 1.1468219308237556e-05, "loss": 21.4075, "step": 43430 }, { "epoch": 0.47, "learning_rate": 1.146475580563414e-05, "loss": 20.6619, "step": 43440 }, { "epoch": 0.47, "learning_rate": 1.1461292123458968e-05, "loss": 21.247, "step": 43450 }, { "epoch": 0.47, "learning_rate": 1.145782826213667e-05, "loss": 21.0002, "step": 43460 }, { "epoch": 0.47, "learning_rate": 1.1454364222091895e-05, "loss": 21.1204, "step": 43470 }, { "epoch": 0.47, "learning_rate": 1.145090000374932e-05, "loss": 21.5766, "step": 43480 }, { "epoch": 0.47, "learning_rate": 1.1447435607533632e-05, "loss": 21.3874, "step": 43490 }, { "epoch": 0.47, "learning_rate": 1.1443971033869561e-05, "loss": 21.4381, "step": 43500 }, { "epoch": 0.47, "learning_rate": 1.144050628318184e-05, "loss": 21.8423, "step": 43510 }, { "epoch": 0.47, "learning_rate": 1.1437041355895233e-05, "loss": 21.1903, "step": 43520 }, { "epoch": 0.47, "learning_rate": 1.143357625243452e-05, "loss": 20.5314, "step": 43530 }, { "epoch": 0.47, "learning_rate": 1.1430110973224507e-05, "loss": 21.5656, "step": 43540 }, { "epoch": 0.47, "learning_rate": 1.1426645518690015e-05, "loss": 21.3205, "step": 43550 }, { "epoch": 0.47, "learning_rate": 1.1423179889255902e-05, "loss": 21.6077, "step": 43560 }, { "epoch": 0.47, "learning_rate": 1.141971408534703e-05, "loss": 21.2136, "step": 43570 }, { "epoch": 0.47, "learning_rate": 1.1416248107388286e-05, "loss": 21.5172, "step": 43580 }, { "epoch": 0.47, "learning_rate": 1.1412781955804588e-05, "loss": 21.4189, "step": 43590 }, { "epoch": 0.47, "learning_rate": 1.1409315631020867e-05, "loss": 21.8222, "step": 43600 }, { "epoch": 0.47, "learning_rate": 1.1405849133462076e-05, "loss": 21.2694, "step": 43610 }, { "epoch": 0.47, "learning_rate": 1.1402382463553192e-05, "loss": 21.5826, "step": 43620 }, { "epoch": 0.47, "learning_rate": 1.1398915621719211e-05, "loss": 21.1449, "step": 43630 }, { "epoch": 0.47, "learning_rate": 1.1395448608385149e-05, "loss": 21.2521, "step": 43640 }, { "epoch": 0.47, "learning_rate": 1.1391981423976047e-05, "loss": 21.117, "step": 43650 }, { "epoch": 0.47, "learning_rate": 1.138851406891696e-05, "loss": 21.1892, "step": 43660 }, { "epoch": 0.47, "learning_rate": 1.1385046543632974e-05, "loss": 21.4082, "step": 43670 }, { "epoch": 0.47, "learning_rate": 1.1381578848549186e-05, "loss": 21.1695, "step": 43680 }, { "epoch": 0.47, "learning_rate": 1.1378110984090723e-05, "loss": 21.5183, "step": 43690 }, { "epoch": 0.47, "learning_rate": 1.1374642950682722e-05, "loss": 21.643, "step": 43700 }, { "epoch": 0.47, "learning_rate": 1.1371174748750352e-05, "loss": 21.5887, "step": 43710 }, { "epoch": 0.47, "learning_rate": 1.1367706378718791e-05, "loss": 21.3851, "step": 43720 }, { "epoch": 0.47, "learning_rate": 1.136423784101325e-05, "loss": 21.7285, "step": 43730 }, { "epoch": 0.47, "learning_rate": 1.1360769136058951e-05, "loss": 21.2519, "step": 43740 }, { "epoch": 0.47, "learning_rate": 1.1357300264281144e-05, "loss": 21.1546, "step": 43750 }, { "epoch": 0.47, "learning_rate": 1.135383122610509e-05, "loss": 20.5802, "step": 43760 }, { "epoch": 0.47, "learning_rate": 1.1350362021956073e-05, "loss": 21.1492, "step": 43770 }, { "epoch": 0.47, "learning_rate": 1.1346892652259413e-05, "loss": 21.1733, "step": 43780 }, { "epoch": 0.47, "learning_rate": 1.1343423117440429e-05, "loss": 20.8449, "step": 43790 }, { "epoch": 0.47, "learning_rate": 1.1339953417924465e-05, "loss": 20.766, "step": 43800 }, { "epoch": 0.47, "learning_rate": 1.1336483554136897e-05, "loss": 21.5881, "step": 43810 }, { "epoch": 0.47, "learning_rate": 1.1333013526503107e-05, "loss": 21.4333, "step": 43820 }, { "epoch": 0.47, "learning_rate": 1.1329543335448508e-05, "loss": 21.9891, "step": 43830 }, { "epoch": 0.47, "learning_rate": 1.1326072981398524e-05, "loss": 20.0759, "step": 43840 }, { "epoch": 0.47, "learning_rate": 1.13226024647786e-05, "loss": 22.3188, "step": 43850 }, { "epoch": 0.47, "learning_rate": 1.1319131786014216e-05, "loss": 21.7389, "step": 43860 }, { "epoch": 0.47, "learning_rate": 1.1315660945530846e-05, "loss": 21.3715, "step": 43870 }, { "epoch": 0.47, "learning_rate": 1.1312189943754008e-05, "loss": 20.888, "step": 43880 }, { "epoch": 0.47, "learning_rate": 1.1308718781109227e-05, "loss": 21.7227, "step": 43890 }, { "epoch": 0.47, "learning_rate": 1.1305247458022046e-05, "loss": 21.1909, "step": 43900 }, { "epoch": 0.47, "learning_rate": 1.1301775974918035e-05, "loss": 20.9485, "step": 43910 }, { "epoch": 0.47, "learning_rate": 1.129830433222278e-05, "loss": 21.0301, "step": 43920 }, { "epoch": 0.47, "learning_rate": 1.129483253036189e-05, "loss": 21.7164, "step": 43930 }, { "epoch": 0.48, "learning_rate": 1.129136056976099e-05, "loss": 21.3005, "step": 43940 }, { "epoch": 0.48, "learning_rate": 1.1287888450845717e-05, "loss": 20.9352, "step": 43950 }, { "epoch": 0.48, "learning_rate": 1.1284416174041744e-05, "loss": 21.2305, "step": 43960 }, { "epoch": 0.48, "learning_rate": 1.1280943739774752e-05, "loss": 21.5878, "step": 43970 }, { "epoch": 0.48, "learning_rate": 1.1277471148470445e-05, "loss": 20.5336, "step": 43980 }, { "epoch": 0.48, "learning_rate": 1.1273998400554547e-05, "loss": 21.5825, "step": 43990 }, { "epoch": 0.48, "learning_rate": 1.1270525496452793e-05, "loss": 20.8497, "step": 44000 }, { "epoch": 0.48, "learning_rate": 1.1267052436590954e-05, "loss": 20.7601, "step": 44010 }, { "epoch": 0.48, "learning_rate": 1.1263579221394798e-05, "loss": 21.2265, "step": 44020 }, { "epoch": 0.48, "learning_rate": 1.1260105851290133e-05, "loss": 21.6098, "step": 44030 }, { "epoch": 0.48, "learning_rate": 1.1256632326702774e-05, "loss": 21.8106, "step": 44040 }, { "epoch": 0.48, "learning_rate": 1.1253158648058558e-05, "loss": 20.9149, "step": 44050 }, { "epoch": 0.48, "learning_rate": 1.1249684815783337e-05, "loss": 21.7433, "step": 44060 }, { "epoch": 0.48, "learning_rate": 1.1246210830302993e-05, "loss": 21.6377, "step": 44070 }, { "epoch": 0.48, "learning_rate": 1.1242736692043413e-05, "loss": 21.2624, "step": 44080 }, { "epoch": 0.48, "learning_rate": 1.123926240143051e-05, "loss": 21.8224, "step": 44090 }, { "epoch": 0.48, "learning_rate": 1.1235787958890217e-05, "loss": 21.6445, "step": 44100 }, { "epoch": 0.48, "learning_rate": 1.1232313364848481e-05, "loss": 20.708, "step": 44110 }, { "epoch": 0.48, "learning_rate": 1.1228838619731272e-05, "loss": 20.2501, "step": 44120 }, { "epoch": 0.48, "learning_rate": 1.1225363723964576e-05, "loss": 21.069, "step": 44130 }, { "epoch": 0.48, "learning_rate": 1.1221888677974397e-05, "loss": 20.8238, "step": 44140 }, { "epoch": 0.48, "learning_rate": 1.1218413482186756e-05, "loss": 21.2867, "step": 44150 }, { "epoch": 0.48, "learning_rate": 1.1214938137027702e-05, "loss": 21.7683, "step": 44160 }, { "epoch": 0.48, "learning_rate": 1.1211462642923288e-05, "loss": 21.5013, "step": 44170 }, { "epoch": 0.48, "learning_rate": 1.1207987000299593e-05, "loss": 21.2015, "step": 44180 }, { "epoch": 0.48, "learning_rate": 1.1204511209582718e-05, "loss": 21.083, "step": 44190 }, { "epoch": 0.48, "learning_rate": 1.120103527119877e-05, "loss": 21.2529, "step": 44200 }, { "epoch": 0.48, "learning_rate": 1.1197559185573893e-05, "loss": 21.0634, "step": 44210 }, { "epoch": 0.48, "learning_rate": 1.1194082953134226e-05, "loss": 21.3099, "step": 44220 }, { "epoch": 0.48, "learning_rate": 1.1190606574305942e-05, "loss": 20.9433, "step": 44230 }, { "epoch": 0.48, "learning_rate": 1.1187130049515234e-05, "loss": 21.3737, "step": 44240 }, { "epoch": 0.48, "learning_rate": 1.1183653379188294e-05, "loss": 20.8963, "step": 44250 }, { "epoch": 0.48, "learning_rate": 1.1180176563751356e-05, "loss": 21.7264, "step": 44260 }, { "epoch": 0.48, "learning_rate": 1.1176699603630659e-05, "loss": 21.2554, "step": 44270 }, { "epoch": 0.48, "learning_rate": 1.1173222499252453e-05, "loss": 20.9485, "step": 44280 }, { "epoch": 0.48, "learning_rate": 1.116974525104302e-05, "loss": 20.7896, "step": 44290 }, { "epoch": 0.48, "learning_rate": 1.1166267859428653e-05, "loss": 21.6537, "step": 44300 }, { "epoch": 0.48, "learning_rate": 1.1162790324835657e-05, "loss": 21.8301, "step": 44310 }, { "epoch": 0.48, "learning_rate": 1.115931264769037e-05, "loss": 21.2648, "step": 44320 }, { "epoch": 0.48, "learning_rate": 1.115583482841913e-05, "loss": 20.7942, "step": 44330 }, { "epoch": 0.48, "learning_rate": 1.1152356867448305e-05, "loss": 21.357, "step": 44340 }, { "epoch": 0.48, "learning_rate": 1.1148878765204275e-05, "loss": 20.7559, "step": 44350 }, { "epoch": 0.48, "learning_rate": 1.1145400522113431e-05, "loss": 21.8285, "step": 44360 }, { "epoch": 0.48, "learning_rate": 1.1141922138602203e-05, "loss": 20.7556, "step": 44370 }, { "epoch": 0.48, "learning_rate": 1.1138443615097008e-05, "loss": 21.2238, "step": 44380 }, { "epoch": 0.48, "learning_rate": 1.1134964952024303e-05, "loss": 21.5802, "step": 44390 }, { "epoch": 0.48, "learning_rate": 1.1131486149810557e-05, "loss": 21.5806, "step": 44400 }, { "epoch": 0.48, "learning_rate": 1.1128007208882248e-05, "loss": 20.9787, "step": 44410 }, { "epoch": 0.48, "learning_rate": 1.1124528129665882e-05, "loss": 21.1559, "step": 44420 }, { "epoch": 0.48, "learning_rate": 1.1121048912587973e-05, "loss": 21.2107, "step": 44430 }, { "epoch": 0.48, "learning_rate": 1.1117569558075057e-05, "loss": 21.7529, "step": 44440 }, { "epoch": 0.48, "learning_rate": 1.111409006655369e-05, "loss": 21.1011, "step": 44450 }, { "epoch": 0.48, "learning_rate": 1.1110610438450426e-05, "loss": 21.5514, "step": 44460 }, { "epoch": 0.48, "learning_rate": 1.1107130674191869e-05, "loss": 21.2599, "step": 44470 }, { "epoch": 0.48, "learning_rate": 1.1103650774204606e-05, "loss": 20.9758, "step": 44480 }, { "epoch": 0.48, "learning_rate": 1.1100170738915264e-05, "loss": 21.3313, "step": 44490 }, { "epoch": 0.48, "learning_rate": 1.1096690568750475e-05, "loss": 21.692, "step": 44500 }, { "epoch": 0.48, "learning_rate": 1.109321026413689e-05, "loss": 20.8815, "step": 44510 }, { "epoch": 0.48, "learning_rate": 1.108972982550118e-05, "loss": 21.7176, "step": 44520 }, { "epoch": 0.48, "learning_rate": 1.1086249253270024e-05, "loss": 20.8643, "step": 44530 }, { "epoch": 0.48, "learning_rate": 1.1082768547870123e-05, "loss": 21.6755, "step": 44540 }, { "epoch": 0.48, "learning_rate": 1.1079287709728202e-05, "loss": 20.823, "step": 44550 }, { "epoch": 0.48, "learning_rate": 1.1075806739270986e-05, "loss": 21.8582, "step": 44560 }, { "epoch": 0.48, "learning_rate": 1.1072325636925231e-05, "loss": 21.4013, "step": 44570 }, { "epoch": 0.48, "learning_rate": 1.1068844403117698e-05, "loss": 21.7015, "step": 44580 }, { "epoch": 0.48, "learning_rate": 1.1065363038275172e-05, "loss": 21.5407, "step": 44590 }, { "epoch": 0.48, "learning_rate": 1.1061881542824449e-05, "loss": 22.0502, "step": 44600 }, { "epoch": 0.48, "learning_rate": 1.105839991719234e-05, "loss": 21.2578, "step": 44610 }, { "epoch": 0.48, "learning_rate": 1.1054918161805684e-05, "loss": 20.9966, "step": 44620 }, { "epoch": 0.48, "learning_rate": 1.1051436277091319e-05, "loss": 22.0925, "step": 44630 }, { "epoch": 0.48, "learning_rate": 1.1047954263476108e-05, "loss": 21.1591, "step": 44640 }, { "epoch": 0.48, "learning_rate": 1.104447212138693e-05, "loss": 21.2651, "step": 44650 }, { "epoch": 0.48, "learning_rate": 1.1040989851250678e-05, "loss": 20.655, "step": 44660 }, { "epoch": 0.48, "learning_rate": 1.1037507453494262e-05, "loss": 21.7503, "step": 44670 }, { "epoch": 0.48, "learning_rate": 1.1034024928544607e-05, "loss": 21.3377, "step": 44680 }, { "epoch": 0.48, "learning_rate": 1.1030542276828647e-05, "loss": 22.0138, "step": 44690 }, { "epoch": 0.48, "learning_rate": 1.1027059498773345e-05, "loss": 21.1562, "step": 44700 }, { "epoch": 0.48, "learning_rate": 1.1023576594805667e-05, "loss": 21.2242, "step": 44710 }, { "epoch": 0.48, "learning_rate": 1.1020093565352607e-05, "loss": 21.0162, "step": 44720 }, { "epoch": 0.48, "learning_rate": 1.101661041084116e-05, "loss": 21.6492, "step": 44730 }, { "epoch": 0.48, "learning_rate": 1.1013127131698343e-05, "loss": 21.679, "step": 44740 }, { "epoch": 0.48, "learning_rate": 1.1009643728351197e-05, "loss": 21.1083, "step": 44750 }, { "epoch": 0.48, "learning_rate": 1.1006160201226756e-05, "loss": 22.0859, "step": 44760 }, { "epoch": 0.48, "learning_rate": 1.1002676550752098e-05, "loss": 21.3531, "step": 44770 }, { "epoch": 0.48, "learning_rate": 1.0999192777354294e-05, "loss": 20.9618, "step": 44780 }, { "epoch": 0.48, "learning_rate": 1.0995708881460434e-05, "loss": 21.3442, "step": 44790 }, { "epoch": 0.48, "learning_rate": 1.0992224863497633e-05, "loss": 21.6436, "step": 44800 }, { "epoch": 0.48, "learning_rate": 1.0988740723893008e-05, "loss": 21.5515, "step": 44810 }, { "epoch": 0.48, "learning_rate": 1.0985256463073703e-05, "loss": 21.3256, "step": 44820 }, { "epoch": 0.48, "learning_rate": 1.098177208146687e-05, "loss": 22.3731, "step": 44830 }, { "epoch": 0.48, "learning_rate": 1.0978287579499672e-05, "loss": 21.4042, "step": 44840 }, { "epoch": 0.48, "learning_rate": 1.0974802957599293e-05, "loss": 21.1899, "step": 44850 }, { "epoch": 0.48, "learning_rate": 1.0971318216192934e-05, "loss": 21.0894, "step": 44860 }, { "epoch": 0.49, "learning_rate": 1.0967833355707807e-05, "loss": 21.3912, "step": 44870 }, { "epoch": 0.49, "learning_rate": 1.0964348376571135e-05, "loss": 21.4567, "step": 44880 }, { "epoch": 0.49, "learning_rate": 1.0960863279210158e-05, "loss": 20.44, "step": 44890 }, { "epoch": 0.49, "learning_rate": 1.0957378064052138e-05, "loss": 20.991, "step": 44900 }, { "epoch": 0.49, "learning_rate": 1.0953892731524338e-05, "loss": 21.695, "step": 44910 }, { "epoch": 0.49, "learning_rate": 1.0950407282054045e-05, "loss": 20.3577, "step": 44920 }, { "epoch": 0.49, "learning_rate": 1.0946921716068561e-05, "loss": 21.4819, "step": 44930 }, { "epoch": 0.49, "learning_rate": 1.0943436033995194e-05, "loss": 21.3578, "step": 44940 }, { "epoch": 0.49, "learning_rate": 1.0939950236261274e-05, "loss": 21.1279, "step": 44950 }, { "epoch": 0.49, "learning_rate": 1.0936464323294142e-05, "loss": 21.0941, "step": 44960 }, { "epoch": 0.49, "learning_rate": 1.0932978295521152e-05, "loss": 20.7761, "step": 44970 }, { "epoch": 0.49, "learning_rate": 1.0929492153369678e-05, "loss": 21.4879, "step": 44980 }, { "epoch": 0.49, "learning_rate": 1.0926005897267097e-05, "loss": 21.1276, "step": 44990 }, { "epoch": 0.49, "learning_rate": 1.0922519527640814e-05, "loss": 21.209, "step": 45000 }, { "epoch": 0.49, "learning_rate": 1.0919033044918235e-05, "loss": 20.7824, "step": 45010 }, { "epoch": 0.49, "learning_rate": 1.0915546449526785e-05, "loss": 21.3493, "step": 45020 }, { "epoch": 0.49, "learning_rate": 1.0912059741893908e-05, "loss": 21.6689, "step": 45030 }, { "epoch": 0.49, "learning_rate": 1.0908572922447055e-05, "loss": 20.777, "step": 45040 }, { "epoch": 0.49, "learning_rate": 1.090508599161369e-05, "loss": 21.6308, "step": 45050 }, { "epoch": 0.49, "learning_rate": 1.0901598949821295e-05, "loss": 21.1762, "step": 45060 }, { "epoch": 0.49, "learning_rate": 1.0898111797497366e-05, "loss": 21.6276, "step": 45070 }, { "epoch": 0.49, "learning_rate": 1.0894624535069406e-05, "loss": 21.4511, "step": 45080 }, { "epoch": 0.49, "learning_rate": 1.0891137162964942e-05, "loss": 21.7061, "step": 45090 }, { "epoch": 0.49, "learning_rate": 1.0887649681611505e-05, "loss": 22.326, "step": 45100 }, { "epoch": 0.49, "learning_rate": 1.088416209143664e-05, "loss": 21.1338, "step": 45110 }, { "epoch": 0.49, "learning_rate": 1.088067439286791e-05, "loss": 21.852, "step": 45120 }, { "epoch": 0.49, "learning_rate": 1.0877186586332898e-05, "loss": 21.3165, "step": 45130 }, { "epoch": 0.49, "learning_rate": 1.0873698672259181e-05, "loss": 21.6277, "step": 45140 }, { "epoch": 0.49, "learning_rate": 1.0870210651074362e-05, "loss": 21.6699, "step": 45150 }, { "epoch": 0.49, "learning_rate": 1.0866722523206057e-05, "loss": 21.6596, "step": 45160 }, { "epoch": 0.49, "learning_rate": 1.0863234289081888e-05, "loss": 21.0565, "step": 45170 }, { "epoch": 0.49, "learning_rate": 1.0859745949129505e-05, "loss": 21.2765, "step": 45180 }, { "epoch": 0.49, "learning_rate": 1.0856257503776554e-05, "loss": 20.4155, "step": 45190 }, { "epoch": 0.49, "learning_rate": 1.08527689534507e-05, "loss": 21.2552, "step": 45200 }, { "epoch": 0.49, "learning_rate": 1.084928029857963e-05, "loss": 20.5398, "step": 45210 }, { "epoch": 0.49, "learning_rate": 1.0845791539591023e-05, "loss": 20.7476, "step": 45220 }, { "epoch": 0.49, "learning_rate": 1.0842302676912595e-05, "loss": 21.1753, "step": 45230 }, { "epoch": 0.49, "learning_rate": 1.083881371097206e-05, "loss": 20.9611, "step": 45240 }, { "epoch": 0.49, "learning_rate": 1.0835324642197143e-05, "loss": 21.2474, "step": 45250 }, { "epoch": 0.49, "learning_rate": 1.0831835471015592e-05, "loss": 20.6308, "step": 45260 }, { "epoch": 0.49, "learning_rate": 1.0828346197855157e-05, "loss": 20.7753, "step": 45270 }, { "epoch": 0.49, "learning_rate": 1.082485682314361e-05, "loss": 21.4597, "step": 45280 }, { "epoch": 0.49, "learning_rate": 1.0821367347308734e-05, "loss": 20.7082, "step": 45290 }, { "epoch": 0.49, "learning_rate": 1.0817877770778309e-05, "loss": 20.9548, "step": 45300 }, { "epoch": 0.49, "learning_rate": 1.0814388093980152e-05, "loss": 20.9498, "step": 45310 }, { "epoch": 0.49, "learning_rate": 1.0810898317342074e-05, "loss": 21.4092, "step": 45320 }, { "epoch": 0.49, "learning_rate": 1.0807408441291907e-05, "loss": 20.8188, "step": 45330 }, { "epoch": 0.49, "learning_rate": 1.0803918466257491e-05, "loss": 20.8501, "step": 45340 }, { "epoch": 0.49, "learning_rate": 1.0800428392666676e-05, "loss": 20.6937, "step": 45350 }, { "epoch": 0.49, "learning_rate": 1.0796938220947335e-05, "loss": 20.9968, "step": 45360 }, { "epoch": 0.49, "learning_rate": 1.0793447951527339e-05, "loss": 21.6584, "step": 45370 }, { "epoch": 0.49, "learning_rate": 1.0789957584834584e-05, "loss": 21.222, "step": 45380 }, { "epoch": 0.49, "learning_rate": 1.0786467121296963e-05, "loss": 21.0483, "step": 45390 }, { "epoch": 0.49, "learning_rate": 1.0782976561342398e-05, "loss": 21.4984, "step": 45400 }, { "epoch": 0.49, "learning_rate": 1.077948590539881e-05, "loss": 20.6011, "step": 45410 }, { "epoch": 0.49, "learning_rate": 1.0775995153894136e-05, "loss": 20.9103, "step": 45420 }, { "epoch": 0.49, "learning_rate": 1.0772504307256326e-05, "loss": 21.5918, "step": 45430 }, { "epoch": 0.49, "learning_rate": 1.076901336591334e-05, "loss": 21.716, "step": 45440 }, { "epoch": 0.49, "learning_rate": 1.076552233029315e-05, "loss": 21.1089, "step": 45450 }, { "epoch": 0.49, "learning_rate": 1.0762031200823737e-05, "loss": 21.7621, "step": 45460 }, { "epoch": 0.49, "learning_rate": 1.0758539977933101e-05, "loss": 21.2061, "step": 45470 }, { "epoch": 0.49, "learning_rate": 1.0755048662049245e-05, "loss": 22.0814, "step": 45480 }, { "epoch": 0.49, "learning_rate": 1.0751557253600188e-05, "loss": 21.6229, "step": 45490 }, { "epoch": 0.49, "learning_rate": 1.074806575301396e-05, "loss": 21.5798, "step": 45500 }, { "epoch": 0.49, "learning_rate": 1.0744574160718599e-05, "loss": 21.59, "step": 45510 }, { "epoch": 0.49, "learning_rate": 1.074108247714216e-05, "loss": 21.7451, "step": 45520 }, { "epoch": 0.49, "learning_rate": 1.0737590702712702e-05, "loss": 21.7036, "step": 45530 }, { "epoch": 0.49, "learning_rate": 1.0734098837858304e-05, "loss": 20.8394, "step": 45540 }, { "epoch": 0.49, "learning_rate": 1.0730606883007048e-05, "loss": 21.6169, "step": 45550 }, { "epoch": 0.49, "learning_rate": 1.0727114838587032e-05, "loss": 21.5458, "step": 45560 }, { "epoch": 0.49, "learning_rate": 1.072362270502636e-05, "loss": 22.0103, "step": 45570 }, { "epoch": 0.49, "learning_rate": 1.0720130482753153e-05, "loss": 21.3336, "step": 45580 }, { "epoch": 0.49, "learning_rate": 1.0716638172195541e-05, "loss": 22.2893, "step": 45590 }, { "epoch": 0.49, "learning_rate": 1.0713145773781664e-05, "loss": 20.2684, "step": 45600 }, { "epoch": 0.49, "learning_rate": 1.0709653287939667e-05, "loss": 21.2435, "step": 45610 }, { "epoch": 0.49, "learning_rate": 1.0706160715097718e-05, "loss": 21.1369, "step": 45620 }, { "epoch": 0.49, "learning_rate": 1.0702668055683982e-05, "loss": 21.2329, "step": 45630 }, { "epoch": 0.49, "learning_rate": 1.0699175310126652e-05, "loss": 21.1828, "step": 45640 }, { "epoch": 0.49, "learning_rate": 1.0695682478853913e-05, "loss": 21.7573, "step": 45650 }, { "epoch": 0.49, "learning_rate": 1.069218956229397e-05, "loss": 21.5507, "step": 45660 }, { "epoch": 0.49, "learning_rate": 1.068869656087504e-05, "loss": 22.03, "step": 45670 }, { "epoch": 0.49, "learning_rate": 1.068520347502534e-05, "loss": 21.2169, "step": 45680 }, { "epoch": 0.49, "learning_rate": 1.0681710305173118e-05, "loss": 21.0443, "step": 45690 }, { "epoch": 0.49, "learning_rate": 1.0678217051746609e-05, "loss": 21.2291, "step": 45700 }, { "epoch": 0.49, "learning_rate": 1.0674723715174069e-05, "loss": 21.1088, "step": 45710 }, { "epoch": 0.49, "learning_rate": 1.067123029588377e-05, "loss": 21.4258, "step": 45720 }, { "epoch": 0.49, "learning_rate": 1.0667736794303977e-05, "loss": 20.5932, "step": 45730 }, { "epoch": 0.49, "learning_rate": 1.0664243210862989e-05, "loss": 20.7322, "step": 45740 }, { "epoch": 0.49, "learning_rate": 1.0660749545989093e-05, "loss": 21.8955, "step": 45750 }, { "epoch": 0.49, "learning_rate": 1.0657255800110596e-05, "loss": 21.5211, "step": 45760 }, { "epoch": 0.49, "learning_rate": 1.0653761973655819e-05, "loss": 20.3184, "step": 45770 }, { "epoch": 0.49, "learning_rate": 1.0650268067053077e-05, "loss": 21.3678, "step": 45780 }, { "epoch": 0.5, "learning_rate": 1.0646774080730717e-05, "loss": 21.2298, "step": 45790 }, { "epoch": 0.5, "learning_rate": 1.064328001511708e-05, "loss": 21.6147, "step": 45800 }, { "epoch": 0.5, "learning_rate": 1.063978587064052e-05, "loss": 21.735, "step": 45810 }, { "epoch": 0.5, "learning_rate": 1.0636291647729402e-05, "loss": 20.681, "step": 45820 }, { "epoch": 0.5, "learning_rate": 1.06327973468121e-05, "loss": 21.0105, "step": 45830 }, { "epoch": 0.5, "learning_rate": 1.0629302968316998e-05, "loss": 21.3939, "step": 45840 }, { "epoch": 0.5, "learning_rate": 1.0625808512672495e-05, "loss": 20.5156, "step": 45850 }, { "epoch": 0.5, "learning_rate": 1.0622313980306982e-05, "loss": 20.3121, "step": 45860 }, { "epoch": 0.5, "learning_rate": 1.0618819371648881e-05, "loss": 21.7729, "step": 45870 }, { "epoch": 0.5, "learning_rate": 1.0615324687126612e-05, "loss": 21.0434, "step": 45880 }, { "epoch": 0.5, "learning_rate": 1.0611829927168602e-05, "loss": 20.7826, "step": 45890 }, { "epoch": 0.5, "learning_rate": 1.0608335092203294e-05, "loss": 20.9518, "step": 45900 }, { "epoch": 0.5, "learning_rate": 1.0604840182659138e-05, "loss": 21.2771, "step": 45910 }, { "epoch": 0.5, "learning_rate": 1.060134519896459e-05, "loss": 21.5415, "step": 45920 }, { "epoch": 0.5, "learning_rate": 1.059785014154812e-05, "loss": 20.7847, "step": 45930 }, { "epoch": 0.5, "learning_rate": 1.0594355010838205e-05, "loss": 21.7804, "step": 45940 }, { "epoch": 0.5, "learning_rate": 1.0590859807263327e-05, "loss": 20.8231, "step": 45950 }, { "epoch": 0.5, "learning_rate": 1.0587364531251983e-05, "loss": 21.1737, "step": 45960 }, { "epoch": 0.5, "learning_rate": 1.0583869183232678e-05, "loss": 22.0544, "step": 45970 }, { "epoch": 0.5, "learning_rate": 1.058037376363392e-05, "loss": 20.8464, "step": 45980 }, { "epoch": 0.5, "learning_rate": 1.0576878272884234e-05, "loss": 20.5569, "step": 45990 }, { "epoch": 0.5, "learning_rate": 1.0573382711412148e-05, "loss": 20.1937, "step": 46000 }, { "epoch": 0.5, "learning_rate": 1.05698870796462e-05, "loss": 21.4457, "step": 46010 }, { "epoch": 0.5, "learning_rate": 1.0566391378014937e-05, "loss": 21.4245, "step": 46020 }, { "epoch": 0.5, "learning_rate": 1.0562895606946916e-05, "loss": 21.6604, "step": 46030 }, { "epoch": 0.5, "learning_rate": 1.0559399766870701e-05, "loss": 21.5552, "step": 46040 }, { "epoch": 0.5, "learning_rate": 1.0555903858214865e-05, "loss": 21.0875, "step": 46050 }, { "epoch": 0.5, "learning_rate": 1.0552407881407984e-05, "loss": 21.2977, "step": 46060 }, { "epoch": 0.5, "learning_rate": 1.0548911836878655e-05, "loss": 21.695, "step": 46070 }, { "epoch": 0.5, "learning_rate": 1.0545415725055468e-05, "loss": 20.9829, "step": 46080 }, { "epoch": 0.5, "learning_rate": 1.0541919546367032e-05, "loss": 21.1563, "step": 46090 }, { "epoch": 0.5, "learning_rate": 1.0538423301241967e-05, "loss": 21.2293, "step": 46100 }, { "epoch": 0.5, "learning_rate": 1.0534926990108887e-05, "loss": 21.2762, "step": 46110 }, { "epoch": 0.5, "learning_rate": 1.0531430613396428e-05, "loss": 21.032, "step": 46120 }, { "epoch": 0.5, "learning_rate": 1.052793417153322e-05, "loss": 21.0607, "step": 46130 }, { "epoch": 0.5, "learning_rate": 1.0524437664947918e-05, "loss": 21.457, "step": 46140 }, { "epoch": 0.5, "learning_rate": 1.0520941094069175e-05, "loss": 21.7442, "step": 46150 }, { "epoch": 0.5, "learning_rate": 1.051744445932565e-05, "loss": 20.7003, "step": 46160 }, { "epoch": 0.5, "learning_rate": 1.051394776114601e-05, "loss": 20.3595, "step": 46170 }, { "epoch": 0.5, "learning_rate": 1.0510450999958946e-05, "loss": 21.7072, "step": 46180 }, { "epoch": 0.5, "learning_rate": 1.0506954176193128e-05, "loss": 21.2506, "step": 46190 }, { "epoch": 0.5, "learning_rate": 1.0503457290277255e-05, "loss": 20.9857, "step": 46200 }, { "epoch": 0.5, "learning_rate": 1.0499960342640035e-05, "loss": 21.3328, "step": 46210 }, { "epoch": 0.5, "learning_rate": 1.0496463333710164e-05, "loss": 21.738, "step": 46220 }, { "epoch": 0.5, "learning_rate": 1.0492966263916367e-05, "loss": 21.0849, "step": 46230 }, { "epoch": 0.5, "learning_rate": 1.048946913368736e-05, "loss": 21.3176, "step": 46240 }, { "epoch": 0.5, "learning_rate": 1.048597194345188e-05, "loss": 21.2066, "step": 46250 }, { "epoch": 0.5, "learning_rate": 1.0482474693638668e-05, "loss": 21.0291, "step": 46260 }, { "epoch": 0.5, "learning_rate": 1.0478977384676457e-05, "loss": 21.7947, "step": 46270 }, { "epoch": 0.5, "learning_rate": 1.0475480016994009e-05, "loss": 21.2572, "step": 46280 }, { "epoch": 0.5, "learning_rate": 1.0471982591020083e-05, "loss": 21.2987, "step": 46290 }, { "epoch": 0.5, "learning_rate": 1.0468485107183443e-05, "loss": 20.8122, "step": 46300 }, { "epoch": 0.5, "learning_rate": 1.0464987565912868e-05, "loss": 20.9879, "step": 46310 }, { "epoch": 0.5, "learning_rate": 1.046148996763713e-05, "loss": 21.1415, "step": 46320 }, { "epoch": 0.5, "learning_rate": 1.0457992312785027e-05, "loss": 20.7299, "step": 46330 }, { "epoch": 0.5, "learning_rate": 1.045449460178535e-05, "loss": 21.8762, "step": 46340 }, { "epoch": 0.5, "learning_rate": 1.0450996835066902e-05, "loss": 21.4979, "step": 46350 }, { "epoch": 0.5, "learning_rate": 1.0447499013058489e-05, "loss": 21.4483, "step": 46360 }, { "epoch": 0.5, "learning_rate": 1.044400113618893e-05, "loss": 21.4618, "step": 46370 }, { "epoch": 0.5, "learning_rate": 1.0440503204887046e-05, "loss": 21.3176, "step": 46380 }, { "epoch": 0.5, "learning_rate": 1.0437005219581662e-05, "loss": 21.6458, "step": 46390 }, { "epoch": 0.5, "learning_rate": 1.0433507180701618e-05, "loss": 21.8055, "step": 46400 }, { "epoch": 0.5, "learning_rate": 1.0430009088675759e-05, "loss": 21.755, "step": 46410 }, { "epoch": 0.5, "learning_rate": 1.0426510943932927e-05, "loss": 21.8433, "step": 46420 }, { "epoch": 0.5, "learning_rate": 1.0423012746901979e-05, "loss": 21.3398, "step": 46430 }, { "epoch": 0.5, "learning_rate": 1.0419514498011779e-05, "loss": 21.5116, "step": 46440 }, { "epoch": 0.5, "learning_rate": 1.0416016197691192e-05, "loss": 22.4402, "step": 46450 }, { "epoch": 0.5, "learning_rate": 1.0412517846369094e-05, "loss": 21.4258, "step": 46460 }, { "epoch": 0.5, "learning_rate": 1.0409019444474366e-05, "loss": 21.2427, "step": 46470 }, { "epoch": 0.5, "learning_rate": 1.0405520992435894e-05, "loss": 21.4953, "step": 46480 }, { "epoch": 0.5, "learning_rate": 1.0402022490682568e-05, "loss": 21.284, "step": 46490 }, { "epoch": 0.5, "learning_rate": 1.039852393964329e-05, "loss": 21.4171, "step": 46500 }, { "epoch": 0.5, "learning_rate": 1.0395025339746965e-05, "loss": 21.2116, "step": 46510 }, { "epoch": 0.5, "learning_rate": 1.03915266914225e-05, "loss": 22.2696, "step": 46520 }, { "epoch": 0.5, "learning_rate": 1.038802799509882e-05, "loss": 21.2753, "step": 46530 }, { "epoch": 0.5, "learning_rate": 1.038452925120484e-05, "loss": 20.6009, "step": 46540 }, { "epoch": 0.5, "learning_rate": 1.0381030460169488e-05, "loss": 21.681, "step": 46550 }, { "epoch": 0.5, "learning_rate": 1.0377531622421705e-05, "loss": 21.4183, "step": 46560 }, { "epoch": 0.5, "learning_rate": 1.0374032738390426e-05, "loss": 21.3566, "step": 46570 }, { "epoch": 0.5, "learning_rate": 1.0370533808504602e-05, "loss": 21.6893, "step": 46580 }, { "epoch": 0.5, "learning_rate": 1.036703483319318e-05, "loss": 21.1612, "step": 46590 }, { "epoch": 0.5, "learning_rate": 1.0363535812885113e-05, "loss": 21.5087, "step": 46600 }, { "epoch": 0.5, "learning_rate": 1.0360036748009372e-05, "loss": 20.4277, "step": 46610 }, { "epoch": 0.5, "learning_rate": 1.0356537638994918e-05, "loss": 21.64, "step": 46620 }, { "epoch": 0.5, "learning_rate": 1.0353038486270729e-05, "loss": 21.8712, "step": 46630 }, { "epoch": 0.5, "learning_rate": 1.0349539290265782e-05, "loss": 21.0808, "step": 46640 }, { "epoch": 0.5, "learning_rate": 1.0346040051409059e-05, "loss": 20.9525, "step": 46650 }, { "epoch": 0.5, "learning_rate": 1.0342540770129554e-05, "loss": 20.5909, "step": 46660 }, { "epoch": 0.5, "learning_rate": 1.0339041446856256e-05, "loss": 20.3991, "step": 46670 }, { "epoch": 0.5, "learning_rate": 1.0335542082018166e-05, "loss": 21.0323, "step": 46680 }, { "epoch": 0.5, "learning_rate": 1.0332042676044294e-05, "loss": 21.7628, "step": 46690 }, { "epoch": 0.5, "learning_rate": 1.0328543229363641e-05, "loss": 21.3541, "step": 46700 }, { "epoch": 0.5, "learning_rate": 1.032504374240523e-05, "loss": 21.3041, "step": 46710 }, { "epoch": 0.51, "learning_rate": 1.0321544215598079e-05, "loss": 21.0552, "step": 46720 }, { "epoch": 0.51, "learning_rate": 1.0318044649371204e-05, "loss": 21.3867, "step": 46730 }, { "epoch": 0.51, "learning_rate": 1.0314545044153645e-05, "loss": 21.4554, "step": 46740 }, { "epoch": 0.51, "learning_rate": 1.0311045400374429e-05, "loss": 21.2019, "step": 46750 }, { "epoch": 0.51, "learning_rate": 1.03075457184626e-05, "loss": 21.5227, "step": 46760 }, { "epoch": 0.51, "learning_rate": 1.03040459988472e-05, "loss": 21.258, "step": 46770 }, { "epoch": 0.51, "learning_rate": 1.0300546241957274e-05, "loss": 21.0437, "step": 46780 }, { "epoch": 0.51, "learning_rate": 1.0297046448221881e-05, "loss": 20.8429, "step": 46790 }, { "epoch": 0.51, "learning_rate": 1.0293546618070072e-05, "loss": 21.5735, "step": 46800 }, { "epoch": 0.51, "learning_rate": 1.029004675193091e-05, "loss": 20.2569, "step": 46810 }, { "epoch": 0.51, "learning_rate": 1.0286546850233468e-05, "loss": 21.7764, "step": 46820 }, { "epoch": 0.51, "learning_rate": 1.0283046913406805e-05, "loss": 20.983, "step": 46830 }, { "epoch": 0.51, "learning_rate": 1.0279546941880005e-05, "loss": 20.6967, "step": 46840 }, { "epoch": 0.51, "learning_rate": 1.0276046936082143e-05, "loss": 21.168, "step": 46850 }, { "epoch": 0.51, "learning_rate": 1.0272546896442301e-05, "loss": 21.2625, "step": 46860 }, { "epoch": 0.51, "learning_rate": 1.0269046823389573e-05, "loss": 21.1806, "step": 46870 }, { "epoch": 0.51, "learning_rate": 1.0265546717353041e-05, "loss": 20.3359, "step": 46880 }, { "epoch": 0.51, "learning_rate": 1.0262046578761809e-05, "loss": 20.8039, "step": 46890 }, { "epoch": 0.51, "learning_rate": 1.0258546408044972e-05, "loss": 21.2278, "step": 46900 }, { "epoch": 0.51, "learning_rate": 1.0255046205631634e-05, "loss": 21.6851, "step": 46910 }, { "epoch": 0.51, "learning_rate": 1.0251545971950903e-05, "loss": 21.6523, "step": 46920 }, { "epoch": 0.51, "learning_rate": 1.0248045707431891e-05, "loss": 21.2066, "step": 46930 }, { "epoch": 0.51, "learning_rate": 1.024454541250371e-05, "loss": 21.1752, "step": 46940 }, { "epoch": 0.51, "learning_rate": 1.0241045087595482e-05, "loss": 21.1021, "step": 46950 }, { "epoch": 0.51, "learning_rate": 1.0237544733136328e-05, "loss": 20.9053, "step": 46960 }, { "epoch": 0.51, "learning_rate": 1.0234044349555377e-05, "loss": 20.6964, "step": 46970 }, { "epoch": 0.51, "learning_rate": 1.0230543937281749e-05, "loss": 20.7018, "step": 46980 }, { "epoch": 0.51, "learning_rate": 1.0227043496744591e-05, "loss": 21.6958, "step": 46990 }, { "epoch": 0.51, "learning_rate": 1.0223543028373031e-05, "loss": 21.1559, "step": 47000 }, { "epoch": 0.51, "learning_rate": 1.0220042532596208e-05, "loss": 21.1159, "step": 47010 }, { "epoch": 0.51, "learning_rate": 1.021654200984327e-05, "loss": 20.8536, "step": 47020 }, { "epoch": 0.51, "learning_rate": 1.0213041460543356e-05, "loss": 20.5383, "step": 47030 }, { "epoch": 0.51, "learning_rate": 1.0209540885125625e-05, "loss": 20.5523, "step": 47040 }, { "epoch": 0.51, "learning_rate": 1.0206040284019227e-05, "loss": 21.3311, "step": 47050 }, { "epoch": 0.51, "learning_rate": 1.0202539657653317e-05, "loss": 21.1752, "step": 47060 }, { "epoch": 0.51, "learning_rate": 1.0199039006457056e-05, "loss": 21.0677, "step": 47070 }, { "epoch": 0.51, "learning_rate": 1.0195538330859602e-05, "loss": 21.0084, "step": 47080 }, { "epoch": 0.51, "learning_rate": 1.0192037631290128e-05, "loss": 20.4561, "step": 47090 }, { "epoch": 0.51, "learning_rate": 1.0188536908177795e-05, "loss": 21.14, "step": 47100 }, { "epoch": 0.51, "learning_rate": 1.0185036161951776e-05, "loss": 21.0649, "step": 47110 }, { "epoch": 0.51, "learning_rate": 1.0181535393041248e-05, "loss": 21.7475, "step": 47120 }, { "epoch": 0.51, "learning_rate": 1.0178034601875384e-05, "loss": 20.7498, "step": 47130 }, { "epoch": 0.51, "learning_rate": 1.0174533788883367e-05, "loss": 21.756, "step": 47140 }, { "epoch": 0.51, "learning_rate": 1.0171032954494381e-05, "loss": 20.6575, "step": 47150 }, { "epoch": 0.51, "learning_rate": 1.0167532099137603e-05, "loss": 21.5652, "step": 47160 }, { "epoch": 0.51, "learning_rate": 1.0164031223242228e-05, "loss": 20.5912, "step": 47170 }, { "epoch": 0.51, "learning_rate": 1.0160530327237441e-05, "loss": 21.3591, "step": 47180 }, { "epoch": 0.51, "learning_rate": 1.0157029411552437e-05, "loss": 20.9646, "step": 47190 }, { "epoch": 0.51, "learning_rate": 1.0153528476616412e-05, "loss": 21.6984, "step": 47200 }, { "epoch": 0.51, "learning_rate": 1.0150027522858556e-05, "loss": 21.541, "step": 47210 }, { "epoch": 0.51, "learning_rate": 1.0146526550708077e-05, "loss": 21.05, "step": 47220 }, { "epoch": 0.51, "learning_rate": 1.0143025560594173e-05, "loss": 21.211, "step": 47230 }, { "epoch": 0.51, "learning_rate": 1.013952455294605e-05, "loss": 21.0076, "step": 47240 }, { "epoch": 0.51, "learning_rate": 1.013602352819291e-05, "loss": 20.8397, "step": 47250 }, { "epoch": 0.51, "learning_rate": 1.0132522486763967e-05, "loss": 20.8886, "step": 47260 }, { "epoch": 0.51, "learning_rate": 1.0129021429088426e-05, "loss": 21.3776, "step": 47270 }, { "epoch": 0.51, "learning_rate": 1.01255203555955e-05, "loss": 20.7239, "step": 47280 }, { "epoch": 0.51, "learning_rate": 1.0122019266714406e-05, "loss": 21.8891, "step": 47290 }, { "epoch": 0.51, "learning_rate": 1.0118518162874358e-05, "loss": 21.07, "step": 47300 }, { "epoch": 0.51, "learning_rate": 1.0115017044504573e-05, "loss": 21.1923, "step": 47310 }, { "epoch": 0.51, "learning_rate": 1.0111515912034273e-05, "loss": 20.9428, "step": 47320 }, { "epoch": 0.51, "learning_rate": 1.0108014765892677e-05, "loss": 21.506, "step": 47330 }, { "epoch": 0.51, "learning_rate": 1.0104513606509013e-05, "loss": 21.5884, "step": 47340 }, { "epoch": 0.51, "learning_rate": 1.0101012434312498e-05, "loss": 21.4339, "step": 47350 }, { "epoch": 0.51, "learning_rate": 1.0097511249732363e-05, "loss": 21.0453, "step": 47360 }, { "epoch": 0.51, "learning_rate": 1.0094010053197836e-05, "loss": 21.2399, "step": 47370 }, { "epoch": 0.51, "learning_rate": 1.0090508845138144e-05, "loss": 21.6775, "step": 47380 }, { "epoch": 0.51, "learning_rate": 1.008700762598252e-05, "loss": 21.212, "step": 47390 }, { "epoch": 0.51, "learning_rate": 1.0083506396160193e-05, "loss": 20.9157, "step": 47400 }, { "epoch": 0.51, "learning_rate": 1.00800051561004e-05, "loss": 21.256, "step": 47410 }, { "epoch": 0.51, "learning_rate": 1.0076503906232374e-05, "loss": 21.2012, "step": 47420 }, { "epoch": 0.51, "learning_rate": 1.007300264698535e-05, "loss": 21.8015, "step": 47430 }, { "epoch": 0.51, "learning_rate": 1.0069501378788567e-05, "loss": 21.4743, "step": 47440 }, { "epoch": 0.51, "learning_rate": 1.0066000102071258e-05, "loss": 21.426, "step": 47450 }, { "epoch": 0.51, "learning_rate": 1.0062498817262668e-05, "loss": 20.5835, "step": 47460 }, { "epoch": 0.51, "learning_rate": 1.0058997524792034e-05, "loss": 20.6805, "step": 47470 }, { "epoch": 0.51, "learning_rate": 1.0055496225088599e-05, "loss": 20.4161, "step": 47480 }, { "epoch": 0.51, "learning_rate": 1.00519949185816e-05, "loss": 21.1185, "step": 47490 }, { "epoch": 0.51, "learning_rate": 1.0048493605700287e-05, "loss": 21.8263, "step": 47500 }, { "epoch": 0.51, "learning_rate": 1.0044992286873899e-05, "loss": 20.3701, "step": 47510 }, { "epoch": 0.51, "learning_rate": 1.004149096253168e-05, "loss": 21.3195, "step": 47520 }, { "epoch": 0.51, "learning_rate": 1.0037989633102877e-05, "loss": 20.8778, "step": 47530 }, { "epoch": 0.51, "learning_rate": 1.0034488299016729e-05, "loss": 20.837, "step": 47540 }, { "epoch": 0.51, "learning_rate": 1.0030986960702496e-05, "loss": 21.7286, "step": 47550 }, { "epoch": 0.51, "learning_rate": 1.0027485618589412e-05, "loss": 21.0963, "step": 47560 }, { "epoch": 0.51, "learning_rate": 1.0023984273106726e-05, "loss": 21.3815, "step": 47570 }, { "epoch": 0.51, "learning_rate": 1.0020482924683692e-05, "loss": 21.2326, "step": 47580 }, { "epoch": 0.51, "learning_rate": 1.001698157374955e-05, "loss": 20.2676, "step": 47590 }, { "epoch": 0.51, "learning_rate": 1.0013480220733554e-05, "loss": 21.4809, "step": 47600 }, { "epoch": 0.51, "learning_rate": 1.0009978866064951e-05, "loss": 22.2225, "step": 47610 }, { "epoch": 0.51, "learning_rate": 1.0006477510172984e-05, "loss": 20.7635, "step": 47620 }, { "epoch": 0.51, "learning_rate": 1.0002976153486913e-05, "loss": 21.4536, "step": 47630 }, { "epoch": 0.52, "learning_rate": 9.999474796435975e-06, "loss": 21.4003, "step": 47640 }, { "epoch": 0.52, "learning_rate": 9.995973439449426e-06, "loss": 20.7064, "step": 47650 }, { "epoch": 0.52, "learning_rate": 9.992472082956514e-06, "loss": 21.501, "step": 47660 }, { "epoch": 0.52, "learning_rate": 9.98897072738649e-06, "loss": 21.3872, "step": 47670 }, { "epoch": 0.52, "learning_rate": 9.985469373168598e-06, "loss": 21.0562, "step": 47680 }, { "epoch": 0.52, "learning_rate": 9.981968020732083e-06, "loss": 22.1322, "step": 47690 }, { "epoch": 0.52, "learning_rate": 9.978466670506204e-06, "loss": 21.2693, "step": 47700 }, { "epoch": 0.52, "learning_rate": 9.974965322920203e-06, "loss": 21.0996, "step": 47710 }, { "epoch": 0.52, "learning_rate": 9.971463978403327e-06, "loss": 21.6799, "step": 47720 }, { "epoch": 0.52, "learning_rate": 9.96796263738483e-06, "loss": 20.8457, "step": 47730 }, { "epoch": 0.52, "learning_rate": 9.964461300293947e-06, "loss": 21.3355, "step": 47740 }, { "epoch": 0.52, "learning_rate": 9.960959967559935e-06, "loss": 21.593, "step": 47750 }, { "epoch": 0.52, "learning_rate": 9.957458639612035e-06, "loss": 20.8678, "step": 47760 }, { "epoch": 0.52, "learning_rate": 9.953957316879495e-06, "loss": 21.1624, "step": 47770 }, { "epoch": 0.52, "learning_rate": 9.95045599979156e-06, "loss": 21.8496, "step": 47780 }, { "epoch": 0.52, "learning_rate": 9.94695468877747e-06, "loss": 21.2626, "step": 47790 }, { "epoch": 0.52, "learning_rate": 9.94345338426647e-06, "loss": 21.3936, "step": 47800 }, { "epoch": 0.52, "learning_rate": 9.939952086687805e-06, "loss": 21.1056, "step": 47810 }, { "epoch": 0.52, "learning_rate": 9.936450796470712e-06, "loss": 20.9564, "step": 47820 }, { "epoch": 0.52, "learning_rate": 9.93294951404444e-06, "loss": 20.4344, "step": 47830 }, { "epoch": 0.52, "learning_rate": 9.929448239838217e-06, "loss": 20.5786, "step": 47840 }, { "epoch": 0.52, "learning_rate": 9.92594697428129e-06, "loss": 21.5172, "step": 47850 }, { "epoch": 0.52, "learning_rate": 9.922445717802897e-06, "loss": 20.7168, "step": 47860 }, { "epoch": 0.52, "learning_rate": 9.91894447083227e-06, "loss": 21.0164, "step": 47870 }, { "epoch": 0.52, "learning_rate": 9.915443233798645e-06, "loss": 21.2249, "step": 47880 }, { "epoch": 0.52, "learning_rate": 9.911942007131263e-06, "loss": 21.1455, "step": 47890 }, { "epoch": 0.52, "learning_rate": 9.908440791259349e-06, "loss": 21.3581, "step": 47900 }, { "epoch": 0.52, "learning_rate": 9.904939586612136e-06, "loss": 21.7985, "step": 47910 }, { "epoch": 0.52, "learning_rate": 9.901438393618859e-06, "loss": 21.4385, "step": 47920 }, { "epoch": 0.52, "learning_rate": 9.89793721270874e-06, "loss": 20.8299, "step": 47930 }, { "epoch": 0.52, "learning_rate": 9.894436044311014e-06, "loss": 21.4324, "step": 47940 }, { "epoch": 0.52, "learning_rate": 9.8909348888549e-06, "loss": 21.0499, "step": 47950 }, { "epoch": 0.52, "learning_rate": 9.887433746769625e-06, "loss": 21.4828, "step": 47960 }, { "epoch": 0.52, "learning_rate": 9.883932618484411e-06, "loss": 20.7942, "step": 47970 }, { "epoch": 0.52, "learning_rate": 9.880431504428477e-06, "loss": 21.9176, "step": 47980 }, { "epoch": 0.52, "learning_rate": 9.876930405031047e-06, "loss": 22.7775, "step": 47990 }, { "epoch": 0.52, "learning_rate": 9.873429320721338e-06, "loss": 20.6365, "step": 48000 }, { "epoch": 0.52, "learning_rate": 9.869928251928561e-06, "loss": 21.693, "step": 48010 }, { "epoch": 0.52, "learning_rate": 9.866427199081931e-06, "loss": 20.4638, "step": 48020 }, { "epoch": 0.52, "learning_rate": 9.86292616261066e-06, "loss": 22.0423, "step": 48030 }, { "epoch": 0.52, "learning_rate": 9.85942514294396e-06, "loss": 21.0269, "step": 48040 }, { "epoch": 0.52, "learning_rate": 9.855924140511037e-06, "loss": 21.2298, "step": 48050 }, { "epoch": 0.52, "learning_rate": 9.852423155741094e-06, "loss": 21.5683, "step": 48060 }, { "epoch": 0.52, "learning_rate": 9.848922189063337e-06, "loss": 21.4204, "step": 48070 }, { "epoch": 0.52, "learning_rate": 9.845421240906965e-06, "loss": 21.4742, "step": 48080 }, { "epoch": 0.52, "learning_rate": 9.841920311701178e-06, "loss": 21.6056, "step": 48090 }, { "epoch": 0.52, "learning_rate": 9.838419401875177e-06, "loss": 21.9652, "step": 48100 }, { "epoch": 0.52, "learning_rate": 9.834918511858148e-06, "loss": 21.2626, "step": 48110 }, { "epoch": 0.52, "learning_rate": 9.831417642079286e-06, "loss": 20.7416, "step": 48120 }, { "epoch": 0.52, "learning_rate": 9.82791679296778e-06, "loss": 21.5421, "step": 48130 }, { "epoch": 0.52, "learning_rate": 9.824415964952818e-06, "loss": 21.0023, "step": 48140 }, { "epoch": 0.52, "learning_rate": 9.820915158463583e-06, "loss": 21.449, "step": 48150 }, { "epoch": 0.52, "learning_rate": 9.817414373929261e-06, "loss": 21.2368, "step": 48160 }, { "epoch": 0.52, "learning_rate": 9.813913611779021e-06, "loss": 21.6403, "step": 48170 }, { "epoch": 0.52, "learning_rate": 9.810412872442045e-06, "loss": 20.9548, "step": 48180 }, { "epoch": 0.52, "learning_rate": 9.806912156347505e-06, "loss": 20.9365, "step": 48190 }, { "epoch": 0.52, "learning_rate": 9.803411463924575e-06, "loss": 20.839, "step": 48200 }, { "epoch": 0.52, "learning_rate": 9.79991079560242e-06, "loss": 21.455, "step": 48210 }, { "epoch": 0.52, "learning_rate": 9.7964101518102e-06, "loss": 21.3527, "step": 48220 }, { "epoch": 0.52, "learning_rate": 9.79290953297708e-06, "loss": 20.6142, "step": 48230 }, { "epoch": 0.52, "learning_rate": 9.78940893953222e-06, "loss": 21.5774, "step": 48240 }, { "epoch": 0.52, "learning_rate": 9.785908371904775e-06, "loss": 20.9728, "step": 48250 }, { "epoch": 0.52, "learning_rate": 9.782407830523893e-06, "loss": 21.2157, "step": 48260 }, { "epoch": 0.52, "learning_rate": 9.778907315818733e-06, "loss": 21.0692, "step": 48270 }, { "epoch": 0.52, "learning_rate": 9.775406828218427e-06, "loss": 21.2419, "step": 48280 }, { "epoch": 0.52, "learning_rate": 9.771906368152125e-06, "loss": 21.2545, "step": 48290 }, { "epoch": 0.52, "learning_rate": 9.768405936048968e-06, "loss": 20.7541, "step": 48300 }, { "epoch": 0.52, "learning_rate": 9.764905532338084e-06, "loss": 21.2411, "step": 48310 }, { "epoch": 0.52, "learning_rate": 9.761405157448615e-06, "loss": 21.5786, "step": 48320 }, { "epoch": 0.52, "learning_rate": 9.75790481180968e-06, "loss": 21.2498, "step": 48330 }, { "epoch": 0.52, "learning_rate": 9.754404495850408e-06, "loss": 20.8107, "step": 48340 }, { "epoch": 0.52, "learning_rate": 9.750904209999921e-06, "loss": 21.354, "step": 48350 }, { "epoch": 0.52, "learning_rate": 9.747403954687334e-06, "loss": 20.8466, "step": 48360 }, { "epoch": 0.52, "learning_rate": 9.74390373034177e-06, "loss": 21.3072, "step": 48370 }, { "epoch": 0.52, "learning_rate": 9.740403537392324e-06, "loss": 21.256, "step": 48380 }, { "epoch": 0.52, "learning_rate": 9.736903376268112e-06, "loss": 21.3486, "step": 48390 }, { "epoch": 0.52, "learning_rate": 9.733403247398236e-06, "loss": 20.7047, "step": 48400 }, { "epoch": 0.52, "learning_rate": 9.729903151211788e-06, "loss": 21.5775, "step": 48410 }, { "epoch": 0.52, "learning_rate": 9.72640308813787e-06, "loss": 20.9001, "step": 48420 }, { "epoch": 0.52, "learning_rate": 9.722903058605572e-06, "loss": 20.8223, "step": 48430 }, { "epoch": 0.52, "learning_rate": 9.719403063043973e-06, "loss": 21.5489, "step": 48440 }, { "epoch": 0.52, "learning_rate": 9.715903101882163e-06, "loss": 21.122, "step": 48450 }, { "epoch": 0.52, "learning_rate": 9.712403175549212e-06, "loss": 20.9328, "step": 48460 }, { "epoch": 0.52, "learning_rate": 9.708903284474199e-06, "loss": 21.0961, "step": 48470 }, { "epoch": 0.52, "learning_rate": 9.705403429086195e-06, "loss": 21.6413, "step": 48480 }, { "epoch": 0.52, "learning_rate": 9.70190360981426e-06, "loss": 20.2255, "step": 48490 }, { "epoch": 0.52, "learning_rate": 9.698403827087454e-06, "loss": 21.8716, "step": 48500 }, { "epoch": 0.52, "learning_rate": 9.694904081334835e-06, "loss": 21.4765, "step": 48510 }, { "epoch": 0.52, "learning_rate": 9.691404372985455e-06, "loss": 22.5527, "step": 48520 }, { "epoch": 0.52, "learning_rate": 9.687904702468362e-06, "loss": 21.589, "step": 48530 }, { "epoch": 0.52, "learning_rate": 9.684405070212598e-06, "loss": 21.5105, "step": 48540 }, { "epoch": 0.52, "learning_rate": 9.680905476647194e-06, "loss": 21.7507, "step": 48550 }, { "epoch": 0.52, "learning_rate": 9.677405922201189e-06, "loss": 21.5467, "step": 48560 }, { "epoch": 0.53, "learning_rate": 9.67390640730361e-06, "loss": 21.9262, "step": 48570 }, { "epoch": 0.53, "learning_rate": 9.670406932383478e-06, "loss": 21.0924, "step": 48580 }, { "epoch": 0.53, "learning_rate": 9.666907497869817e-06, "loss": 20.8346, "step": 48590 }, { "epoch": 0.53, "learning_rate": 9.663408104191632e-06, "loss": 20.6294, "step": 48600 }, { "epoch": 0.53, "learning_rate": 9.659908751777935e-06, "loss": 21.2896, "step": 48610 }, { "epoch": 0.53, "learning_rate": 9.65640944105773e-06, "loss": 21.1856, "step": 48620 }, { "epoch": 0.53, "learning_rate": 9.652910172460016e-06, "loss": 21.3514, "step": 48630 }, { "epoch": 0.53, "learning_rate": 9.649410946413785e-06, "loss": 21.8032, "step": 48640 }, { "epoch": 0.53, "learning_rate": 9.645911763348022e-06, "loss": 21.4363, "step": 48650 }, { "epoch": 0.53, "learning_rate": 9.642412623691708e-06, "loss": 21.6631, "step": 48660 }, { "epoch": 0.53, "learning_rate": 9.638913527873827e-06, "loss": 21.197, "step": 48670 }, { "epoch": 0.53, "learning_rate": 9.635414476323346e-06, "loss": 21.433, "step": 48680 }, { "epoch": 0.53, "learning_rate": 9.63191546946923e-06, "loss": 21.4609, "step": 48690 }, { "epoch": 0.53, "learning_rate": 9.62841650774045e-06, "loss": 21.1976, "step": 48700 }, { "epoch": 0.53, "learning_rate": 9.624917591565947e-06, "loss": 21.2127, "step": 48710 }, { "epoch": 0.53, "learning_rate": 9.621418721374678e-06, "loss": 21.4031, "step": 48720 }, { "epoch": 0.53, "learning_rate": 9.617919897595586e-06, "loss": 21.905, "step": 48730 }, { "epoch": 0.53, "learning_rate": 9.614421120657607e-06, "loss": 22.3541, "step": 48740 }, { "epoch": 0.53, "learning_rate": 9.610922390989685e-06, "loss": 21.2171, "step": 48750 }, { "epoch": 0.53, "learning_rate": 9.607423709020728e-06, "loss": 21.5661, "step": 48760 }, { "epoch": 0.53, "learning_rate": 9.603925075179671e-06, "loss": 21.5031, "step": 48770 }, { "epoch": 0.53, "learning_rate": 9.600426489895425e-06, "loss": 21.4914, "step": 48780 }, { "epoch": 0.53, "learning_rate": 9.596927953596895e-06, "loss": 21.1395, "step": 48790 }, { "epoch": 0.53, "learning_rate": 9.593429466712997e-06, "loss": 21.1319, "step": 48800 }, { "epoch": 0.53, "learning_rate": 9.58993102967261e-06, "loss": 20.8912, "step": 48810 }, { "epoch": 0.53, "learning_rate": 9.586432642904639e-06, "loss": 20.7503, "step": 48820 }, { "epoch": 0.53, "learning_rate": 9.582934306837962e-06, "loss": 21.5051, "step": 48830 }, { "epoch": 0.53, "learning_rate": 9.579436021901458e-06, "loss": 21.1506, "step": 48840 }, { "epoch": 0.53, "learning_rate": 9.575937788524003e-06, "loss": 20.9559, "step": 48850 }, { "epoch": 0.53, "learning_rate": 9.572439607134463e-06, "loss": 22.0831, "step": 48860 }, { "epoch": 0.53, "learning_rate": 9.568941478161693e-06, "loss": 21.4238, "step": 48870 }, { "epoch": 0.53, "learning_rate": 9.565443402034548e-06, "loss": 21.2163, "step": 48880 }, { "epoch": 0.53, "learning_rate": 9.561945379181873e-06, "loss": 21.0649, "step": 48890 }, { "epoch": 0.53, "learning_rate": 9.558447410032512e-06, "loss": 22.0205, "step": 48900 }, { "epoch": 0.53, "learning_rate": 9.5549494950153e-06, "loss": 21.2045, "step": 48910 }, { "epoch": 0.53, "learning_rate": 9.551451634559058e-06, "loss": 21.262, "step": 48920 }, { "epoch": 0.53, "learning_rate": 9.54795382909261e-06, "loss": 21.6585, "step": 48930 }, { "epoch": 0.53, "learning_rate": 9.544456079044765e-06, "loss": 21.5173, "step": 48940 }, { "epoch": 0.53, "learning_rate": 9.540958384844336e-06, "loss": 20.8161, "step": 48950 }, { "epoch": 0.53, "learning_rate": 9.537460746920121e-06, "loss": 20.4751, "step": 48960 }, { "epoch": 0.53, "learning_rate": 9.533963165700913e-06, "loss": 21.1643, "step": 48970 }, { "epoch": 0.53, "learning_rate": 9.530465641615496e-06, "loss": 21.9321, "step": 48980 }, { "epoch": 0.53, "learning_rate": 9.526968175092648e-06, "loss": 21.407, "step": 48990 }, { "epoch": 0.53, "learning_rate": 9.523470766561145e-06, "loss": 20.94, "step": 49000 }, { "epoch": 0.53, "learning_rate": 9.519973416449749e-06, "loss": 21.0079, "step": 49010 }, { "epoch": 0.53, "learning_rate": 9.516476125187221e-06, "loss": 21.574, "step": 49020 }, { "epoch": 0.53, "learning_rate": 9.512978893202308e-06, "loss": 20.5181, "step": 49030 }, { "epoch": 0.53, "learning_rate": 9.509481720923752e-06, "loss": 21.5086, "step": 49040 }, { "epoch": 0.53, "learning_rate": 9.505984608780294e-06, "loss": 20.2499, "step": 49050 }, { "epoch": 0.53, "learning_rate": 9.502487557200658e-06, "loss": 20.8274, "step": 49060 }, { "epoch": 0.53, "learning_rate": 9.49899056661357e-06, "loss": 20.7982, "step": 49070 }, { "epoch": 0.53, "learning_rate": 9.495493637447738e-06, "loss": 21.3807, "step": 49080 }, { "epoch": 0.53, "learning_rate": 9.491996770131868e-06, "loss": 21.7886, "step": 49090 }, { "epoch": 0.53, "learning_rate": 9.488499965094664e-06, "loss": 21.0407, "step": 49100 }, { "epoch": 0.53, "learning_rate": 9.485003222764813e-06, "loss": 21.2497, "step": 49110 }, { "epoch": 0.53, "learning_rate": 9.481506543571e-06, "loss": 21.798, "step": 49120 }, { "epoch": 0.53, "learning_rate": 9.478009927941901e-06, "loss": 21.3875, "step": 49130 }, { "epoch": 0.53, "learning_rate": 9.47451337630618e-06, "loss": 21.6097, "step": 49140 }, { "epoch": 0.53, "learning_rate": 9.471016889092497e-06, "loss": 21.6201, "step": 49150 }, { "epoch": 0.53, "learning_rate": 9.467520466729508e-06, "loss": 21.0578, "step": 49160 }, { "epoch": 0.53, "learning_rate": 9.464024109645854e-06, "loss": 21.446, "step": 49170 }, { "epoch": 0.53, "learning_rate": 9.460527818270174e-06, "loss": 21.7107, "step": 49180 }, { "epoch": 0.53, "learning_rate": 9.457031593031091e-06, "loss": 20.7364, "step": 49190 }, { "epoch": 0.53, "learning_rate": 9.453535434357226e-06, "loss": 21.2163, "step": 49200 }, { "epoch": 0.53, "learning_rate": 9.450039342677193e-06, "loss": 21.2233, "step": 49210 }, { "epoch": 0.53, "learning_rate": 9.446543318419596e-06, "loss": 21.2097, "step": 49220 }, { "epoch": 0.53, "learning_rate": 9.443047362013026e-06, "loss": 21.5207, "step": 49230 }, { "epoch": 0.53, "learning_rate": 9.43955147388608e-06, "loss": 21.6481, "step": 49240 }, { "epoch": 0.53, "learning_rate": 9.43605565446732e-06, "loss": 21.3333, "step": 49250 }, { "epoch": 0.53, "learning_rate": 9.432559904185328e-06, "loss": 21.2896, "step": 49260 }, { "epoch": 0.53, "learning_rate": 9.429064223468663e-06, "loss": 21.4538, "step": 49270 }, { "epoch": 0.53, "learning_rate": 9.425568612745873e-06, "loss": 21.0912, "step": 49280 }, { "epoch": 0.53, "learning_rate": 9.422073072445515e-06, "loss": 20.8726, "step": 49290 }, { "epoch": 0.53, "learning_rate": 9.418577602996111e-06, "loss": 20.8187, "step": 49300 }, { "epoch": 0.53, "learning_rate": 9.415082204826195e-06, "loss": 21.2816, "step": 49310 }, { "epoch": 0.53, "learning_rate": 9.411586878364284e-06, "loss": 21.4045, "step": 49320 }, { "epoch": 0.53, "learning_rate": 9.408091624038885e-06, "loss": 21.0126, "step": 49330 }, { "epoch": 0.53, "learning_rate": 9.40459644227851e-06, "loss": 21.0725, "step": 49340 }, { "epoch": 0.53, "learning_rate": 9.401101333511633e-06, "loss": 21.9383, "step": 49350 }, { "epoch": 0.53, "learning_rate": 9.397606298166752e-06, "loss": 20.573, "step": 49360 }, { "epoch": 0.53, "learning_rate": 9.394111336672334e-06, "loss": 20.5132, "step": 49370 }, { "epoch": 0.53, "learning_rate": 9.39061644945684e-06, "loss": 20.5467, "step": 49380 }, { "epoch": 0.53, "learning_rate": 9.387121636948737e-06, "loss": 21.2623, "step": 49390 }, { "epoch": 0.53, "learning_rate": 9.383626899576465e-06, "loss": 21.1331, "step": 49400 }, { "epoch": 0.53, "learning_rate": 9.380132237768461e-06, "loss": 21.5282, "step": 49410 }, { "epoch": 0.53, "learning_rate": 9.376637651953154e-06, "loss": 20.9977, "step": 49420 }, { "epoch": 0.53, "learning_rate": 9.37314314255896e-06, "loss": 20.5234, "step": 49430 }, { "epoch": 0.53, "learning_rate": 9.369648710014291e-06, "loss": 20.5333, "step": 49440 }, { "epoch": 0.53, "learning_rate": 9.366154354747552e-06, "loss": 20.8713, "step": 49450 }, { "epoch": 0.53, "learning_rate": 9.362660077187127e-06, "loss": 21.3509, "step": 49460 }, { "epoch": 0.53, "learning_rate": 9.359165877761396e-06, "loss": 21.0169, "step": 49470 }, { "epoch": 0.53, "learning_rate": 9.355671756898733e-06, "loss": 20.927, "step": 49480 }, { "epoch": 0.54, "learning_rate": 9.352177715027501e-06, "loss": 21.5453, "step": 49490 }, { "epoch": 0.54, "learning_rate": 9.348683752576054e-06, "loss": 21.663, "step": 49500 }, { "epoch": 0.54, "learning_rate": 9.345189869972729e-06, "loss": 21.8023, "step": 49510 }, { "epoch": 0.54, "learning_rate": 9.34169606764586e-06, "loss": 21.5264, "step": 49520 }, { "epoch": 0.54, "learning_rate": 9.33820234602377e-06, "loss": 20.883, "step": 49530 }, { "epoch": 0.54, "learning_rate": 9.334708705534775e-06, "loss": 21.2609, "step": 49540 }, { "epoch": 0.54, "learning_rate": 9.331215146607174e-06, "loss": 20.4843, "step": 49550 }, { "epoch": 0.54, "learning_rate": 9.327721669669262e-06, "loss": 21.2521, "step": 49560 }, { "epoch": 0.54, "learning_rate": 9.324228275149322e-06, "loss": 20.9083, "step": 49570 }, { "epoch": 0.54, "learning_rate": 9.320734963475622e-06, "loss": 21.204, "step": 49580 }, { "epoch": 0.54, "learning_rate": 9.317241735076432e-06, "loss": 20.5907, "step": 49590 }, { "epoch": 0.54, "learning_rate": 9.31374859038e-06, "loss": 21.1528, "step": 49600 }, { "epoch": 0.54, "learning_rate": 9.310255529814572e-06, "loss": 20.9289, "step": 49610 }, { "epoch": 0.54, "learning_rate": 9.306762553808374e-06, "loss": 21.1451, "step": 49620 }, { "epoch": 0.54, "learning_rate": 9.303269662789628e-06, "loss": 21.5514, "step": 49630 }, { "epoch": 0.54, "learning_rate": 9.29977685718655e-06, "loss": 21.3024, "step": 49640 }, { "epoch": 0.54, "learning_rate": 9.296284137427339e-06, "loss": 21.2942, "step": 49650 }, { "epoch": 0.54, "learning_rate": 9.292791503940179e-06, "loss": 20.8912, "step": 49660 }, { "epoch": 0.54, "learning_rate": 9.289298957153263e-06, "loss": 21.1834, "step": 49670 }, { "epoch": 0.54, "learning_rate": 9.285806497494744e-06, "loss": 21.7993, "step": 49680 }, { "epoch": 0.54, "learning_rate": 9.28231412539279e-06, "loss": 21.9885, "step": 49690 }, { "epoch": 0.54, "learning_rate": 9.278821841275545e-06, "loss": 20.9513, "step": 49700 }, { "epoch": 0.54, "learning_rate": 9.275329645571143e-06, "loss": 20.2538, "step": 49710 }, { "epoch": 0.54, "learning_rate": 9.271837538707723e-06, "loss": 21.6556, "step": 49720 }, { "epoch": 0.54, "learning_rate": 9.26834552111338e-06, "loss": 20.3228, "step": 49730 }, { "epoch": 0.54, "learning_rate": 9.264853593216233e-06, "loss": 21.4922, "step": 49740 }, { "epoch": 0.54, "learning_rate": 9.261361755444366e-06, "loss": 21.7533, "step": 49750 }, { "epoch": 0.54, "learning_rate": 9.257870008225867e-06, "loss": 21.4784, "step": 49760 }, { "epoch": 0.54, "learning_rate": 9.254378351988809e-06, "loss": 20.8323, "step": 49770 }, { "epoch": 0.54, "learning_rate": 9.250886787161241e-06, "loss": 20.905, "step": 49780 }, { "epoch": 0.54, "learning_rate": 9.247395314171219e-06, "loss": 21.44, "step": 49790 }, { "epoch": 0.54, "learning_rate": 9.24390393344678e-06, "loss": 20.5721, "step": 49800 }, { "epoch": 0.54, "learning_rate": 9.240412645415946e-06, "loss": 20.9072, "step": 49810 }, { "epoch": 0.54, "learning_rate": 9.236921450506737e-06, "loss": 22.1913, "step": 49820 }, { "epoch": 0.54, "learning_rate": 9.233430349147156e-06, "loss": 21.7338, "step": 49830 }, { "epoch": 0.54, "learning_rate": 9.229939341765188e-06, "loss": 21.3803, "step": 49840 }, { "epoch": 0.54, "learning_rate": 9.226448428788818e-06, "loss": 21.7661, "step": 49850 }, { "epoch": 0.54, "learning_rate": 9.222957610646011e-06, "loss": 21.0311, "step": 49860 }, { "epoch": 0.54, "learning_rate": 9.21946688776473e-06, "loss": 20.7604, "step": 49870 }, { "epoch": 0.54, "learning_rate": 9.215976260572917e-06, "loss": 21.5654, "step": 49880 }, { "epoch": 0.54, "learning_rate": 9.212485729498504e-06, "loss": 22.1489, "step": 49890 }, { "epoch": 0.54, "learning_rate": 9.208995294969414e-06, "loss": 22.5474, "step": 49900 }, { "epoch": 0.54, "learning_rate": 9.205504957413554e-06, "loss": 21.6614, "step": 49910 }, { "epoch": 0.54, "learning_rate": 9.202014717258827e-06, "loss": 21.779, "step": 49920 }, { "epoch": 0.54, "learning_rate": 9.198524574933117e-06, "loss": 21.9952, "step": 49930 }, { "epoch": 0.54, "learning_rate": 9.1950345308643e-06, "loss": 21.2301, "step": 49940 }, { "epoch": 0.54, "learning_rate": 9.191544585480234e-06, "loss": 20.893, "step": 49950 }, { "epoch": 0.54, "learning_rate": 9.188054739208769e-06, "loss": 22.3313, "step": 49960 }, { "epoch": 0.54, "learning_rate": 9.184564992477745e-06, "loss": 21.6316, "step": 49970 }, { "epoch": 0.54, "learning_rate": 9.181075345714987e-06, "loss": 20.8582, "step": 49980 }, { "epoch": 0.54, "learning_rate": 9.177585799348312e-06, "loss": 21.5452, "step": 49990 }, { "epoch": 0.54, "learning_rate": 9.174096353805515e-06, "loss": 20.7344, "step": 50000 }, { "epoch": 0.54, "learning_rate": 9.170607009514383e-06, "loss": 20.868, "step": 50010 }, { "epoch": 0.54, "learning_rate": 9.1671177669027e-06, "loss": 21.3615, "step": 50020 }, { "epoch": 0.54, "learning_rate": 9.163628626398225e-06, "loss": 21.0057, "step": 50030 }, { "epoch": 0.54, "learning_rate": 9.160139588428712e-06, "loss": 21.3468, "step": 50040 }, { "epoch": 0.54, "learning_rate": 9.156650653421896e-06, "loss": 21.5268, "step": 50050 }, { "epoch": 0.54, "learning_rate": 9.153161821805505e-06, "loss": 21.1873, "step": 50060 }, { "epoch": 0.54, "learning_rate": 9.149673094007251e-06, "loss": 21.5414, "step": 50070 }, { "epoch": 0.54, "learning_rate": 9.146184470454837e-06, "loss": 21.1675, "step": 50080 }, { "epoch": 0.54, "learning_rate": 9.142695951575947e-06, "loss": 21.0733, "step": 50090 }, { "epoch": 0.54, "learning_rate": 9.139207537798265e-06, "loss": 20.7098, "step": 50100 }, { "epoch": 0.54, "learning_rate": 9.135719229549442e-06, "loss": 21.8322, "step": 50110 }, { "epoch": 0.54, "learning_rate": 9.132231027257133e-06, "loss": 22.1752, "step": 50120 }, { "epoch": 0.54, "learning_rate": 9.128742931348973e-06, "loss": 21.4932, "step": 50130 }, { "epoch": 0.54, "learning_rate": 9.125254942252586e-06, "loss": 21.1233, "step": 50140 }, { "epoch": 0.54, "learning_rate": 9.121767060395583e-06, "loss": 20.7596, "step": 50150 }, { "epoch": 0.54, "learning_rate": 9.118279286205556e-06, "loss": 21.7448, "step": 50160 }, { "epoch": 0.54, "learning_rate": 9.114791620110093e-06, "loss": 21.5077, "step": 50170 }, { "epoch": 0.54, "learning_rate": 9.111304062536764e-06, "loss": 20.9297, "step": 50180 }, { "epoch": 0.54, "learning_rate": 9.107816613913126e-06, "loss": 21.3293, "step": 50190 }, { "epoch": 0.54, "learning_rate": 9.10432927466672e-06, "loss": 21.0459, "step": 50200 }, { "epoch": 0.54, "learning_rate": 9.100842045225084e-06, "loss": 21.2956, "step": 50210 }, { "epoch": 0.54, "learning_rate": 9.097354926015727e-06, "loss": 21.4912, "step": 50220 }, { "epoch": 0.54, "learning_rate": 9.093867917466155e-06, "loss": 21.2582, "step": 50230 }, { "epoch": 0.54, "learning_rate": 9.09038102000386e-06, "loss": 21.3236, "step": 50240 }, { "epoch": 0.54, "learning_rate": 9.086894234056313e-06, "loss": 21.5421, "step": 50250 }, { "epoch": 0.54, "learning_rate": 9.083407560050984e-06, "loss": 20.899, "step": 50260 }, { "epoch": 0.54, "learning_rate": 9.079920998415317e-06, "loss": 21.791, "step": 50270 }, { "epoch": 0.54, "learning_rate": 9.076434549576746e-06, "loss": 20.0081, "step": 50280 }, { "epoch": 0.54, "learning_rate": 9.072948213962696e-06, "loss": 21.2553, "step": 50290 }, { "epoch": 0.54, "learning_rate": 9.06946199200057e-06, "loss": 20.8547, "step": 50300 }, { "epoch": 0.54, "learning_rate": 9.065975884117767e-06, "loss": 21.637, "step": 50310 }, { "epoch": 0.54, "learning_rate": 9.062489890741662e-06, "loss": 21.0674, "step": 50320 }, { "epoch": 0.54, "learning_rate": 9.059004012299622e-06, "loss": 21.6813, "step": 50330 }, { "epoch": 0.54, "learning_rate": 9.055518249218998e-06, "loss": 21.1371, "step": 50340 }, { "epoch": 0.54, "learning_rate": 9.052032601927125e-06, "loss": 21.1078, "step": 50350 }, { "epoch": 0.54, "learning_rate": 9.04854707085133e-06, "loss": 21.8595, "step": 50360 }, { "epoch": 0.54, "learning_rate": 9.045061656418922e-06, "loss": 21.3941, "step": 50370 }, { "epoch": 0.54, "learning_rate": 9.041576359057193e-06, "loss": 21.788, "step": 50380 }, { "epoch": 0.54, "learning_rate": 9.038091179193423e-06, "loss": 21.9845, "step": 50390 }, { "epoch": 0.54, "learning_rate": 9.034606117254874e-06, "loss": 22.1667, "step": 50400 }, { "epoch": 0.54, "learning_rate": 9.031121173668805e-06, "loss": 21.3392, "step": 50410 }, { "epoch": 0.55, "learning_rate": 9.027636348862452e-06, "loss": 20.9644, "step": 50420 }, { "epoch": 0.55, "learning_rate": 9.02415164326303e-06, "loss": 21.7813, "step": 50430 }, { "epoch": 0.55, "learning_rate": 9.020667057297753e-06, "loss": 21.3182, "step": 50440 }, { "epoch": 0.55, "learning_rate": 9.017182591393808e-06, "loss": 20.7978, "step": 50450 }, { "epoch": 0.55, "learning_rate": 9.013698245978379e-06, "loss": 21.0578, "step": 50460 }, { "epoch": 0.55, "learning_rate": 9.010214021478632e-06, "loss": 21.5957, "step": 50470 }, { "epoch": 0.55, "learning_rate": 9.006729918321706e-06, "loss": 21.9503, "step": 50480 }, { "epoch": 0.55, "learning_rate": 9.00324593693474e-06, "loss": 20.9524, "step": 50490 }, { "epoch": 0.55, "learning_rate": 8.999762077744849e-06, "loss": 20.5563, "step": 50500 }, { "epoch": 0.55, "learning_rate": 8.996278341179144e-06, "loss": 21.3229, "step": 50510 }, { "epoch": 0.55, "learning_rate": 8.992794727664707e-06, "loss": 21.4248, "step": 50520 }, { "epoch": 0.55, "learning_rate": 8.98931123762862e-06, "loss": 20.9602, "step": 50530 }, { "epoch": 0.55, "learning_rate": 8.98582787149793e-06, "loss": 21.1567, "step": 50540 }, { "epoch": 0.55, "learning_rate": 8.982344629699686e-06, "loss": 21.3406, "step": 50550 }, { "epoch": 0.55, "learning_rate": 8.978861512660918e-06, "loss": 21.9291, "step": 50560 }, { "epoch": 0.55, "learning_rate": 8.975378520808637e-06, "loss": 20.3725, "step": 50570 }, { "epoch": 0.55, "learning_rate": 8.971895654569842e-06, "loss": 21.0432, "step": 50580 }, { "epoch": 0.55, "learning_rate": 8.96841291437151e-06, "loss": 21.5289, "step": 50590 }, { "epoch": 0.55, "learning_rate": 8.964930300640612e-06, "loss": 21.0111, "step": 50600 }, { "epoch": 0.55, "learning_rate": 8.9614478138041e-06, "loss": 20.7207, "step": 50610 }, { "epoch": 0.55, "learning_rate": 8.957965454288907e-06, "loss": 21.0179, "step": 50620 }, { "epoch": 0.55, "learning_rate": 8.954483222521951e-06, "loss": 21.0461, "step": 50630 }, { "epoch": 0.55, "learning_rate": 8.951001118930143e-06, "loss": 20.8267, "step": 50640 }, { "epoch": 0.55, "learning_rate": 8.947519143940365e-06, "loss": 21.6204, "step": 50650 }, { "epoch": 0.55, "learning_rate": 8.944037297979491e-06, "loss": 20.5867, "step": 50660 }, { "epoch": 0.55, "learning_rate": 8.94055558147438e-06, "loss": 21.5426, "step": 50670 }, { "epoch": 0.55, "learning_rate": 8.937073994851871e-06, "loss": 21.828, "step": 50680 }, { "epoch": 0.55, "learning_rate": 8.933592538538796e-06, "loss": 21.9414, "step": 50690 }, { "epoch": 0.55, "learning_rate": 8.930111212961951e-06, "loss": 21.1726, "step": 50700 }, { "epoch": 0.55, "learning_rate": 8.92663001854814e-06, "loss": 20.3166, "step": 50710 }, { "epoch": 0.55, "learning_rate": 8.923148955724136e-06, "loss": 21.4473, "step": 50720 }, { "epoch": 0.55, "learning_rate": 8.9196680249167e-06, "loss": 21.1812, "step": 50730 }, { "epoch": 0.55, "learning_rate": 8.916187226552583e-06, "loss": 21.0964, "step": 50740 }, { "epoch": 0.55, "learning_rate": 8.912706561058502e-06, "loss": 20.7481, "step": 50750 }, { "epoch": 0.55, "learning_rate": 8.909226028861176e-06, "loss": 21.1965, "step": 50760 }, { "epoch": 0.55, "learning_rate": 8.905745630387301e-06, "loss": 20.9351, "step": 50770 }, { "epoch": 0.55, "learning_rate": 8.902265366063552e-06, "loss": 20.9428, "step": 50780 }, { "epoch": 0.55, "learning_rate": 8.898785236316601e-06, "loss": 21.2898, "step": 50790 }, { "epoch": 0.55, "learning_rate": 8.895305241573088e-06, "loss": 21.1252, "step": 50800 }, { "epoch": 0.55, "learning_rate": 8.891825382259644e-06, "loss": 21.1136, "step": 50810 }, { "epoch": 0.55, "learning_rate": 8.88834565880288e-06, "loss": 21.2094, "step": 50820 }, { "epoch": 0.55, "learning_rate": 8.884866071629396e-06, "loss": 21.1348, "step": 50830 }, { "epoch": 0.55, "learning_rate": 8.881386621165774e-06, "loss": 20.8816, "step": 50840 }, { "epoch": 0.55, "learning_rate": 8.877907307838574e-06, "loss": 22.1609, "step": 50850 }, { "epoch": 0.55, "learning_rate": 8.874428132074343e-06, "loss": 21.135, "step": 50860 }, { "epoch": 0.55, "learning_rate": 8.87094909429961e-06, "loss": 20.9696, "step": 50870 }, { "epoch": 0.55, "learning_rate": 8.867470194940886e-06, "loss": 21.2958, "step": 50880 }, { "epoch": 0.55, "learning_rate": 8.863991434424671e-06, "loss": 21.1517, "step": 50890 }, { "epoch": 0.55, "learning_rate": 8.860512813177444e-06, "loss": 21.5556, "step": 50900 }, { "epoch": 0.55, "learning_rate": 8.857034331625665e-06, "loss": 21.9581, "step": 50910 }, { "epoch": 0.55, "learning_rate": 8.853555990195774e-06, "loss": 21.3889, "step": 50920 }, { "epoch": 0.55, "learning_rate": 8.850077789314202e-06, "loss": 21.0143, "step": 50930 }, { "epoch": 0.55, "learning_rate": 8.846599729407362e-06, "loss": 21.2575, "step": 50940 }, { "epoch": 0.55, "learning_rate": 8.843121810901643e-06, "loss": 21.402, "step": 50950 }, { "epoch": 0.55, "learning_rate": 8.839644034223424e-06, "loss": 20.9147, "step": 50960 }, { "epoch": 0.55, "learning_rate": 8.836166399799059e-06, "loss": 21.2498, "step": 50970 }, { "epoch": 0.55, "learning_rate": 8.832688908054888e-06, "loss": 21.5257, "step": 50980 }, { "epoch": 0.55, "learning_rate": 8.829211559417238e-06, "loss": 20.8907, "step": 50990 }, { "epoch": 0.55, "learning_rate": 8.825734354312414e-06, "loss": 21.3861, "step": 51000 }, { "epoch": 0.55, "learning_rate": 8.822257293166703e-06, "loss": 21.2693, "step": 51010 }, { "epoch": 0.55, "learning_rate": 8.818780376406376e-06, "loss": 19.8979, "step": 51020 }, { "epoch": 0.55, "learning_rate": 8.815303604457682e-06, "loss": 21.6598, "step": 51030 }, { "epoch": 0.55, "learning_rate": 8.81182697774686e-06, "loss": 21.9094, "step": 51040 }, { "epoch": 0.55, "learning_rate": 8.808350496700127e-06, "loss": 20.6091, "step": 51050 }, { "epoch": 0.55, "learning_rate": 8.804874161743679e-06, "loss": 21.626, "step": 51060 }, { "epoch": 0.55, "learning_rate": 8.801397973303706e-06, "loss": 20.405, "step": 51070 }, { "epoch": 0.55, "learning_rate": 8.79792193180636e-06, "loss": 20.8692, "step": 51080 }, { "epoch": 0.55, "learning_rate": 8.794446037677793e-06, "loss": 20.7997, "step": 51090 }, { "epoch": 0.55, "learning_rate": 8.79097029134413e-06, "loss": 21.3191, "step": 51100 }, { "epoch": 0.55, "learning_rate": 8.787494693231478e-06, "loss": 20.8976, "step": 51110 }, { "epoch": 0.55, "learning_rate": 8.78401924376594e-06, "loss": 20.9133, "step": 51120 }, { "epoch": 0.55, "learning_rate": 8.78054394337357e-06, "loss": 20.9137, "step": 51130 }, { "epoch": 0.55, "learning_rate": 8.777068792480436e-06, "loss": 21.0105, "step": 51140 }, { "epoch": 0.55, "learning_rate": 8.77359379151257e-06, "loss": 21.3367, "step": 51150 }, { "epoch": 0.55, "learning_rate": 8.770118940895987e-06, "loss": 21.3497, "step": 51160 }, { "epoch": 0.55, "learning_rate": 8.766644241056697e-06, "loss": 21.5954, "step": 51170 }, { "epoch": 0.55, "learning_rate": 8.763169692420667e-06, "loss": 21.1257, "step": 51180 }, { "epoch": 0.55, "learning_rate": 8.759695295413867e-06, "loss": 20.7655, "step": 51190 }, { "epoch": 0.55, "learning_rate": 8.756221050462239e-06, "loss": 21.0149, "step": 51200 }, { "epoch": 0.55, "learning_rate": 8.752746957991706e-06, "loss": 20.4545, "step": 51210 }, { "epoch": 0.55, "learning_rate": 8.749273018428181e-06, "loss": 20.7516, "step": 51220 }, { "epoch": 0.55, "learning_rate": 8.74579923219755e-06, "loss": 21.4357, "step": 51230 }, { "epoch": 0.55, "learning_rate": 8.742325599725676e-06, "loss": 21.0897, "step": 51240 }, { "epoch": 0.55, "learning_rate": 8.738852121438413e-06, "loss": 21.2413, "step": 51250 }, { "epoch": 0.55, "learning_rate": 8.735378797761589e-06, "loss": 21.3041, "step": 51260 }, { "epoch": 0.55, "learning_rate": 8.73190562912102e-06, "loss": 21.3256, "step": 51270 }, { "epoch": 0.55, "learning_rate": 8.728432615942502e-06, "loss": 21.0893, "step": 51280 }, { "epoch": 0.55, "learning_rate": 8.724959758651801e-06, "loss": 20.7811, "step": 51290 }, { "epoch": 0.55, "learning_rate": 8.721487057674677e-06, "loss": 21.6437, "step": 51300 }, { "epoch": 0.55, "learning_rate": 8.718014513436863e-06, "loss": 21.1369, "step": 51310 }, { "epoch": 0.55, "learning_rate": 8.71454212636408e-06, "loss": 20.7896, "step": 51320 }, { "epoch": 0.55, "learning_rate": 8.711069896882023e-06, "loss": 21.6751, "step": 51330 }, { "epoch": 0.56, "learning_rate": 8.70759782541637e-06, "loss": 21.9633, "step": 51340 }, { "epoch": 0.56, "learning_rate": 8.704125912392778e-06, "loss": 21.7196, "step": 51350 }, { "epoch": 0.56, "learning_rate": 8.700654158236887e-06, "loss": 21.4707, "step": 51360 }, { "epoch": 0.56, "learning_rate": 8.697182563374318e-06, "loss": 21.0102, "step": 51370 }, { "epoch": 0.56, "learning_rate": 8.69371112823067e-06, "loss": 21.3065, "step": 51380 }, { "epoch": 0.56, "learning_rate": 8.690239853231528e-06, "loss": 20.7652, "step": 51390 }, { "epoch": 0.56, "learning_rate": 8.686768738802447e-06, "loss": 20.909, "step": 51400 }, { "epoch": 0.56, "learning_rate": 8.683297785368968e-06, "loss": 20.7994, "step": 51410 }, { "epoch": 0.56, "learning_rate": 8.679826993356619e-06, "loss": 21.1078, "step": 51420 }, { "epoch": 0.56, "learning_rate": 8.676356363190896e-06, "loss": 21.0269, "step": 51430 }, { "epoch": 0.56, "learning_rate": 8.672885895297285e-06, "loss": 20.7046, "step": 51440 }, { "epoch": 0.56, "learning_rate": 8.669415590101244e-06, "loss": 21.0797, "step": 51450 }, { "epoch": 0.56, "learning_rate": 8.665945448028217e-06, "loss": 20.6788, "step": 51460 }, { "epoch": 0.56, "learning_rate": 8.662475469503626e-06, "loss": 20.4103, "step": 51470 }, { "epoch": 0.56, "learning_rate": 8.659005654952875e-06, "loss": 21.4052, "step": 51480 }, { "epoch": 0.56, "learning_rate": 8.655536004801342e-06, "loss": 21.4449, "step": 51490 }, { "epoch": 0.56, "learning_rate": 8.652066519474395e-06, "loss": 21.7451, "step": 51500 }, { "epoch": 0.56, "learning_rate": 8.648597199397367e-06, "loss": 20.2476, "step": 51510 }, { "epoch": 0.56, "learning_rate": 8.645128044995587e-06, "loss": 20.6875, "step": 51520 }, { "epoch": 0.56, "learning_rate": 8.641659056694351e-06, "loss": 21.6712, "step": 51530 }, { "epoch": 0.56, "learning_rate": 8.638190234918944e-06, "loss": 20.8615, "step": 51540 }, { "epoch": 0.56, "learning_rate": 8.634721580094625e-06, "loss": 21.3392, "step": 51550 }, { "epoch": 0.56, "learning_rate": 8.63125309264663e-06, "loss": 21.0014, "step": 51560 }, { "epoch": 0.56, "learning_rate": 8.62778477300018e-06, "loss": 21.5183, "step": 51570 }, { "epoch": 0.56, "learning_rate": 8.624316621580478e-06, "loss": 20.7309, "step": 51580 }, { "epoch": 0.56, "learning_rate": 8.620848638812696e-06, "loss": 21.4009, "step": 51590 }, { "epoch": 0.56, "learning_rate": 8.617380825121994e-06, "loss": 21.2304, "step": 51600 }, { "epoch": 0.56, "learning_rate": 8.613913180933515e-06, "loss": 21.0477, "step": 51610 }, { "epoch": 0.56, "learning_rate": 8.61044570667236e-06, "loss": 20.3596, "step": 51620 }, { "epoch": 0.56, "learning_rate": 8.606978402763638e-06, "loss": 21.533, "step": 51630 }, { "epoch": 0.56, "learning_rate": 8.603511269632417e-06, "loss": 20.8678, "step": 51640 }, { "epoch": 0.56, "learning_rate": 8.600044307703749e-06, "loss": 21.3477, "step": 51650 }, { "epoch": 0.56, "learning_rate": 8.596577517402675e-06, "loss": 22.3757, "step": 51660 }, { "epoch": 0.56, "learning_rate": 8.593110899154193e-06, "loss": 21.5263, "step": 51670 }, { "epoch": 0.56, "learning_rate": 8.589644453383301e-06, "loss": 21.0281, "step": 51680 }, { "epoch": 0.56, "learning_rate": 8.586178180514968e-06, "loss": 20.915, "step": 51690 }, { "epoch": 0.56, "learning_rate": 8.582712080974138e-06, "loss": 21.0027, "step": 51700 }, { "epoch": 0.56, "learning_rate": 8.579246155185746e-06, "loss": 21.8138, "step": 51710 }, { "epoch": 0.56, "learning_rate": 8.575780403574684e-06, "loss": 20.9257, "step": 51720 }, { "epoch": 0.56, "learning_rate": 8.572314826565849e-06, "loss": 21.7404, "step": 51730 }, { "epoch": 0.56, "learning_rate": 8.568849424584093e-06, "loss": 21.2301, "step": 51740 }, { "epoch": 0.56, "learning_rate": 8.565384198054262e-06, "loss": 20.9537, "step": 51750 }, { "epoch": 0.56, "learning_rate": 8.561919147401177e-06, "loss": 21.4167, "step": 51760 }, { "epoch": 0.56, "learning_rate": 8.558454273049636e-06, "loss": 20.7809, "step": 51770 }, { "epoch": 0.56, "learning_rate": 8.554989575424411e-06, "loss": 21.0984, "step": 51780 }, { "epoch": 0.56, "learning_rate": 8.551525054950259e-06, "loss": 21.6962, "step": 51790 }, { "epoch": 0.56, "learning_rate": 8.54806071205191e-06, "loss": 21.8666, "step": 51800 }, { "epoch": 0.56, "learning_rate": 8.544596547154082e-06, "loss": 21.3268, "step": 51810 }, { "epoch": 0.56, "learning_rate": 8.541132560681462e-06, "loss": 21.3082, "step": 51820 }, { "epoch": 0.56, "learning_rate": 8.537668753058713e-06, "loss": 20.7695, "step": 51830 }, { "epoch": 0.56, "learning_rate": 8.534205124710484e-06, "loss": 21.4818, "step": 51840 }, { "epoch": 0.56, "learning_rate": 8.530741676061395e-06, "loss": 21.1863, "step": 51850 }, { "epoch": 0.56, "learning_rate": 8.527278407536054e-06, "loss": 21.6063, "step": 51860 }, { "epoch": 0.56, "learning_rate": 8.523815319559036e-06, "loss": 21.1316, "step": 51870 }, { "epoch": 0.56, "learning_rate": 8.520352412554903e-06, "loss": 21.1135, "step": 51880 }, { "epoch": 0.56, "learning_rate": 8.51688968694818e-06, "loss": 20.8991, "step": 51890 }, { "epoch": 0.56, "learning_rate": 8.513427143163389e-06, "loss": 21.7117, "step": 51900 }, { "epoch": 0.56, "learning_rate": 8.509964781625017e-06, "loss": 20.918, "step": 51910 }, { "epoch": 0.56, "learning_rate": 8.506502602757535e-06, "loss": 21.3236, "step": 51920 }, { "epoch": 0.56, "learning_rate": 8.503040606985388e-06, "loss": 20.8931, "step": 51930 }, { "epoch": 0.56, "learning_rate": 8.499578794732998e-06, "loss": 21.9864, "step": 51940 }, { "epoch": 0.56, "learning_rate": 8.496117166424764e-06, "loss": 21.3458, "step": 51950 }, { "epoch": 0.56, "learning_rate": 8.492655722485066e-06, "loss": 21.5914, "step": 51960 }, { "epoch": 0.56, "learning_rate": 8.489194463338264e-06, "loss": 21.5973, "step": 51970 }, { "epoch": 0.56, "learning_rate": 8.485733389408687e-06, "loss": 21.7312, "step": 51980 }, { "epoch": 0.56, "learning_rate": 8.482272501120648e-06, "loss": 21.4724, "step": 51990 }, { "epoch": 0.56, "learning_rate": 8.478811798898426e-06, "loss": 22.2116, "step": 52000 }, { "epoch": 0.56, "learning_rate": 8.475351283166297e-06, "loss": 21.295, "step": 52010 }, { "epoch": 0.56, "learning_rate": 8.471890954348498e-06, "loss": 20.7504, "step": 52020 }, { "epoch": 0.56, "learning_rate": 8.468430812869248e-06, "loss": 20.5887, "step": 52030 }, { "epoch": 0.56, "learning_rate": 8.464970859152748e-06, "loss": 20.7937, "step": 52040 }, { "epoch": 0.56, "learning_rate": 8.46151109362316e-06, "loss": 20.7647, "step": 52050 }, { "epoch": 0.56, "learning_rate": 8.458051516704644e-06, "loss": 20.6959, "step": 52060 }, { "epoch": 0.56, "learning_rate": 8.454592128821324e-06, "loss": 21.3112, "step": 52070 }, { "epoch": 0.56, "learning_rate": 8.451132930397302e-06, "loss": 21.1091, "step": 52080 }, { "epoch": 0.56, "learning_rate": 8.447673921856665e-06, "loss": 21.4772, "step": 52090 }, { "epoch": 0.56, "learning_rate": 8.444215103623457e-06, "loss": 21.6051, "step": 52100 }, { "epoch": 0.56, "learning_rate": 8.440756476121723e-06, "loss": 20.7359, "step": 52110 }, { "epoch": 0.56, "learning_rate": 8.437298039775472e-06, "loss": 21.2874, "step": 52120 }, { "epoch": 0.56, "learning_rate": 8.433839795008686e-06, "loss": 20.7542, "step": 52130 }, { "epoch": 0.56, "learning_rate": 8.430381742245339e-06, "loss": 21.2913, "step": 52140 }, { "epoch": 0.56, "learning_rate": 8.426923881909356e-06, "loss": 21.8173, "step": 52150 }, { "epoch": 0.56, "learning_rate": 8.423466214424665e-06, "loss": 21.2297, "step": 52160 }, { "epoch": 0.56, "learning_rate": 8.420008740215155e-06, "loss": 20.6501, "step": 52170 }, { "epoch": 0.56, "learning_rate": 8.416551459704694e-06, "loss": 20.7853, "step": 52180 }, { "epoch": 0.56, "learning_rate": 8.413094373317128e-06, "loss": 21.1656, "step": 52190 }, { "epoch": 0.56, "learning_rate": 8.409637481476285e-06, "loss": 21.368, "step": 52200 }, { "epoch": 0.56, "learning_rate": 8.406180784605953e-06, "loss": 20.7709, "step": 52210 }, { "epoch": 0.56, "learning_rate": 8.40272428312991e-06, "loss": 21.5626, "step": 52220 }, { "epoch": 0.56, "learning_rate": 8.399267977471904e-06, "loss": 22.0669, "step": 52230 }, { "epoch": 0.56, "learning_rate": 8.395811868055663e-06, "loss": 21.1452, "step": 52240 }, { "epoch": 0.56, "learning_rate": 8.392355955304891e-06, "loss": 20.822, "step": 52250 }, { "epoch": 0.56, "learning_rate": 8.388900239643261e-06, "loss": 20.6116, "step": 52260 }, { "epoch": 0.57, "learning_rate": 8.38544472149443e-06, "loss": 21.1314, "step": 52270 }, { "epoch": 0.57, "learning_rate": 8.38198940128202e-06, "loss": 21.1489, "step": 52280 }, { "epoch": 0.57, "learning_rate": 8.378534279429646e-06, "loss": 21.0056, "step": 52290 }, { "epoch": 0.57, "learning_rate": 8.375079356360884e-06, "loss": 20.6439, "step": 52300 }, { "epoch": 0.57, "learning_rate": 8.371624632499294e-06, "loss": 21.1234, "step": 52310 }, { "epoch": 0.57, "learning_rate": 8.3681701082684e-06, "loss": 20.8676, "step": 52320 }, { "epoch": 0.57, "learning_rate": 8.364715784091715e-06, "loss": 21.0001, "step": 52330 }, { "epoch": 0.57, "learning_rate": 8.361261660392723e-06, "loss": 21.1977, "step": 52340 }, { "epoch": 0.57, "learning_rate": 8.357807737594878e-06, "loss": 21.0739, "step": 52350 }, { "epoch": 0.57, "learning_rate": 8.35435401612162e-06, "loss": 21.5468, "step": 52360 }, { "epoch": 0.57, "learning_rate": 8.350900496396352e-06, "loss": 21.4497, "step": 52370 }, { "epoch": 0.57, "learning_rate": 8.347447178842458e-06, "loss": 20.622, "step": 52380 }, { "epoch": 0.57, "learning_rate": 8.3439940638833e-06, "loss": 21.618, "step": 52390 }, { "epoch": 0.57, "learning_rate": 8.340541151942215e-06, "loss": 21.1842, "step": 52400 }, { "epoch": 0.57, "learning_rate": 8.337088443442513e-06, "loss": 21.2686, "step": 52410 }, { "epoch": 0.57, "learning_rate": 8.333635938807473e-06, "loss": 21.3944, "step": 52420 }, { "epoch": 0.57, "learning_rate": 8.330183638460356e-06, "loss": 21.4712, "step": 52430 }, { "epoch": 0.57, "learning_rate": 8.3267315428244e-06, "loss": 21.6048, "step": 52440 }, { "epoch": 0.57, "learning_rate": 8.323279652322815e-06, "loss": 21.0428, "step": 52450 }, { "epoch": 0.57, "learning_rate": 8.319827967378784e-06, "loss": 20.4636, "step": 52460 }, { "epoch": 0.57, "learning_rate": 8.31637648841547e-06, "loss": 20.9625, "step": 52470 }, { "epoch": 0.57, "learning_rate": 8.312925215855997e-06, "loss": 21.3147, "step": 52480 }, { "epoch": 0.57, "learning_rate": 8.309474150123484e-06, "loss": 20.9468, "step": 52490 }, { "epoch": 0.57, "learning_rate": 8.30602329164101e-06, "loss": 21.7128, "step": 52500 }, { "epoch": 0.57, "learning_rate": 8.302572640831634e-06, "loss": 21.1057, "step": 52510 }, { "epoch": 0.57, "learning_rate": 8.299122198118394e-06, "loss": 20.8953, "step": 52520 }, { "epoch": 0.57, "learning_rate": 8.295671963924285e-06, "loss": 20.5888, "step": 52530 }, { "epoch": 0.57, "learning_rate": 8.292221938672296e-06, "loss": 21.5825, "step": 52540 }, { "epoch": 0.57, "learning_rate": 8.288772122785384e-06, "loss": 20.3218, "step": 52550 }, { "epoch": 0.57, "learning_rate": 8.285322516686476e-06, "loss": 20.8434, "step": 52560 }, { "epoch": 0.57, "learning_rate": 8.281873120798476e-06, "loss": 20.9709, "step": 52570 }, { "epoch": 0.57, "learning_rate": 8.278423935544268e-06, "loss": 21.3431, "step": 52580 }, { "epoch": 0.57, "learning_rate": 8.2749749613467e-06, "loss": 21.2709, "step": 52590 }, { "epoch": 0.57, "learning_rate": 8.2715261986286e-06, "loss": 20.9246, "step": 52600 }, { "epoch": 0.57, "learning_rate": 8.268077647812772e-06, "loss": 21.1999, "step": 52610 }, { "epoch": 0.57, "learning_rate": 8.264629309321983e-06, "loss": 21.1012, "step": 52620 }, { "epoch": 0.57, "learning_rate": 8.261181183578995e-06, "loss": 21.5399, "step": 52630 }, { "epoch": 0.57, "learning_rate": 8.25773327100652e-06, "loss": 20.8006, "step": 52640 }, { "epoch": 0.57, "learning_rate": 8.254285572027259e-06, "loss": 20.9803, "step": 52650 }, { "epoch": 0.57, "learning_rate": 8.250838087063882e-06, "loss": 21.5794, "step": 52660 }, { "epoch": 0.57, "learning_rate": 8.247390816539032e-06, "loss": 20.7377, "step": 52670 }, { "epoch": 0.57, "learning_rate": 8.243943760875334e-06, "loss": 20.9244, "step": 52680 }, { "epoch": 0.57, "learning_rate": 8.240496920495372e-06, "loss": 20.0907, "step": 52690 }, { "epoch": 0.57, "learning_rate": 8.237050295821716e-06, "loss": 21.743, "step": 52700 }, { "epoch": 0.57, "learning_rate": 8.233603887276902e-06, "loss": 21.1968, "step": 52710 }, { "epoch": 0.57, "learning_rate": 8.230157695283441e-06, "loss": 20.5737, "step": 52720 }, { "epoch": 0.57, "learning_rate": 8.226711720263825e-06, "loss": 22.0366, "step": 52730 }, { "epoch": 0.57, "learning_rate": 8.223265962640512e-06, "loss": 20.971, "step": 52740 }, { "epoch": 0.57, "learning_rate": 8.219820422835932e-06, "loss": 21.1362, "step": 52750 }, { "epoch": 0.57, "learning_rate": 8.21637510127249e-06, "loss": 20.5725, "step": 52760 }, { "epoch": 0.57, "learning_rate": 8.212929998372564e-06, "loss": 20.8099, "step": 52770 }, { "epoch": 0.57, "learning_rate": 8.209485114558515e-06, "loss": 20.8903, "step": 52780 }, { "epoch": 0.57, "learning_rate": 8.206040450252664e-06, "loss": 21.4395, "step": 52790 }, { "epoch": 0.57, "learning_rate": 8.202596005877307e-06, "loss": 20.6163, "step": 52800 }, { "epoch": 0.57, "learning_rate": 8.199151781854714e-06, "loss": 21.4433, "step": 52810 }, { "epoch": 0.57, "learning_rate": 8.195707778607136e-06, "loss": 20.2444, "step": 52820 }, { "epoch": 0.57, "learning_rate": 8.192263996556787e-06, "loss": 21.0438, "step": 52830 }, { "epoch": 0.57, "learning_rate": 8.188820436125862e-06, "loss": 21.2565, "step": 52840 }, { "epoch": 0.57, "learning_rate": 8.185377097736518e-06, "loss": 21.0414, "step": 52850 }, { "epoch": 0.57, "learning_rate": 8.181933981810892e-06, "loss": 21.5361, "step": 52860 }, { "epoch": 0.57, "learning_rate": 8.178491088771094e-06, "loss": 20.6436, "step": 52870 }, { "epoch": 0.57, "learning_rate": 8.175048419039208e-06, "loss": 21.3344, "step": 52880 }, { "epoch": 0.57, "learning_rate": 8.171605973037287e-06, "loss": 21.3342, "step": 52890 }, { "epoch": 0.57, "learning_rate": 8.16816375118736e-06, "loss": 21.6077, "step": 52900 }, { "epoch": 0.57, "learning_rate": 8.16472175391142e-06, "loss": 21.3468, "step": 52910 }, { "epoch": 0.57, "learning_rate": 8.16127998163144e-06, "loss": 21.937, "step": 52920 }, { "epoch": 0.57, "learning_rate": 8.157838434769368e-06, "loss": 21.217, "step": 52930 }, { "epoch": 0.57, "learning_rate": 8.154397113747117e-06, "loss": 20.7486, "step": 52940 }, { "epoch": 0.57, "learning_rate": 8.150956018986582e-06, "loss": 21.5751, "step": 52950 }, { "epoch": 0.57, "learning_rate": 8.147515150909616e-06, "loss": 20.5357, "step": 52960 }, { "epoch": 0.57, "learning_rate": 8.144074509938054e-06, "loss": 20.716, "step": 52970 }, { "epoch": 0.57, "learning_rate": 8.140634096493705e-06, "loss": 20.9917, "step": 52980 }, { "epoch": 0.57, "learning_rate": 8.137193910998344e-06, "loss": 21.1883, "step": 52990 }, { "epoch": 0.57, "learning_rate": 8.13375395387372e-06, "loss": 20.9941, "step": 53000 }, { "epoch": 0.57, "learning_rate": 8.130314225541563e-06, "loss": 21.7983, "step": 53010 }, { "epoch": 0.57, "learning_rate": 8.126874726423552e-06, "loss": 21.185, "step": 53020 }, { "epoch": 0.57, "learning_rate": 8.123435456941361e-06, "loss": 20.6856, "step": 53030 }, { "epoch": 0.57, "learning_rate": 8.119996417516627e-06, "loss": 21.5117, "step": 53040 }, { "epoch": 0.57, "learning_rate": 8.116557608570957e-06, "loss": 21.0623, "step": 53050 }, { "epoch": 0.57, "learning_rate": 8.113119030525938e-06, "loss": 20.5669, "step": 53060 }, { "epoch": 0.57, "learning_rate": 8.109680683803112e-06, "loss": 21.6291, "step": 53070 }, { "epoch": 0.57, "learning_rate": 8.10624256882401e-06, "loss": 20.9432, "step": 53080 }, { "epoch": 0.57, "learning_rate": 8.102804686010126e-06, "loss": 21.5536, "step": 53090 }, { "epoch": 0.57, "learning_rate": 8.099367035782928e-06, "loss": 20.8348, "step": 53100 }, { "epoch": 0.57, "learning_rate": 8.095929618563857e-06, "loss": 21.8004, "step": 53110 }, { "epoch": 0.57, "learning_rate": 8.092492434774318e-06, "loss": 21.3781, "step": 53120 }, { "epoch": 0.57, "learning_rate": 8.089055484835696e-06, "loss": 20.8711, "step": 53130 }, { "epoch": 0.57, "learning_rate": 8.085618769169344e-06, "loss": 21.3973, "step": 53140 }, { "epoch": 0.57, "learning_rate": 8.082182288196583e-06, "loss": 21.2588, "step": 53150 }, { "epoch": 0.57, "learning_rate": 8.078746042338712e-06, "loss": 20.5183, "step": 53160 }, { "epoch": 0.57, "learning_rate": 8.075310032017e-06, "loss": 21.157, "step": 53170 }, { "epoch": 0.57, "learning_rate": 8.07187425765268e-06, "loss": 20.9632, "step": 53180 }, { "epoch": 0.58, "learning_rate": 8.068438719666959e-06, "loss": 20.4415, "step": 53190 }, { "epoch": 0.58, "learning_rate": 8.065003418481018e-06, "loss": 21.6308, "step": 53200 }, { "epoch": 0.58, "learning_rate": 8.061568354516014e-06, "loss": 21.3421, "step": 53210 }, { "epoch": 0.58, "learning_rate": 8.058133528193066e-06, "loss": 21.1834, "step": 53220 }, { "epoch": 0.58, "learning_rate": 8.054698939933262e-06, "loss": 21.3629, "step": 53230 }, { "epoch": 0.58, "learning_rate": 8.051264590157668e-06, "loss": 20.7472, "step": 53240 }, { "epoch": 0.58, "learning_rate": 8.047830479287318e-06, "loss": 21.5617, "step": 53250 }, { "epoch": 0.58, "learning_rate": 8.044396607743219e-06, "loss": 21.8298, "step": 53260 }, { "epoch": 0.58, "learning_rate": 8.040962975946343e-06, "loss": 20.6542, "step": 53270 }, { "epoch": 0.58, "learning_rate": 8.037529584317642e-06, "loss": 20.9475, "step": 53280 }, { "epoch": 0.58, "learning_rate": 8.034096433278028e-06, "loss": 20.9633, "step": 53290 }, { "epoch": 0.58, "learning_rate": 8.030663523248384e-06, "loss": 20.6007, "step": 53300 }, { "epoch": 0.58, "learning_rate": 8.027230854649576e-06, "loss": 21.4408, "step": 53310 }, { "epoch": 0.58, "learning_rate": 8.023798427902428e-06, "loss": 21.4227, "step": 53320 }, { "epoch": 0.58, "learning_rate": 8.020366243427742e-06, "loss": 21.934, "step": 53330 }, { "epoch": 0.58, "learning_rate": 8.016934301646282e-06, "loss": 20.362, "step": 53340 }, { "epoch": 0.58, "learning_rate": 8.013502602978785e-06, "loss": 22.1557, "step": 53350 }, { "epoch": 0.58, "learning_rate": 8.010071147845968e-06, "loss": 21.2914, "step": 53360 }, { "epoch": 0.58, "learning_rate": 8.006639936668504e-06, "loss": 21.4742, "step": 53370 }, { "epoch": 0.58, "learning_rate": 8.003208969867048e-06, "loss": 22.1456, "step": 53380 }, { "epoch": 0.58, "learning_rate": 7.999778247862214e-06, "loss": 21.2399, "step": 53390 }, { "epoch": 0.58, "learning_rate": 7.99634777107459e-06, "loss": 20.8494, "step": 53400 }, { "epoch": 0.58, "learning_rate": 7.992917539924741e-06, "loss": 21.1032, "step": 53410 }, { "epoch": 0.58, "learning_rate": 7.989487554833194e-06, "loss": 21.194, "step": 53420 }, { "epoch": 0.58, "learning_rate": 7.986057816220447e-06, "loss": 21.8704, "step": 53430 }, { "epoch": 0.58, "learning_rate": 7.982628324506976e-06, "loss": 21.468, "step": 53440 }, { "epoch": 0.58, "learning_rate": 7.979199080113205e-06, "loss": 21.4128, "step": 53450 }, { "epoch": 0.58, "learning_rate": 7.975770083459556e-06, "loss": 21.0473, "step": 53460 }, { "epoch": 0.58, "learning_rate": 7.9723413349664e-06, "loss": 20.3725, "step": 53470 }, { "epoch": 0.58, "learning_rate": 7.968912835054084e-06, "loss": 20.7848, "step": 53480 }, { "epoch": 0.58, "learning_rate": 7.965484584142933e-06, "loss": 20.5904, "step": 53490 }, { "epoch": 0.58, "learning_rate": 7.962056582653221e-06, "loss": 21.2438, "step": 53500 }, { "epoch": 0.58, "learning_rate": 7.958628831005212e-06, "loss": 20.8483, "step": 53510 }, { "epoch": 0.58, "learning_rate": 7.955201329619132e-06, "loss": 22.2154, "step": 53520 }, { "epoch": 0.58, "learning_rate": 7.95177407891517e-06, "loss": 21.3592, "step": 53530 }, { "epoch": 0.58, "learning_rate": 7.948347079313494e-06, "loss": 21.1233, "step": 53540 }, { "epoch": 0.58, "learning_rate": 7.94492033123424e-06, "loss": 20.6589, "step": 53550 }, { "epoch": 0.58, "learning_rate": 7.941493835097505e-06, "loss": 21.8016, "step": 53560 }, { "epoch": 0.58, "learning_rate": 7.93806759132336e-06, "loss": 21.3671, "step": 53570 }, { "epoch": 0.58, "learning_rate": 7.934641600331844e-06, "loss": 21.6174, "step": 53580 }, { "epoch": 0.58, "learning_rate": 7.931215862542973e-06, "loss": 21.274, "step": 53590 }, { "epoch": 0.58, "learning_rate": 7.927790378376726e-06, "loss": 21.0854, "step": 53600 }, { "epoch": 0.58, "learning_rate": 7.924365148253042e-06, "loss": 20.9152, "step": 53610 }, { "epoch": 0.58, "learning_rate": 7.920940172591842e-06, "loss": 21.4024, "step": 53620 }, { "epoch": 0.58, "learning_rate": 7.917515451813008e-06, "loss": 21.2608, "step": 53630 }, { "epoch": 0.58, "learning_rate": 7.914090986336396e-06, "loss": 20.9378, "step": 53640 }, { "epoch": 0.58, "learning_rate": 7.910666776581833e-06, "loss": 20.6933, "step": 53650 }, { "epoch": 0.58, "learning_rate": 7.907242822969103e-06, "loss": 21.5135, "step": 53660 }, { "epoch": 0.58, "learning_rate": 7.903819125917967e-06, "loss": 22.2255, "step": 53670 }, { "epoch": 0.58, "learning_rate": 7.900395685848154e-06, "loss": 21.1874, "step": 53680 }, { "epoch": 0.58, "learning_rate": 7.89697250317936e-06, "loss": 20.4486, "step": 53690 }, { "epoch": 0.58, "learning_rate": 7.893549578331254e-06, "loss": 21.6467, "step": 53700 }, { "epoch": 0.58, "learning_rate": 7.890126911723468e-06, "loss": 20.9506, "step": 53710 }, { "epoch": 0.58, "learning_rate": 7.8867045037756e-06, "loss": 21.3525, "step": 53720 }, { "epoch": 0.58, "learning_rate": 7.883282354907219e-06, "loss": 21.2861, "step": 53730 }, { "epoch": 0.58, "learning_rate": 7.87986046553787e-06, "loss": 21.6673, "step": 53740 }, { "epoch": 0.58, "learning_rate": 7.876438836087058e-06, "loss": 20.9534, "step": 53750 }, { "epoch": 0.58, "learning_rate": 7.873017466974258e-06, "loss": 20.8697, "step": 53760 }, { "epoch": 0.58, "learning_rate": 7.869596358618907e-06, "loss": 20.8294, "step": 53770 }, { "epoch": 0.58, "learning_rate": 7.866175511440419e-06, "loss": 22.2765, "step": 53780 }, { "epoch": 0.58, "learning_rate": 7.862754925858177e-06, "loss": 21.1656, "step": 53790 }, { "epoch": 0.58, "learning_rate": 7.859334602291521e-06, "loss": 21.1501, "step": 53800 }, { "epoch": 0.58, "learning_rate": 7.855914541159776e-06, "loss": 21.2194, "step": 53810 }, { "epoch": 0.58, "learning_rate": 7.852494742882211e-06, "loss": 20.8433, "step": 53820 }, { "epoch": 0.58, "learning_rate": 7.849075207878081e-06, "loss": 21.3133, "step": 53830 }, { "epoch": 0.58, "learning_rate": 7.84565593656661e-06, "loss": 21.5445, "step": 53840 }, { "epoch": 0.58, "learning_rate": 7.842236929366978e-06, "loss": 20.8354, "step": 53850 }, { "epoch": 0.58, "learning_rate": 7.83881818669834e-06, "loss": 20.9482, "step": 53860 }, { "epoch": 0.58, "learning_rate": 7.835399708979818e-06, "loss": 21.5941, "step": 53870 }, { "epoch": 0.58, "learning_rate": 7.831981496630494e-06, "loss": 21.5505, "step": 53880 }, { "epoch": 0.58, "learning_rate": 7.82856355006943e-06, "loss": 20.3167, "step": 53890 }, { "epoch": 0.58, "learning_rate": 7.82514586971565e-06, "loss": 21.1126, "step": 53900 }, { "epoch": 0.58, "learning_rate": 7.82172845598814e-06, "loss": 20.8775, "step": 53910 }, { "epoch": 0.58, "learning_rate": 7.818311309305862e-06, "loss": 20.7607, "step": 53920 }, { "epoch": 0.58, "learning_rate": 7.814894430087736e-06, "loss": 21.2273, "step": 53930 }, { "epoch": 0.58, "learning_rate": 7.81147781875266e-06, "loss": 21.3927, "step": 53940 }, { "epoch": 0.58, "learning_rate": 7.808061475719491e-06, "loss": 21.1646, "step": 53950 }, { "epoch": 0.58, "learning_rate": 7.804645401407053e-06, "loss": 21.3408, "step": 53960 }, { "epoch": 0.58, "learning_rate": 7.801229596234144e-06, "loss": 21.1368, "step": 53970 }, { "epoch": 0.58, "learning_rate": 7.797814060619527e-06, "loss": 21.5296, "step": 53980 }, { "epoch": 0.58, "learning_rate": 7.794398794981921e-06, "loss": 20.8617, "step": 53990 }, { "epoch": 0.58, "learning_rate": 7.790983799740025e-06, "loss": 21.4159, "step": 54000 }, { "epoch": 0.58, "learning_rate": 7.787569075312503e-06, "loss": 21.716, "step": 54010 }, { "epoch": 0.58, "learning_rate": 7.784154622117978e-06, "loss": 21.3577, "step": 54020 }, { "epoch": 0.58, "learning_rate": 7.780740440575054e-06, "loss": 21.5411, "step": 54030 }, { "epoch": 0.58, "learning_rate": 7.777326531102279e-06, "loss": 21.6667, "step": 54040 }, { "epoch": 0.58, "learning_rate": 7.773912894118192e-06, "loss": 20.6804, "step": 54050 }, { "epoch": 0.58, "learning_rate": 7.770499530041284e-06, "loss": 20.9878, "step": 54060 }, { "epoch": 0.58, "learning_rate": 7.767086439290015e-06, "loss": 20.9908, "step": 54070 }, { "epoch": 0.58, "learning_rate": 7.763673622282822e-06, "loss": 20.8495, "step": 54080 }, { "epoch": 0.58, "learning_rate": 7.760261079438085e-06, "loss": 21.4338, "step": 54090 }, { "epoch": 0.58, "learning_rate": 7.756848811174173e-06, "loss": 21.0735, "step": 54100 }, { "epoch": 0.58, "learning_rate": 7.753436817909413e-06, "loss": 20.865, "step": 54110 }, { "epoch": 0.59, "learning_rate": 7.750025100062095e-06, "loss": 21.2371, "step": 54120 }, { "epoch": 0.59, "learning_rate": 7.746613658050483e-06, "loss": 21.5613, "step": 54130 }, { "epoch": 0.59, "learning_rate": 7.743202492292804e-06, "loss": 20.6209, "step": 54140 }, { "epoch": 0.59, "learning_rate": 7.739791603207245e-06, "loss": 20.7712, "step": 54150 }, { "epoch": 0.59, "learning_rate": 7.736380991211963e-06, "loss": 20.895, "step": 54160 }, { "epoch": 0.59, "learning_rate": 7.732970656725085e-06, "loss": 21.9964, "step": 54170 }, { "epoch": 0.59, "learning_rate": 7.7295606001647e-06, "loss": 21.5519, "step": 54180 }, { "epoch": 0.59, "learning_rate": 7.726150821948868e-06, "loss": 21.0631, "step": 54190 }, { "epoch": 0.59, "learning_rate": 7.722741322495608e-06, "loss": 21.4324, "step": 54200 }, { "epoch": 0.59, "learning_rate": 7.719332102222904e-06, "loss": 21.0739, "step": 54210 }, { "epoch": 0.59, "learning_rate": 7.71592316154871e-06, "loss": 21.9828, "step": 54220 }, { "epoch": 0.59, "learning_rate": 7.71251450089095e-06, "loss": 20.613, "step": 54230 }, { "epoch": 0.59, "learning_rate": 7.70910612066751e-06, "loss": 21.5291, "step": 54240 }, { "epoch": 0.59, "learning_rate": 7.705698021296235e-06, "loss": 20.9371, "step": 54250 }, { "epoch": 0.59, "learning_rate": 7.702290203194942e-06, "loss": 22.3709, "step": 54260 }, { "epoch": 0.59, "learning_rate": 7.698882666781411e-06, "loss": 20.5317, "step": 54270 }, { "epoch": 0.59, "learning_rate": 7.695475412473393e-06, "loss": 21.2706, "step": 54280 }, { "epoch": 0.59, "learning_rate": 7.692068440688597e-06, "loss": 21.1124, "step": 54290 }, { "epoch": 0.59, "learning_rate": 7.688661751844707e-06, "loss": 21.2058, "step": 54300 }, { "epoch": 0.59, "learning_rate": 7.685255346359361e-06, "loss": 21.1745, "step": 54310 }, { "epoch": 0.59, "learning_rate": 7.681849224650164e-06, "loss": 20.5704, "step": 54320 }, { "epoch": 0.59, "learning_rate": 7.678443387134694e-06, "loss": 21.0847, "step": 54330 }, { "epoch": 0.59, "learning_rate": 7.67503783423049e-06, "loss": 21.3443, "step": 54340 }, { "epoch": 0.59, "learning_rate": 7.671632566355057e-06, "loss": 22.074, "step": 54350 }, { "epoch": 0.59, "learning_rate": 7.66822758392586e-06, "loss": 21.6074, "step": 54360 }, { "epoch": 0.59, "learning_rate": 7.664822887360332e-06, "loss": 20.5448, "step": 54370 }, { "epoch": 0.59, "learning_rate": 7.661418477075876e-06, "loss": 21.3336, "step": 54380 }, { "epoch": 0.59, "learning_rate": 7.658014353489856e-06, "loss": 20.9632, "step": 54390 }, { "epoch": 0.59, "learning_rate": 7.654610517019594e-06, "loss": 21.1527, "step": 54400 }, { "epoch": 0.59, "learning_rate": 7.651206968082396e-06, "loss": 21.17, "step": 54410 }, { "epoch": 0.59, "learning_rate": 7.647803707095506e-06, "loss": 21.0998, "step": 54420 }, { "epoch": 0.59, "learning_rate": 7.644400734476156e-06, "loss": 21.5566, "step": 54430 }, { "epoch": 0.59, "learning_rate": 7.640998050641528e-06, "loss": 22.3301, "step": 54440 }, { "epoch": 0.59, "learning_rate": 7.637595656008777e-06, "loss": 21.4938, "step": 54450 }, { "epoch": 0.59, "learning_rate": 7.634193550995023e-06, "loss": 21.8802, "step": 54460 }, { "epoch": 0.59, "learning_rate": 7.630791736017338e-06, "loss": 21.0766, "step": 54470 }, { "epoch": 0.59, "learning_rate": 7.627390211492776e-06, "loss": 21.9324, "step": 54480 }, { "epoch": 0.59, "learning_rate": 7.6239889778383436e-06, "loss": 21.1431, "step": 54490 }, { "epoch": 0.59, "learning_rate": 7.620588035471012e-06, "loss": 21.12, "step": 54500 }, { "epoch": 0.59, "learning_rate": 7.61718738480773e-06, "loss": 21.1761, "step": 54510 }, { "epoch": 0.59, "learning_rate": 7.613787026265388e-06, "loss": 21.4308, "step": 54520 }, { "epoch": 0.59, "learning_rate": 7.610386960260859e-06, "loss": 21.2492, "step": 54530 }, { "epoch": 0.59, "learning_rate": 7.606987187210974e-06, "loss": 20.8746, "step": 54540 }, { "epoch": 0.59, "learning_rate": 7.603587707532527e-06, "loss": 20.7964, "step": 54550 }, { "epoch": 0.59, "learning_rate": 7.6001885216422795e-06, "loss": 21.2541, "step": 54560 }, { "epoch": 0.59, "learning_rate": 7.596789629956955e-06, "loss": 20.8028, "step": 54570 }, { "epoch": 0.59, "learning_rate": 7.593391032893238e-06, "loss": 21.333, "step": 54580 }, { "epoch": 0.59, "learning_rate": 7.58999273086778e-06, "loss": 20.8238, "step": 54590 }, { "epoch": 0.59, "learning_rate": 7.586594724297195e-06, "loss": 21.7667, "step": 54600 }, { "epoch": 0.59, "learning_rate": 7.583197013598065e-06, "loss": 21.8501, "step": 54610 }, { "epoch": 0.59, "learning_rate": 7.579799599186932e-06, "loss": 21.1283, "step": 54620 }, { "epoch": 0.59, "learning_rate": 7.576402481480298e-06, "loss": 21.4682, "step": 54630 }, { "epoch": 0.59, "learning_rate": 7.573005660894637e-06, "loss": 21.5116, "step": 54640 }, { "epoch": 0.59, "learning_rate": 7.569609137846376e-06, "loss": 21.4394, "step": 54650 }, { "epoch": 0.59, "learning_rate": 7.56621291275192e-06, "loss": 21.8025, "step": 54660 }, { "epoch": 0.59, "learning_rate": 7.562816986027625e-06, "loss": 21.5607, "step": 54670 }, { "epoch": 0.59, "learning_rate": 7.559421358089819e-06, "loss": 21.948, "step": 54680 }, { "epoch": 0.59, "learning_rate": 7.556026029354782e-06, "loss": 20.9544, "step": 54690 }, { "epoch": 0.59, "learning_rate": 7.552631000238766e-06, "loss": 21.1318, "step": 54700 }, { "epoch": 0.59, "learning_rate": 7.549236271157988e-06, "loss": 21.3377, "step": 54710 }, { "epoch": 0.59, "learning_rate": 7.545841842528624e-06, "loss": 21.903, "step": 54720 }, { "epoch": 0.59, "learning_rate": 7.542447714766814e-06, "loss": 21.0691, "step": 54730 }, { "epoch": 0.59, "learning_rate": 7.539053888288659e-06, "loss": 21.1646, "step": 54740 }, { "epoch": 0.59, "learning_rate": 7.535660363510225e-06, "loss": 21.2421, "step": 54750 }, { "epoch": 0.59, "learning_rate": 7.532267140847544e-06, "loss": 20.9734, "step": 54760 }, { "epoch": 0.59, "learning_rate": 7.528874220716608e-06, "loss": 21.3306, "step": 54770 }, { "epoch": 0.59, "learning_rate": 7.525481603533372e-06, "loss": 21.8134, "step": 54780 }, { "epoch": 0.59, "learning_rate": 7.522089289713752e-06, "loss": 20.7826, "step": 54790 }, { "epoch": 0.59, "learning_rate": 7.518697279673627e-06, "loss": 20.5655, "step": 54800 }, { "epoch": 0.59, "learning_rate": 7.515305573828846e-06, "loss": 21.4711, "step": 54810 }, { "epoch": 0.59, "learning_rate": 7.511914172595212e-06, "loss": 20.5607, "step": 54820 }, { "epoch": 0.59, "learning_rate": 7.508523076388492e-06, "loss": 21.8037, "step": 54830 }, { "epoch": 0.59, "learning_rate": 7.505132285624427e-06, "loss": 20.874, "step": 54840 }, { "epoch": 0.59, "learning_rate": 7.501741800718696e-06, "loss": 21.5218, "step": 54850 }, { "epoch": 0.59, "learning_rate": 7.4983516220869675e-06, "loss": 21.3236, "step": 54860 }, { "epoch": 0.59, "learning_rate": 7.494961750144856e-06, "loss": 21.6711, "step": 54870 }, { "epoch": 0.59, "learning_rate": 7.49157218530794e-06, "loss": 20.8809, "step": 54880 }, { "epoch": 0.59, "learning_rate": 7.488182927991774e-06, "loss": 21.1766, "step": 54890 }, { "epoch": 0.59, "learning_rate": 7.484793978611851e-06, "loss": 20.8867, "step": 54900 }, { "epoch": 0.59, "learning_rate": 7.481405337583646e-06, "loss": 21.2508, "step": 54910 }, { "epoch": 0.59, "learning_rate": 7.478017005322589e-06, "loss": 21.6727, "step": 54920 }, { "epoch": 0.59, "learning_rate": 7.47462898224407e-06, "loss": 21.0762, "step": 54930 }, { "epoch": 0.59, "learning_rate": 7.471241268763448e-06, "loss": 21.5394, "step": 54940 }, { "epoch": 0.59, "learning_rate": 7.467853865296039e-06, "loss": 21.5193, "step": 54950 }, { "epoch": 0.59, "learning_rate": 7.464466772257118e-06, "loss": 21.1255, "step": 54960 }, { "epoch": 0.59, "learning_rate": 7.461079990061929e-06, "loss": 20.8963, "step": 54970 }, { "epoch": 0.59, "learning_rate": 7.457693519125674e-06, "loss": 21.1183, "step": 54980 }, { "epoch": 0.59, "learning_rate": 7.454307359863515e-06, "loss": 21.0934, "step": 54990 }, { "epoch": 0.59, "learning_rate": 7.450921512690583e-06, "loss": 20.5979, "step": 55000 }, { "epoch": 0.59, "learning_rate": 7.447535978021963e-06, "loss": 21.0428, "step": 55010 }, { "epoch": 0.59, "learning_rate": 7.444150756272704e-06, "loss": 21.563, "step": 55020 }, { "epoch": 0.59, "learning_rate": 7.440765847857819e-06, "loss": 21.5919, "step": 55030 }, { "epoch": 0.6, "learning_rate": 7.437381253192279e-06, "loss": 21.9754, "step": 55040 }, { "epoch": 0.6, "learning_rate": 7.433996972691022e-06, "loss": 20.7263, "step": 55050 }, { "epoch": 0.6, "learning_rate": 7.430613006768941e-06, "loss": 21.6129, "step": 55060 }, { "epoch": 0.6, "learning_rate": 7.4272293558408925e-06, "loss": 20.9171, "step": 55070 }, { "epoch": 0.6, "learning_rate": 7.4238460203216985e-06, "loss": 21.2522, "step": 55080 }, { "epoch": 0.6, "learning_rate": 7.420463000626134e-06, "loss": 20.4737, "step": 55090 }, { "epoch": 0.6, "learning_rate": 7.417080297168946e-06, "loss": 21.2673, "step": 55100 }, { "epoch": 0.6, "learning_rate": 7.413697910364837e-06, "loss": 21.6774, "step": 55110 }, { "epoch": 0.6, "learning_rate": 7.410315840628466e-06, "loss": 21.1776, "step": 55120 }, { "epoch": 0.6, "learning_rate": 7.40693408837446e-06, "loss": 20.7963, "step": 55130 }, { "epoch": 0.6, "learning_rate": 7.403552654017403e-06, "loss": 21.3676, "step": 55140 }, { "epoch": 0.6, "learning_rate": 7.400171537971848e-06, "loss": 20.9566, "step": 55150 }, { "epoch": 0.6, "learning_rate": 7.3967907406523e-06, "loss": 20.9372, "step": 55160 }, { "epoch": 0.6, "learning_rate": 7.393410262473225e-06, "loss": 21.2599, "step": 55170 }, { "epoch": 0.6, "learning_rate": 7.390030103849055e-06, "loss": 20.5253, "step": 55180 }, { "epoch": 0.6, "learning_rate": 7.386650265194178e-06, "loss": 21.1945, "step": 55190 }, { "epoch": 0.6, "learning_rate": 7.3832707469229505e-06, "loss": 21.4697, "step": 55200 }, { "epoch": 0.6, "learning_rate": 7.379891549449682e-06, "loss": 20.3318, "step": 55210 }, { "epoch": 0.6, "learning_rate": 7.376512673188647e-06, "loss": 21.105, "step": 55220 }, { "epoch": 0.6, "learning_rate": 7.3731341185540765e-06, "loss": 22.5671, "step": 55230 }, { "epoch": 0.6, "learning_rate": 7.369755885960161e-06, "loss": 20.7861, "step": 55240 }, { "epoch": 0.6, "learning_rate": 7.366377975821062e-06, "loss": 21.2805, "step": 55250 }, { "epoch": 0.6, "learning_rate": 7.363000388550891e-06, "loss": 21.2318, "step": 55260 }, { "epoch": 0.6, "learning_rate": 7.359623124563726e-06, "loss": 21.1349, "step": 55270 }, { "epoch": 0.6, "learning_rate": 7.356246184273599e-06, "loss": 20.3917, "step": 55280 }, { "epoch": 0.6, "learning_rate": 7.352869568094505e-06, "loss": 21.2378, "step": 55290 }, { "epoch": 0.6, "learning_rate": 7.349493276440405e-06, "loss": 21.4666, "step": 55300 }, { "epoch": 0.6, "learning_rate": 7.346117309725213e-06, "loss": 21.4852, "step": 55310 }, { "epoch": 0.6, "learning_rate": 7.34274166836281e-06, "loss": 21.2272, "step": 55320 }, { "epoch": 0.6, "learning_rate": 7.339366352767026e-06, "loss": 21.0624, "step": 55330 }, { "epoch": 0.6, "learning_rate": 7.3359913633516574e-06, "loss": 20.7205, "step": 55340 }, { "epoch": 0.6, "learning_rate": 7.332616700530467e-06, "loss": 21.5926, "step": 55350 }, { "epoch": 0.6, "learning_rate": 7.329242364717169e-06, "loss": 21.6428, "step": 55360 }, { "epoch": 0.6, "learning_rate": 7.325868356325438e-06, "loss": 21.0808, "step": 55370 }, { "epoch": 0.6, "learning_rate": 7.3224946757689205e-06, "loss": 20.6293, "step": 55380 }, { "epoch": 0.6, "learning_rate": 7.319121323461198e-06, "loss": 21.3554, "step": 55390 }, { "epoch": 0.6, "learning_rate": 7.315748299815837e-06, "loss": 21.3057, "step": 55400 }, { "epoch": 0.6, "learning_rate": 7.312375605246349e-06, "loss": 21.6864, "step": 55410 }, { "epoch": 0.6, "learning_rate": 7.309003240166208e-06, "loss": 21.1951, "step": 55420 }, { "epoch": 0.6, "learning_rate": 7.30563120498886e-06, "loss": 21.9055, "step": 55430 }, { "epoch": 0.6, "learning_rate": 7.302259500127684e-06, "loss": 20.9854, "step": 55440 }, { "epoch": 0.6, "learning_rate": 7.298888125996045e-06, "loss": 20.8702, "step": 55450 }, { "epoch": 0.6, "learning_rate": 7.295517083007253e-06, "loss": 21.4138, "step": 55460 }, { "epoch": 0.6, "learning_rate": 7.29214637157458e-06, "loss": 21.3344, "step": 55470 }, { "epoch": 0.6, "learning_rate": 7.288775992111265e-06, "loss": 21.7258, "step": 55480 }, { "epoch": 0.6, "learning_rate": 7.28540594503049e-06, "loss": 21.1125, "step": 55490 }, { "epoch": 0.6, "learning_rate": 7.282036230745413e-06, "loss": 21.3223, "step": 55500 }, { "epoch": 0.6, "learning_rate": 7.2786668496691406e-06, "loss": 21.3354, "step": 55510 }, { "epoch": 0.6, "learning_rate": 7.275297802214742e-06, "loss": 22.3156, "step": 55520 }, { "epoch": 0.6, "learning_rate": 7.271929088795249e-06, "loss": 21.0204, "step": 55530 }, { "epoch": 0.6, "learning_rate": 7.268560709823649e-06, "loss": 21.608, "step": 55540 }, { "epoch": 0.6, "learning_rate": 7.265192665712884e-06, "loss": 20.812, "step": 55550 }, { "epoch": 0.6, "learning_rate": 7.2618249568758625e-06, "loss": 21.2474, "step": 55560 }, { "epoch": 0.6, "learning_rate": 7.2584575837254465e-06, "loss": 21.1139, "step": 55570 }, { "epoch": 0.6, "learning_rate": 7.255090546674462e-06, "loss": 21.2669, "step": 55580 }, { "epoch": 0.6, "learning_rate": 7.251723846135693e-06, "loss": 20.701, "step": 55590 }, { "epoch": 0.6, "learning_rate": 7.248357482521875e-06, "loss": 21.1149, "step": 55600 }, { "epoch": 0.6, "learning_rate": 7.2449914562457094e-06, "loss": 21.6256, "step": 55610 }, { "epoch": 0.6, "learning_rate": 7.241625767719851e-06, "loss": 21.7823, "step": 55620 }, { "epoch": 0.6, "learning_rate": 7.238260417356922e-06, "loss": 21.8078, "step": 55630 }, { "epoch": 0.6, "learning_rate": 7.234895405569497e-06, "loss": 21.4877, "step": 55640 }, { "epoch": 0.6, "learning_rate": 7.231530732770109e-06, "loss": 21.3553, "step": 55650 }, { "epoch": 0.6, "learning_rate": 7.2281663993712455e-06, "loss": 21.2333, "step": 55660 }, { "epoch": 0.6, "learning_rate": 7.2248024057853605e-06, "loss": 21.6685, "step": 55670 }, { "epoch": 0.6, "learning_rate": 7.221438752424865e-06, "loss": 20.8501, "step": 55680 }, { "epoch": 0.6, "learning_rate": 7.218075439702123e-06, "loss": 21.2326, "step": 55690 }, { "epoch": 0.6, "learning_rate": 7.214712468029464e-06, "loss": 21.6268, "step": 55700 }, { "epoch": 0.6, "learning_rate": 7.211349837819166e-06, "loss": 21.0084, "step": 55710 }, { "epoch": 0.6, "learning_rate": 7.20798754948347e-06, "loss": 21.2271, "step": 55720 }, { "epoch": 0.6, "learning_rate": 7.204625603434583e-06, "loss": 21.8311, "step": 55730 }, { "epoch": 0.6, "learning_rate": 7.201264000084658e-06, "loss": 20.7408, "step": 55740 }, { "epoch": 0.6, "learning_rate": 7.197902739845813e-06, "loss": 20.8285, "step": 55750 }, { "epoch": 0.6, "learning_rate": 7.194541823130119e-06, "loss": 20.9544, "step": 55760 }, { "epoch": 0.6, "learning_rate": 7.191181250349607e-06, "loss": 20.5938, "step": 55770 }, { "epoch": 0.6, "learning_rate": 7.18782102191627e-06, "loss": 21.8338, "step": 55780 }, { "epoch": 0.6, "learning_rate": 7.184461138242054e-06, "loss": 21.4091, "step": 55790 }, { "epoch": 0.6, "learning_rate": 7.181101599738862e-06, "loss": 22.1745, "step": 55800 }, { "epoch": 0.6, "learning_rate": 7.177742406818564e-06, "loss": 21.2555, "step": 55810 }, { "epoch": 0.6, "learning_rate": 7.174383559892968e-06, "loss": 21.0507, "step": 55820 }, { "epoch": 0.6, "learning_rate": 7.171025059373862e-06, "loss": 21.5066, "step": 55830 }, { "epoch": 0.6, "learning_rate": 7.167666905672977e-06, "loss": 20.8036, "step": 55840 }, { "epoch": 0.6, "learning_rate": 7.164309099202005e-06, "loss": 21.1894, "step": 55850 }, { "epoch": 0.6, "learning_rate": 7.160951640372604e-06, "loss": 21.4058, "step": 55860 }, { "epoch": 0.6, "learning_rate": 7.15759452959637e-06, "loss": 21.1821, "step": 55870 }, { "epoch": 0.6, "learning_rate": 7.154237767284875e-06, "loss": 21.6493, "step": 55880 }, { "epoch": 0.6, "learning_rate": 7.150881353849641e-06, "loss": 21.3037, "step": 55890 }, { "epoch": 0.6, "learning_rate": 7.147525289702145e-06, "loss": 21.5546, "step": 55900 }, { "epoch": 0.6, "learning_rate": 7.144169575253827e-06, "loss": 21.0055, "step": 55910 }, { "epoch": 0.6, "learning_rate": 7.140814210916083e-06, "loss": 21.3703, "step": 55920 }, { "epoch": 0.6, "learning_rate": 7.137459197100257e-06, "loss": 21.6365, "step": 55930 }, { "epoch": 0.6, "learning_rate": 7.134104534217661e-06, "loss": 21.531, "step": 55940 }, { "epoch": 0.6, "learning_rate": 7.130750222679556e-06, "loss": 20.8171, "step": 55950 }, { "epoch": 0.6, "learning_rate": 7.1273962628971705e-06, "loss": 20.6199, "step": 55960 }, { "epoch": 0.61, "learning_rate": 7.124042655281681e-06, "loss": 20.7422, "step": 55970 }, { "epoch": 0.61, "learning_rate": 7.120689400244221e-06, "loss": 21.136, "step": 55980 }, { "epoch": 0.61, "learning_rate": 7.117336498195881e-06, "loss": 20.3966, "step": 55990 }, { "epoch": 0.61, "learning_rate": 7.113983949547714e-06, "loss": 20.8124, "step": 56000 }, { "epoch": 0.61, "learning_rate": 7.110631754710725e-06, "loss": 21.2079, "step": 56010 }, { "epoch": 0.61, "learning_rate": 7.107279914095879e-06, "loss": 21.2985, "step": 56020 }, { "epoch": 0.61, "learning_rate": 7.103928428114089e-06, "loss": 21.1005, "step": 56030 }, { "epoch": 0.61, "learning_rate": 7.100577297176234e-06, "loss": 22.3396, "step": 56040 }, { "epoch": 0.61, "learning_rate": 7.097226521693143e-06, "loss": 21.4445, "step": 56050 }, { "epoch": 0.61, "learning_rate": 7.093876102075609e-06, "loss": 20.2076, "step": 56060 }, { "epoch": 0.61, "learning_rate": 7.090526038734373e-06, "loss": 21.1644, "step": 56070 }, { "epoch": 0.61, "learning_rate": 7.087176332080141e-06, "loss": 21.4327, "step": 56080 }, { "epoch": 0.61, "learning_rate": 7.083826982523565e-06, "loss": 20.7745, "step": 56090 }, { "epoch": 0.61, "learning_rate": 7.080477990475258e-06, "loss": 20.6851, "step": 56100 }, { "epoch": 0.61, "learning_rate": 7.077129356345793e-06, "loss": 20.7978, "step": 56110 }, { "epoch": 0.61, "learning_rate": 7.073781080545697e-06, "loss": 21.4087, "step": 56120 }, { "epoch": 0.61, "learning_rate": 7.070433163485451e-06, "loss": 21.2454, "step": 56130 }, { "epoch": 0.61, "learning_rate": 7.067085605575488e-06, "loss": 21.3211, "step": 56140 }, { "epoch": 0.61, "learning_rate": 7.063738407226206e-06, "loss": 21.4667, "step": 56150 }, { "epoch": 0.61, "learning_rate": 7.060391568847956e-06, "loss": 21.1566, "step": 56160 }, { "epoch": 0.61, "learning_rate": 7.057045090851042e-06, "loss": 21.0962, "step": 56170 }, { "epoch": 0.61, "learning_rate": 7.0536989736457266e-06, "loss": 21.3107, "step": 56180 }, { "epoch": 0.61, "learning_rate": 7.0503532176422275e-06, "loss": 20.5011, "step": 56190 }, { "epoch": 0.61, "learning_rate": 7.047007823250712e-06, "loss": 20.7845, "step": 56200 }, { "epoch": 0.61, "learning_rate": 7.043662790881316e-06, "loss": 20.6429, "step": 56210 }, { "epoch": 0.61, "learning_rate": 7.0403181209441205e-06, "loss": 20.8324, "step": 56220 }, { "epoch": 0.61, "learning_rate": 7.036973813849166e-06, "loss": 21.0751, "step": 56230 }, { "epoch": 0.61, "learning_rate": 7.033629870006451e-06, "loss": 21.4863, "step": 56240 }, { "epoch": 0.61, "learning_rate": 7.030286289825917e-06, "loss": 21.2579, "step": 56250 }, { "epoch": 0.61, "learning_rate": 7.0269430737174796e-06, "loss": 21.2744, "step": 56260 }, { "epoch": 0.61, "learning_rate": 7.023600222090996e-06, "loss": 21.6098, "step": 56270 }, { "epoch": 0.61, "learning_rate": 7.020257735356286e-06, "loss": 20.9994, "step": 56280 }, { "epoch": 0.61, "learning_rate": 7.0169156139231205e-06, "loss": 21.3915, "step": 56290 }, { "epoch": 0.61, "learning_rate": 7.013573858201224e-06, "loss": 20.7539, "step": 56300 }, { "epoch": 0.61, "learning_rate": 7.010232468600283e-06, "loss": 21.5236, "step": 56310 }, { "epoch": 0.61, "learning_rate": 7.006891445529934e-06, "loss": 21.1052, "step": 56320 }, { "epoch": 0.61, "learning_rate": 7.003550789399769e-06, "loss": 21.4718, "step": 56330 }, { "epoch": 0.61, "learning_rate": 7.000210500619335e-06, "loss": 20.5438, "step": 56340 }, { "epoch": 0.61, "learning_rate": 6.996870579598141e-06, "loss": 21.281, "step": 56350 }, { "epoch": 0.61, "learning_rate": 6.993531026745636e-06, "loss": 20.9692, "step": 56360 }, { "epoch": 0.61, "learning_rate": 6.990191842471237e-06, "loss": 21.7546, "step": 56370 }, { "epoch": 0.61, "learning_rate": 6.98685302718431e-06, "loss": 20.7945, "step": 56380 }, { "epoch": 0.61, "learning_rate": 6.9835145812941775e-06, "loss": 21.7286, "step": 56390 }, { "epoch": 0.61, "learning_rate": 6.980176505210121e-06, "loss": 21.6221, "step": 56400 }, { "epoch": 0.61, "learning_rate": 6.976838799341363e-06, "loss": 21.2027, "step": 56410 }, { "epoch": 0.61, "learning_rate": 6.973501464097096e-06, "loss": 21.8898, "step": 56420 }, { "epoch": 0.61, "learning_rate": 6.970164499886458e-06, "loss": 21.0132, "step": 56430 }, { "epoch": 0.61, "learning_rate": 6.966827907118543e-06, "loss": 20.3429, "step": 56440 }, { "epoch": 0.61, "learning_rate": 6.9634916862024096e-06, "loss": 21.226, "step": 56450 }, { "epoch": 0.61, "learning_rate": 6.9601558375470466e-06, "loss": 21.5155, "step": 56460 }, { "epoch": 0.61, "learning_rate": 6.956820361561425e-06, "loss": 20.419, "step": 56470 }, { "epoch": 0.61, "learning_rate": 6.953485258654453e-06, "loss": 21.3165, "step": 56480 }, { "epoch": 0.61, "learning_rate": 6.950150529234996e-06, "loss": 21.4065, "step": 56490 }, { "epoch": 0.61, "learning_rate": 6.946816173711878e-06, "loss": 20.869, "step": 56500 }, { "epoch": 0.61, "learning_rate": 6.9434821924938756e-06, "loss": 20.8595, "step": 56510 }, { "epoch": 0.61, "learning_rate": 6.940148585989714e-06, "loss": 21.5486, "step": 56520 }, { "epoch": 0.61, "learning_rate": 6.93681535460808e-06, "loss": 20.6725, "step": 56530 }, { "epoch": 0.61, "learning_rate": 6.933482498757606e-06, "loss": 21.3732, "step": 56540 }, { "epoch": 0.61, "learning_rate": 6.9301500188468905e-06, "loss": 21.5818, "step": 56550 }, { "epoch": 0.61, "learning_rate": 6.926817915284479e-06, "loss": 20.2941, "step": 56560 }, { "epoch": 0.61, "learning_rate": 6.923486188478864e-06, "loss": 21.4345, "step": 56570 }, { "epoch": 0.61, "learning_rate": 6.920154838838502e-06, "loss": 21.2361, "step": 56580 }, { "epoch": 0.61, "learning_rate": 6.9168238667718e-06, "loss": 21.4838, "step": 56590 }, { "epoch": 0.61, "learning_rate": 6.913493272687119e-06, "loss": 21.0136, "step": 56600 }, { "epoch": 0.61, "learning_rate": 6.910163056992774e-06, "loss": 21.2907, "step": 56610 }, { "epoch": 0.61, "learning_rate": 6.906833220097033e-06, "loss": 20.7013, "step": 56620 }, { "epoch": 0.61, "learning_rate": 6.903503762408115e-06, "loss": 20.9834, "step": 56630 }, { "epoch": 0.61, "learning_rate": 6.900174684334193e-06, "loss": 21.9689, "step": 56640 }, { "epoch": 0.61, "learning_rate": 6.896845986283401e-06, "loss": 21.3844, "step": 56650 }, { "epoch": 0.61, "learning_rate": 6.8935176686638175e-06, "loss": 21.1089, "step": 56660 }, { "epoch": 0.61, "learning_rate": 6.890189731883481e-06, "loss": 20.8605, "step": 56670 }, { "epoch": 0.61, "learning_rate": 6.886862176350375e-06, "loss": 21.9226, "step": 56680 }, { "epoch": 0.61, "learning_rate": 6.883535002472441e-06, "loss": 21.3641, "step": 56690 }, { "epoch": 0.61, "learning_rate": 6.880208210657579e-06, "loss": 21.7278, "step": 56700 }, { "epoch": 0.61, "learning_rate": 6.876881801313635e-06, "loss": 21.111, "step": 56710 }, { "epoch": 0.61, "learning_rate": 6.8735557748484115e-06, "loss": 20.6455, "step": 56720 }, { "epoch": 0.61, "learning_rate": 6.870230131669659e-06, "loss": 21.3883, "step": 56730 }, { "epoch": 0.61, "learning_rate": 6.866904872185085e-06, "loss": 21.1209, "step": 56740 }, { "epoch": 0.61, "learning_rate": 6.863579996802353e-06, "loss": 21.7043, "step": 56750 }, { "epoch": 0.61, "learning_rate": 6.860255505929074e-06, "loss": 21.1937, "step": 56760 }, { "epoch": 0.61, "learning_rate": 6.856931399972815e-06, "loss": 21.9996, "step": 56770 }, { "epoch": 0.61, "learning_rate": 6.853607679341099e-06, "loss": 22.3081, "step": 56780 }, { "epoch": 0.61, "learning_rate": 6.850284344441386e-06, "loss": 21.1268, "step": 56790 }, { "epoch": 0.61, "learning_rate": 6.846961395681111e-06, "loss": 20.7087, "step": 56800 }, { "epoch": 0.61, "learning_rate": 6.843638833467645e-06, "loss": 21.1036, "step": 56810 }, { "epoch": 0.61, "learning_rate": 6.840316658208321e-06, "loss": 21.6205, "step": 56820 }, { "epoch": 0.61, "learning_rate": 6.836994870310424e-06, "loss": 20.9337, "step": 56830 }, { "epoch": 0.61, "learning_rate": 6.8336734701811795e-06, "loss": 20.8019, "step": 56840 }, { "epoch": 0.61, "learning_rate": 6.83035245822778e-06, "loss": 21.3087, "step": 56850 }, { "epoch": 0.61, "learning_rate": 6.827031834857366e-06, "loss": 21.6667, "step": 56860 }, { "epoch": 0.61, "learning_rate": 6.823711600477025e-06, "loss": 21.108, "step": 56870 }, { "epoch": 0.61, "learning_rate": 6.820391755493808e-06, "loss": 20.4982, "step": 56880 }, { "epoch": 0.62, "learning_rate": 6.8170723003147085e-06, "loss": 20.5867, "step": 56890 }, { "epoch": 0.62, "learning_rate": 6.813753235346674e-06, "loss": 21.7079, "step": 56900 }, { "epoch": 0.62, "learning_rate": 6.810434560996604e-06, "loss": 20.8539, "step": 56910 }, { "epoch": 0.62, "learning_rate": 6.807116277671351e-06, "loss": 21.0213, "step": 56920 }, { "epoch": 0.62, "learning_rate": 6.803798385777725e-06, "loss": 20.9231, "step": 56930 }, { "epoch": 0.62, "learning_rate": 6.800480885722481e-06, "loss": 21.2848, "step": 56940 }, { "epoch": 0.62, "learning_rate": 6.797163777912326e-06, "loss": 20.8172, "step": 56950 }, { "epoch": 0.62, "learning_rate": 6.793847062753922e-06, "loss": 20.906, "step": 56960 }, { "epoch": 0.62, "learning_rate": 6.790530740653878e-06, "loss": 21.1519, "step": 56970 }, { "epoch": 0.62, "learning_rate": 6.787214812018765e-06, "loss": 20.7326, "step": 56980 }, { "epoch": 0.62, "learning_rate": 6.783899277255099e-06, "loss": 20.8058, "step": 56990 }, { "epoch": 0.62, "learning_rate": 6.780584136769344e-06, "loss": 21.1333, "step": 57000 }, { "epoch": 0.62, "learning_rate": 6.777269390967921e-06, "loss": 20.7302, "step": 57010 }, { "epoch": 0.62, "learning_rate": 6.773955040257199e-06, "loss": 21.3703, "step": 57020 }, { "epoch": 0.62, "learning_rate": 6.770641085043505e-06, "loss": 21.2168, "step": 57030 }, { "epoch": 0.62, "learning_rate": 6.767327525733114e-06, "loss": 20.5813, "step": 57040 }, { "epoch": 0.62, "learning_rate": 6.76401436273225e-06, "loss": 20.0947, "step": 57050 }, { "epoch": 0.62, "learning_rate": 6.7607015964470875e-06, "loss": 21.5392, "step": 57060 }, { "epoch": 0.62, "learning_rate": 6.757389227283757e-06, "loss": 20.9179, "step": 57070 }, { "epoch": 0.62, "learning_rate": 6.754077255648341e-06, "loss": 20.8562, "step": 57080 }, { "epoch": 0.62, "learning_rate": 6.750765681946867e-06, "loss": 20.9245, "step": 57090 }, { "epoch": 0.62, "learning_rate": 6.747454506585323e-06, "loss": 21.85, "step": 57100 }, { "epoch": 0.62, "learning_rate": 6.744143729969634e-06, "loss": 21.8976, "step": 57110 }, { "epoch": 0.62, "learning_rate": 6.74083335250569e-06, "loss": 21.5416, "step": 57120 }, { "epoch": 0.62, "learning_rate": 6.737523374599327e-06, "loss": 20.7626, "step": 57130 }, { "epoch": 0.62, "learning_rate": 6.734213796656332e-06, "loss": 21.463, "step": 57140 }, { "epoch": 0.62, "learning_rate": 6.7309046190824435e-06, "loss": 21.1136, "step": 57150 }, { "epoch": 0.62, "learning_rate": 6.727595842283346e-06, "loss": 21.5542, "step": 57160 }, { "epoch": 0.62, "learning_rate": 6.724287466664679e-06, "loss": 21.6602, "step": 57170 }, { "epoch": 0.62, "learning_rate": 6.7209794926320385e-06, "loss": 20.3474, "step": 57180 }, { "epoch": 0.62, "learning_rate": 6.717671920590961e-06, "loss": 21.5096, "step": 57190 }, { "epoch": 0.62, "learning_rate": 6.714364750946938e-06, "loss": 20.8741, "step": 57200 }, { "epoch": 0.62, "learning_rate": 6.71105798410542e-06, "loss": 21.2583, "step": 57210 }, { "epoch": 0.62, "learning_rate": 6.7077516204717895e-06, "loss": 21.5493, "step": 57220 }, { "epoch": 0.62, "learning_rate": 6.7044456604513955e-06, "loss": 21.8928, "step": 57230 }, { "epoch": 0.62, "learning_rate": 6.7011401044495304e-06, "loss": 21.3996, "step": 57240 }, { "epoch": 0.62, "learning_rate": 6.697834952871438e-06, "loss": 20.9124, "step": 57250 }, { "epoch": 0.62, "learning_rate": 6.694530206122323e-06, "loss": 21.9051, "step": 57260 }, { "epoch": 0.62, "learning_rate": 6.691225864607314e-06, "loss": 21.0538, "step": 57270 }, { "epoch": 0.62, "learning_rate": 6.68792192873152e-06, "loss": 20.6072, "step": 57280 }, { "epoch": 0.62, "learning_rate": 6.684618398899982e-06, "loss": 21.7617, "step": 57290 }, { "epoch": 0.62, "learning_rate": 6.681315275517697e-06, "loss": 21.5036, "step": 57300 }, { "epoch": 0.62, "learning_rate": 6.678012558989612e-06, "loss": 21.4322, "step": 57310 }, { "epoch": 0.62, "learning_rate": 6.674710249720626e-06, "loss": 21.4064, "step": 57320 }, { "epoch": 0.62, "learning_rate": 6.67140834811558e-06, "loss": 21.8171, "step": 57330 }, { "epoch": 0.62, "learning_rate": 6.668106854579275e-06, "loss": 21.7269, "step": 57340 }, { "epoch": 0.62, "learning_rate": 6.664805769516452e-06, "loss": 21.2076, "step": 57350 }, { "epoch": 0.62, "learning_rate": 6.661505093331816e-06, "loss": 20.7138, "step": 57360 }, { "epoch": 0.62, "learning_rate": 6.65820482643001e-06, "loss": 20.5116, "step": 57370 }, { "epoch": 0.62, "learning_rate": 6.654904969215628e-06, "loss": 20.9251, "step": 57380 }, { "epoch": 0.62, "learning_rate": 6.651605522093217e-06, "loss": 21.2315, "step": 57390 }, { "epoch": 0.62, "learning_rate": 6.648306485467274e-06, "loss": 21.8267, "step": 57400 }, { "epoch": 0.62, "learning_rate": 6.645007859742241e-06, "loss": 20.8328, "step": 57410 }, { "epoch": 0.62, "learning_rate": 6.64170964532252e-06, "loss": 21.7467, "step": 57420 }, { "epoch": 0.62, "learning_rate": 6.638411842612451e-06, "loss": 21.1259, "step": 57430 }, { "epoch": 0.62, "learning_rate": 6.635114452016327e-06, "loss": 21.5825, "step": 57440 }, { "epoch": 0.62, "learning_rate": 6.631817473938393e-06, "loss": 21.2087, "step": 57450 }, { "epoch": 0.62, "learning_rate": 6.628520908782841e-06, "loss": 21.2735, "step": 57460 }, { "epoch": 0.62, "learning_rate": 6.625224756953816e-06, "loss": 20.6762, "step": 57470 }, { "epoch": 0.62, "learning_rate": 6.621929018855413e-06, "loss": 21.1135, "step": 57480 }, { "epoch": 0.62, "learning_rate": 6.618633694891664e-06, "loss": 20.3356, "step": 57490 }, { "epoch": 0.62, "learning_rate": 6.615338785466565e-06, "loss": 20.1893, "step": 57500 }, { "epoch": 0.62, "learning_rate": 6.612044290984052e-06, "loss": 21.2222, "step": 57510 }, { "epoch": 0.62, "learning_rate": 6.608750211848018e-06, "loss": 20.642, "step": 57520 }, { "epoch": 0.62, "learning_rate": 6.605456548462301e-06, "loss": 21.0755, "step": 57530 }, { "epoch": 0.62, "learning_rate": 6.602163301230684e-06, "loss": 21.7082, "step": 57540 }, { "epoch": 0.62, "learning_rate": 6.598870470556903e-06, "loss": 20.962, "step": 57550 }, { "epoch": 0.62, "learning_rate": 6.595578056844642e-06, "loss": 20.7186, "step": 57560 }, { "epoch": 0.62, "learning_rate": 6.592286060497537e-06, "loss": 20.368, "step": 57570 }, { "epoch": 0.62, "learning_rate": 6.588994481919171e-06, "loss": 21.2155, "step": 57580 }, { "epoch": 0.62, "learning_rate": 6.585703321513075e-06, "loss": 21.3163, "step": 57590 }, { "epoch": 0.62, "learning_rate": 6.582412579682726e-06, "loss": 20.9886, "step": 57600 }, { "epoch": 0.62, "learning_rate": 6.579122256831551e-06, "loss": 21.3307, "step": 57610 }, { "epoch": 0.62, "learning_rate": 6.575832353362934e-06, "loss": 20.9124, "step": 57620 }, { "epoch": 0.62, "learning_rate": 6.572542869680196e-06, "loss": 20.8417, "step": 57630 }, { "epoch": 0.62, "learning_rate": 6.569253806186615e-06, "loss": 21.3688, "step": 57640 }, { "epoch": 0.62, "learning_rate": 6.565965163285408e-06, "loss": 21.1108, "step": 57650 }, { "epoch": 0.62, "learning_rate": 6.562676941379746e-06, "loss": 21.154, "step": 57660 }, { "epoch": 0.62, "learning_rate": 6.559389140872756e-06, "loss": 21.1359, "step": 57670 }, { "epoch": 0.62, "learning_rate": 6.556101762167502e-06, "loss": 20.974, "step": 57680 }, { "epoch": 0.62, "learning_rate": 6.552814805667001e-06, "loss": 20.8668, "step": 57690 }, { "epoch": 0.62, "learning_rate": 6.549528271774215e-06, "loss": 21.2818, "step": 57700 }, { "epoch": 0.62, "learning_rate": 6.546242160892056e-06, "loss": 21.3748, "step": 57710 }, { "epoch": 0.62, "learning_rate": 6.54295647342339e-06, "loss": 21.9979, "step": 57720 }, { "epoch": 0.62, "learning_rate": 6.539671209771021e-06, "loss": 21.4808, "step": 57730 }, { "epoch": 0.62, "learning_rate": 6.536386370337707e-06, "loss": 21.0624, "step": 57740 }, { "epoch": 0.62, "learning_rate": 6.53310195552616e-06, "loss": 21.2673, "step": 57750 }, { "epoch": 0.62, "learning_rate": 6.5298179657390206e-06, "loss": 21.2424, "step": 57760 }, { "epoch": 0.62, "learning_rate": 6.526534401378896e-06, "loss": 21.4234, "step": 57770 }, { "epoch": 0.62, "learning_rate": 6.523251262848338e-06, "loss": 21.3386, "step": 57780 }, { "epoch": 0.62, "learning_rate": 6.519968550549834e-06, "loss": 21.5361, "step": 57790 }, { "epoch": 0.62, "learning_rate": 6.516686264885842e-06, "loss": 21.2007, "step": 57800 }, { "epoch": 0.62, "learning_rate": 6.513404406258738e-06, "loss": 20.4568, "step": 57810 }, { "epoch": 0.63, "learning_rate": 6.510122975070872e-06, "loss": 20.9167, "step": 57820 }, { "epoch": 0.63, "learning_rate": 6.5068419717245266e-06, "loss": 21.3648, "step": 57830 }, { "epoch": 0.63, "learning_rate": 6.503561396621938e-06, "loss": 20.8649, "step": 57840 }, { "epoch": 0.63, "learning_rate": 6.50028125016529e-06, "loss": 21.2718, "step": 57850 }, { "epoch": 0.63, "learning_rate": 6.497001532756711e-06, "loss": 21.3113, "step": 57860 }, { "epoch": 0.63, "learning_rate": 6.493722244798277e-06, "loss": 21.0249, "step": 57870 }, { "epoch": 0.63, "learning_rate": 6.490443386692012e-06, "loss": 21.7342, "step": 57880 }, { "epoch": 0.63, "learning_rate": 6.487164958839887e-06, "loss": 21.0303, "step": 57890 }, { "epoch": 0.63, "learning_rate": 6.483886961643824e-06, "loss": 21.3831, "step": 57900 }, { "epoch": 0.63, "learning_rate": 6.48060939550569e-06, "loss": 20.4216, "step": 57910 }, { "epoch": 0.63, "learning_rate": 6.477332260827294e-06, "loss": 20.3796, "step": 57920 }, { "epoch": 0.63, "learning_rate": 6.474055558010397e-06, "loss": 20.8983, "step": 57930 }, { "epoch": 0.63, "learning_rate": 6.470779287456706e-06, "loss": 21.3628, "step": 57940 }, { "epoch": 0.63, "learning_rate": 6.46750344956788e-06, "loss": 21.3349, "step": 57950 }, { "epoch": 0.63, "learning_rate": 6.464228044745519e-06, "loss": 20.7033, "step": 57960 }, { "epoch": 0.63, "learning_rate": 6.460953073391167e-06, "loss": 21.3991, "step": 57970 }, { "epoch": 0.63, "learning_rate": 6.4576785359063225e-06, "loss": 21.7412, "step": 57980 }, { "epoch": 0.63, "learning_rate": 6.454404432692425e-06, "loss": 21.258, "step": 57990 }, { "epoch": 0.63, "learning_rate": 6.451130764150866e-06, "loss": 20.6816, "step": 58000 }, { "epoch": 0.63, "learning_rate": 6.447857530682982e-06, "loss": 20.1945, "step": 58010 }, { "epoch": 0.63, "learning_rate": 6.444584732690053e-06, "loss": 20.6858, "step": 58020 }, { "epoch": 0.63, "learning_rate": 6.441312370573307e-06, "loss": 21.2579, "step": 58030 }, { "epoch": 0.63, "learning_rate": 6.438040444733917e-06, "loss": 21.6703, "step": 58040 }, { "epoch": 0.63, "learning_rate": 6.434768955573012e-06, "loss": 21.1205, "step": 58050 }, { "epoch": 0.63, "learning_rate": 6.431497903491655e-06, "loss": 21.0158, "step": 58060 }, { "epoch": 0.63, "learning_rate": 6.428227288890864e-06, "loss": 21.5818, "step": 58070 }, { "epoch": 0.63, "learning_rate": 6.424957112171596e-06, "loss": 21.511, "step": 58080 }, { "epoch": 0.63, "learning_rate": 6.4216873737347576e-06, "loss": 21.5322, "step": 58090 }, { "epoch": 0.63, "learning_rate": 6.418418073981207e-06, "loss": 21.3709, "step": 58100 }, { "epoch": 0.63, "learning_rate": 6.415149213311743e-06, "loss": 20.837, "step": 58110 }, { "epoch": 0.63, "learning_rate": 6.411880792127112e-06, "loss": 20.8257, "step": 58120 }, { "epoch": 0.63, "learning_rate": 6.408612810828003e-06, "loss": 21.1052, "step": 58130 }, { "epoch": 0.63, "learning_rate": 6.405345269815055e-06, "loss": 20.9241, "step": 58140 }, { "epoch": 0.63, "learning_rate": 6.402078169488855e-06, "loss": 21.2149, "step": 58150 }, { "epoch": 0.63, "learning_rate": 6.3988115102499316e-06, "loss": 20.746, "step": 58160 }, { "epoch": 0.63, "learning_rate": 6.395545292498758e-06, "loss": 20.2705, "step": 58170 }, { "epoch": 0.63, "learning_rate": 6.392279516635766e-06, "loss": 21.1384, "step": 58180 }, { "epoch": 0.63, "learning_rate": 6.38901418306131e-06, "loss": 21.2504, "step": 58190 }, { "epoch": 0.63, "learning_rate": 6.385749292175711e-06, "loss": 21.1882, "step": 58200 }, { "epoch": 0.63, "learning_rate": 6.38248484437923e-06, "loss": 21.1, "step": 58210 }, { "epoch": 0.63, "learning_rate": 6.3792208400720665e-06, "loss": 21.2373, "step": 58220 }, { "epoch": 0.63, "learning_rate": 6.375957279654379e-06, "loss": 20.8929, "step": 58230 }, { "epoch": 0.63, "learning_rate": 6.372694163526254e-06, "loss": 22.0503, "step": 58240 }, { "epoch": 0.63, "learning_rate": 6.369431492087741e-06, "loss": 21.33, "step": 58250 }, { "epoch": 0.63, "learning_rate": 6.366169265738822e-06, "loss": 21.3234, "step": 58260 }, { "epoch": 0.63, "learning_rate": 6.362907484879433e-06, "loss": 21.9578, "step": 58270 }, { "epoch": 0.63, "learning_rate": 6.3596461499094505e-06, "loss": 20.7666, "step": 58280 }, { "epoch": 0.63, "learning_rate": 6.356385261228701e-06, "loss": 20.4365, "step": 58290 }, { "epoch": 0.63, "learning_rate": 6.353124819236951e-06, "loss": 20.9882, "step": 58300 }, { "epoch": 0.63, "learning_rate": 6.3498648243339125e-06, "loss": 20.8651, "step": 58310 }, { "epoch": 0.63, "learning_rate": 6.346605276919245e-06, "loss": 20.7502, "step": 58320 }, { "epoch": 0.63, "learning_rate": 6.343346177392556e-06, "loss": 21.1021, "step": 58330 }, { "epoch": 0.63, "learning_rate": 6.340087526153394e-06, "loss": 21.776, "step": 58340 }, { "epoch": 0.63, "learning_rate": 6.33682932360125e-06, "loss": 21.5336, "step": 58350 }, { "epoch": 0.63, "learning_rate": 6.333571570135566e-06, "loss": 21.6755, "step": 58360 }, { "epoch": 0.63, "learning_rate": 6.3303142661557245e-06, "loss": 21.748, "step": 58370 }, { "epoch": 0.63, "learning_rate": 6.327057412061059e-06, "loss": 21.4, "step": 58380 }, { "epoch": 0.63, "learning_rate": 6.323801008250843e-06, "loss": 21.9125, "step": 58390 }, { "epoch": 0.63, "learning_rate": 6.32054505512429e-06, "loss": 20.4632, "step": 58400 }, { "epoch": 0.63, "learning_rate": 6.3172895530805666e-06, "loss": 20.9328, "step": 58410 }, { "epoch": 0.63, "learning_rate": 6.31403450251878e-06, "loss": 20.7346, "step": 58420 }, { "epoch": 0.63, "learning_rate": 6.310779903837987e-06, "loss": 20.7888, "step": 58430 }, { "epoch": 0.63, "learning_rate": 6.307525757437182e-06, "loss": 20.8685, "step": 58440 }, { "epoch": 0.63, "learning_rate": 6.304272063715309e-06, "loss": 21.4137, "step": 58450 }, { "epoch": 0.63, "learning_rate": 6.301018823071252e-06, "loss": 21.6171, "step": 58460 }, { "epoch": 0.63, "learning_rate": 6.297766035903843e-06, "loss": 21.7802, "step": 58470 }, { "epoch": 0.63, "learning_rate": 6.294513702611859e-06, "loss": 21.8689, "step": 58480 }, { "epoch": 0.63, "learning_rate": 6.291261823594018e-06, "loss": 21.193, "step": 58490 }, { "epoch": 0.63, "learning_rate": 6.288010399248989e-06, "loss": 21.2693, "step": 58500 }, { "epoch": 0.63, "learning_rate": 6.2847594299753725e-06, "loss": 20.5997, "step": 58510 }, { "epoch": 0.63, "learning_rate": 6.281508916171724e-06, "loss": 20.9031, "step": 58520 }, { "epoch": 0.63, "learning_rate": 6.2782588582365426e-06, "loss": 21.5618, "step": 58530 }, { "epoch": 0.63, "learning_rate": 6.275009256568267e-06, "loss": 21.4345, "step": 58540 }, { "epoch": 0.63, "learning_rate": 6.271760111565286e-06, "loss": 20.9574, "step": 58550 }, { "epoch": 0.63, "learning_rate": 6.268511423625926e-06, "loss": 20.6691, "step": 58560 }, { "epoch": 0.63, "learning_rate": 6.265263193148455e-06, "loss": 21.0543, "step": 58570 }, { "epoch": 0.63, "learning_rate": 6.262015420531098e-06, "loss": 20.8915, "step": 58580 }, { "epoch": 0.63, "learning_rate": 6.258768106172011e-06, "loss": 21.4989, "step": 58590 }, { "epoch": 0.63, "learning_rate": 6.2555212504693e-06, "loss": 21.2218, "step": 58600 }, { "epoch": 0.63, "learning_rate": 6.252274853821014e-06, "loss": 20.8874, "step": 58610 }, { "epoch": 0.63, "learning_rate": 6.249028916625142e-06, "loss": 21.4595, "step": 58620 }, { "epoch": 0.63, "learning_rate": 6.245783439279623e-06, "loss": 21.7118, "step": 58630 }, { "epoch": 0.63, "learning_rate": 6.242538422182336e-06, "loss": 21.6983, "step": 58640 }, { "epoch": 0.63, "learning_rate": 6.239293865731102e-06, "loss": 20.4646, "step": 58650 }, { "epoch": 0.63, "learning_rate": 6.236049770323691e-06, "loss": 20.8762, "step": 58660 }, { "epoch": 0.63, "learning_rate": 6.2328061363578054e-06, "loss": 21.6121, "step": 58670 }, { "epoch": 0.63, "learning_rate": 6.2295629642311065e-06, "loss": 21.7331, "step": 58680 }, { "epoch": 0.63, "learning_rate": 6.226320254341187e-06, "loss": 20.8213, "step": 58690 }, { "epoch": 0.63, "learning_rate": 6.22307800708559e-06, "loss": 21.108, "step": 58700 }, { "epoch": 0.63, "learning_rate": 6.219836222861794e-06, "loss": 21.5757, "step": 58710 }, { "epoch": 0.63, "learning_rate": 6.216594902067233e-06, "loss": 20.8951, "step": 58720 }, { "epoch": 0.63, "learning_rate": 6.2133540450992694e-06, "loss": 21.3295, "step": 58730 }, { "epoch": 0.64, "learning_rate": 6.2101136523552185e-06, "loss": 21.6146, "step": 58740 }, { "epoch": 0.64, "learning_rate": 6.206873724232338e-06, "loss": 21.0342, "step": 58750 }, { "epoch": 0.64, "learning_rate": 6.203634261127825e-06, "loss": 21.601, "step": 58760 }, { "epoch": 0.64, "learning_rate": 6.2003952634388235e-06, "loss": 21.6438, "step": 58770 }, { "epoch": 0.64, "learning_rate": 6.197156731562416e-06, "loss": 21.7655, "step": 58780 }, { "epoch": 0.64, "learning_rate": 6.193918665895632e-06, "loss": 21.4429, "step": 58790 }, { "epoch": 0.64, "learning_rate": 6.190681066835443e-06, "loss": 21.9946, "step": 58800 }, { "epoch": 0.64, "learning_rate": 6.187443934778756e-06, "loss": 20.5925, "step": 58810 }, { "epoch": 0.64, "learning_rate": 6.184207270122441e-06, "loss": 21.4481, "step": 58820 }, { "epoch": 0.64, "learning_rate": 6.180971073263282e-06, "loss": 21.0796, "step": 58830 }, { "epoch": 0.64, "learning_rate": 6.177735344598028e-06, "loss": 21.6787, "step": 58840 }, { "epoch": 0.64, "learning_rate": 6.174500084523364e-06, "loss": 22.0901, "step": 58850 }, { "epoch": 0.64, "learning_rate": 6.171265293435912e-06, "loss": 21.3636, "step": 58860 }, { "epoch": 0.64, "learning_rate": 6.168030971732246e-06, "loss": 21.3927, "step": 58870 }, { "epoch": 0.64, "learning_rate": 6.164797119808878e-06, "loss": 21.0744, "step": 58880 }, { "epoch": 0.64, "learning_rate": 6.1615637380622594e-06, "loss": 20.7298, "step": 58890 }, { "epoch": 0.64, "learning_rate": 6.158330826888786e-06, "loss": 20.3647, "step": 58900 }, { "epoch": 0.64, "learning_rate": 6.155098386684797e-06, "loss": 20.8735, "step": 58910 }, { "epoch": 0.64, "learning_rate": 6.1518664178465755e-06, "loss": 21.1453, "step": 58920 }, { "epoch": 0.64, "learning_rate": 6.148634920770346e-06, "loss": 21.8689, "step": 58930 }, { "epoch": 0.64, "learning_rate": 6.145403895852271e-06, "loss": 20.8264, "step": 58940 }, { "epoch": 0.64, "learning_rate": 6.142173343488457e-06, "loss": 20.8408, "step": 58950 }, { "epoch": 0.64, "learning_rate": 6.138943264074954e-06, "loss": 20.6922, "step": 58960 }, { "epoch": 0.64, "learning_rate": 6.135713658007756e-06, "loss": 21.4376, "step": 58970 }, { "epoch": 0.64, "learning_rate": 6.132484525682796e-06, "loss": 21.445, "step": 58980 }, { "epoch": 0.64, "learning_rate": 6.129255867495951e-06, "loss": 20.8926, "step": 58990 }, { "epoch": 0.64, "learning_rate": 6.126027683843034e-06, "loss": 21.5676, "step": 59000 }, { "epoch": 0.64, "learning_rate": 6.1227999751198065e-06, "loss": 21.4445, "step": 59010 }, { "epoch": 0.64, "learning_rate": 6.119572741721971e-06, "loss": 20.7237, "step": 59020 }, { "epoch": 0.64, "learning_rate": 6.116345984045168e-06, "loss": 20.5016, "step": 59030 }, { "epoch": 0.64, "learning_rate": 6.1131197024849845e-06, "loss": 21.3281, "step": 59040 }, { "epoch": 0.64, "learning_rate": 6.109893897436943e-06, "loss": 20.5428, "step": 59050 }, { "epoch": 0.64, "learning_rate": 6.1066685692965125e-06, "loss": 21.1054, "step": 59060 }, { "epoch": 0.64, "learning_rate": 6.103443718459102e-06, "loss": 21.435, "step": 59070 }, { "epoch": 0.64, "learning_rate": 6.100219345320064e-06, "loss": 20.9594, "step": 59080 }, { "epoch": 0.64, "learning_rate": 6.0969954502746916e-06, "loss": 20.6894, "step": 59090 }, { "epoch": 0.64, "learning_rate": 6.093772033718214e-06, "loss": 21.4271, "step": 59100 }, { "epoch": 0.64, "learning_rate": 6.090549096045806e-06, "loss": 21.0023, "step": 59110 }, { "epoch": 0.64, "learning_rate": 6.0873266376525865e-06, "loss": 20.8684, "step": 59120 }, { "epoch": 0.64, "learning_rate": 6.084104658933612e-06, "loss": 20.8568, "step": 59130 }, { "epoch": 0.64, "learning_rate": 6.080883160283879e-06, "loss": 21.4012, "step": 59140 }, { "epoch": 0.64, "learning_rate": 6.0776621420983375e-06, "loss": 21.2785, "step": 59150 }, { "epoch": 0.64, "learning_rate": 6.0744416047718515e-06, "loss": 21.9565, "step": 59160 }, { "epoch": 0.64, "learning_rate": 6.071221548699253e-06, "loss": 21.4129, "step": 59170 }, { "epoch": 0.64, "learning_rate": 6.068001974275303e-06, "loss": 21.7693, "step": 59180 }, { "epoch": 0.64, "learning_rate": 6.064782881894705e-06, "loss": 21.5985, "step": 59190 }, { "epoch": 0.64, "learning_rate": 6.061564271952109e-06, "loss": 21.1803, "step": 59200 }, { "epoch": 0.64, "learning_rate": 6.05834614484209e-06, "loss": 20.6335, "step": 59210 }, { "epoch": 0.64, "learning_rate": 6.055128500959182e-06, "loss": 21.2812, "step": 59220 }, { "epoch": 0.64, "learning_rate": 6.051911340697849e-06, "loss": 21.1417, "step": 59230 }, { "epoch": 0.64, "learning_rate": 6.048694664452499e-06, "loss": 20.876, "step": 59240 }, { "epoch": 0.64, "learning_rate": 6.045478472617482e-06, "loss": 21.391, "step": 59250 }, { "epoch": 0.64, "learning_rate": 6.042262765587088e-06, "loss": 20.451, "step": 59260 }, { "epoch": 0.64, "learning_rate": 6.039047543755545e-06, "loss": 21.0121, "step": 59270 }, { "epoch": 0.64, "learning_rate": 6.035832807517021e-06, "loss": 20.7607, "step": 59280 }, { "epoch": 0.64, "learning_rate": 6.032618557265628e-06, "loss": 20.9801, "step": 59290 }, { "epoch": 0.64, "learning_rate": 6.029404793395419e-06, "loss": 20.7363, "step": 59300 }, { "epoch": 0.64, "learning_rate": 6.026191516300387e-06, "loss": 21.2784, "step": 59310 }, { "epoch": 0.64, "learning_rate": 6.022978726374458e-06, "loss": 20.9209, "step": 59320 }, { "epoch": 0.64, "learning_rate": 6.019766424011508e-06, "loss": 21.265, "step": 59330 }, { "epoch": 0.64, "learning_rate": 6.016554609605347e-06, "loss": 21.2209, "step": 59340 }, { "epoch": 0.64, "learning_rate": 6.013343283549729e-06, "loss": 21.8226, "step": 59350 }, { "epoch": 0.64, "learning_rate": 6.010132446238348e-06, "loss": 21.2314, "step": 59360 }, { "epoch": 0.64, "learning_rate": 6.006922098064833e-06, "loss": 21.7685, "step": 59370 }, { "epoch": 0.64, "learning_rate": 6.003712239422761e-06, "loss": 22.0428, "step": 59380 }, { "epoch": 0.64, "learning_rate": 6.000502870705638e-06, "loss": 21.3498, "step": 59390 }, { "epoch": 0.64, "learning_rate": 5.997293992306923e-06, "loss": 22.1307, "step": 59400 }, { "epoch": 0.64, "learning_rate": 5.994085604620008e-06, "loss": 20.9258, "step": 59410 }, { "epoch": 0.64, "learning_rate": 5.990877708038224e-06, "loss": 21.4788, "step": 59420 }, { "epoch": 0.64, "learning_rate": 5.987670302954841e-06, "loss": 22.2292, "step": 59430 }, { "epoch": 0.64, "learning_rate": 5.984463389763071e-06, "loss": 20.7698, "step": 59440 }, { "epoch": 0.64, "learning_rate": 5.9812569688560695e-06, "loss": 21.0625, "step": 59450 }, { "epoch": 0.64, "learning_rate": 5.9780510406269245e-06, "loss": 21.3372, "step": 59460 }, { "epoch": 0.64, "learning_rate": 5.974845605468671e-06, "loss": 21.0037, "step": 59470 }, { "epoch": 0.64, "learning_rate": 5.971640663774274e-06, "loss": 21.8306, "step": 59480 }, { "epoch": 0.64, "learning_rate": 5.9684362159366415e-06, "loss": 20.4933, "step": 59490 }, { "epoch": 0.64, "learning_rate": 5.9652322623486316e-06, "loss": 21.1576, "step": 59500 }, { "epoch": 0.64, "learning_rate": 5.962028803403026e-06, "loss": 21.1617, "step": 59510 }, { "epoch": 0.64, "learning_rate": 5.958825839492555e-06, "loss": 21.6074, "step": 59520 }, { "epoch": 0.64, "learning_rate": 5.955623371009891e-06, "loss": 21.1957, "step": 59530 }, { "epoch": 0.64, "learning_rate": 5.95242139834763e-06, "loss": 20.7815, "step": 59540 }, { "epoch": 0.64, "learning_rate": 5.949219921898326e-06, "loss": 21.5135, "step": 59550 }, { "epoch": 0.64, "learning_rate": 5.9460189420544615e-06, "loss": 21.4201, "step": 59560 }, { "epoch": 0.64, "learning_rate": 5.942818459208457e-06, "loss": 21.3361, "step": 59570 }, { "epoch": 0.64, "learning_rate": 5.939618473752687e-06, "loss": 21.8908, "step": 59580 }, { "epoch": 0.64, "learning_rate": 5.936418986079441e-06, "loss": 19.9591, "step": 59590 }, { "epoch": 0.64, "learning_rate": 5.9332199965809675e-06, "loss": 21.0871, "step": 59600 }, { "epoch": 0.64, "learning_rate": 5.930021505649443e-06, "loss": 20.8019, "step": 59610 }, { "epoch": 0.64, "learning_rate": 5.926823513676988e-06, "loss": 21.2942, "step": 59620 }, { "epoch": 0.64, "learning_rate": 5.923626021055666e-06, "loss": 21.2105, "step": 59630 }, { "epoch": 0.64, "learning_rate": 5.9204290281774635e-06, "loss": 20.946, "step": 59640 }, { "epoch": 0.64, "learning_rate": 5.917232535434321e-06, "loss": 21.3059, "step": 59650 }, { "epoch": 0.64, "learning_rate": 5.914036543218113e-06, "loss": 21.2207, "step": 59660 }, { "epoch": 0.65, "learning_rate": 5.910841051920648e-06, "loss": 21.578, "step": 59670 }, { "epoch": 0.65, "learning_rate": 5.907646061933685e-06, "loss": 20.9811, "step": 59680 }, { "epoch": 0.65, "learning_rate": 5.904451573648911e-06, "loss": 21.4572, "step": 59690 }, { "epoch": 0.65, "learning_rate": 5.90125758745795e-06, "loss": 20.8835, "step": 59700 }, { "epoch": 0.65, "learning_rate": 5.898064103752372e-06, "loss": 21.2101, "step": 59710 }, { "epoch": 0.65, "learning_rate": 5.894871122923681e-06, "loss": 21.743, "step": 59720 }, { "epoch": 0.65, "learning_rate": 5.891678645363323e-06, "loss": 20.9606, "step": 59730 }, { "epoch": 0.65, "learning_rate": 5.88848667146268e-06, "loss": 21.4128, "step": 59740 }, { "epoch": 0.65, "learning_rate": 5.885295201613068e-06, "loss": 21.2402, "step": 59750 }, { "epoch": 0.65, "learning_rate": 5.882104236205748e-06, "loss": 21.0591, "step": 59760 }, { "epoch": 0.65, "learning_rate": 5.878913775631914e-06, "loss": 20.601, "step": 59770 }, { "epoch": 0.65, "learning_rate": 5.875723820282704e-06, "loss": 21.2125, "step": 59780 }, { "epoch": 0.65, "learning_rate": 5.8725343705491925e-06, "loss": 21.4928, "step": 59790 }, { "epoch": 0.65, "learning_rate": 5.8693454268223835e-06, "loss": 20.7709, "step": 59800 }, { "epoch": 0.65, "learning_rate": 5.86615698949323e-06, "loss": 21.3133, "step": 59810 }, { "epoch": 0.65, "learning_rate": 5.862969058952618e-06, "loss": 20.5318, "step": 59820 }, { "epoch": 0.65, "learning_rate": 5.8597816355913685e-06, "loss": 20.4475, "step": 59830 }, { "epoch": 0.65, "learning_rate": 5.856594719800248e-06, "loss": 21.0524, "step": 59840 }, { "epoch": 0.65, "learning_rate": 5.853408311969959e-06, "loss": 20.8148, "step": 59850 }, { "epoch": 0.65, "learning_rate": 5.8502224124911325e-06, "loss": 21.0012, "step": 59860 }, { "epoch": 0.65, "learning_rate": 5.847037021754346e-06, "loss": 21.353, "step": 59870 }, { "epoch": 0.65, "learning_rate": 5.843852140150112e-06, "loss": 21.0309, "step": 59880 }, { "epoch": 0.65, "learning_rate": 5.840667768068884e-06, "loss": 21.5821, "step": 59890 }, { "epoch": 0.65, "learning_rate": 5.83748390590105e-06, "loss": 21.4076, "step": 59900 }, { "epoch": 0.65, "learning_rate": 5.834300554036933e-06, "loss": 20.8102, "step": 59910 }, { "epoch": 0.65, "learning_rate": 5.831117712866797e-06, "loss": 20.8708, "step": 59920 }, { "epoch": 0.65, "learning_rate": 5.827935382780842e-06, "loss": 20.8196, "step": 59930 }, { "epoch": 0.65, "learning_rate": 5.824753564169202e-06, "loss": 21.308, "step": 59940 }, { "epoch": 0.65, "learning_rate": 5.821572257421961e-06, "loss": 20.8523, "step": 59950 }, { "epoch": 0.65, "learning_rate": 5.818391462929131e-06, "loss": 21.3463, "step": 59960 }, { "epoch": 0.65, "learning_rate": 5.815211181080654e-06, "loss": 21.6942, "step": 59970 }, { "epoch": 0.65, "learning_rate": 5.8120314122664186e-06, "loss": 21.2978, "step": 59980 }, { "epoch": 0.65, "learning_rate": 5.808852156876248e-06, "loss": 21.2767, "step": 59990 }, { "epoch": 0.65, "learning_rate": 5.805673415299908e-06, "loss": 21.0222, "step": 60000 }, { "epoch": 0.65, "learning_rate": 5.802495187927098e-06, "loss": 21.6007, "step": 60010 }, { "epoch": 0.65, "learning_rate": 5.799317475147444e-06, "loss": 21.2805, "step": 60020 }, { "epoch": 0.65, "learning_rate": 5.796140277350524e-06, "loss": 21.7737, "step": 60030 }, { "epoch": 0.65, "learning_rate": 5.792963594925838e-06, "loss": 21.2022, "step": 60040 }, { "epoch": 0.65, "learning_rate": 5.789787428262844e-06, "loss": 21.0006, "step": 60050 }, { "epoch": 0.65, "learning_rate": 5.786611777750922e-06, "loss": 22.1125, "step": 60060 }, { "epoch": 0.65, "learning_rate": 5.783436643779383e-06, "loss": 21.0308, "step": 60070 }, { "epoch": 0.65, "learning_rate": 5.7802620267374875e-06, "loss": 21.3429, "step": 60080 }, { "epoch": 0.65, "learning_rate": 5.777087927014423e-06, "loss": 21.0473, "step": 60090 }, { "epoch": 0.65, "learning_rate": 5.773914344999327e-06, "loss": 21.1375, "step": 60100 }, { "epoch": 0.65, "learning_rate": 5.77074128108126e-06, "loss": 21.3166, "step": 60110 }, { "epoch": 0.65, "learning_rate": 5.767568735649227e-06, "loss": 21.065, "step": 60120 }, { "epoch": 0.65, "learning_rate": 5.764396709092161e-06, "loss": 21.3084, "step": 60130 }, { "epoch": 0.65, "learning_rate": 5.761225201798934e-06, "loss": 20.725, "step": 60140 }, { "epoch": 0.65, "learning_rate": 5.7580542141583665e-06, "loss": 20.1849, "step": 60150 }, { "epoch": 0.65, "learning_rate": 5.7548837465592e-06, "loss": 21.2265, "step": 60160 }, { "epoch": 0.65, "learning_rate": 5.751713799390124e-06, "loss": 21.0033, "step": 60170 }, { "epoch": 0.65, "learning_rate": 5.7485443730397504e-06, "loss": 21.4277, "step": 60180 }, { "epoch": 0.65, "learning_rate": 5.745375467896632e-06, "loss": 21.3779, "step": 60190 }, { "epoch": 0.65, "learning_rate": 5.742207084349274e-06, "loss": 21.1183, "step": 60200 }, { "epoch": 0.65, "learning_rate": 5.739039222786095e-06, "loss": 20.7142, "step": 60210 }, { "epoch": 0.65, "learning_rate": 5.735871883595462e-06, "loss": 21.1241, "step": 60220 }, { "epoch": 0.65, "learning_rate": 5.732705067165678e-06, "loss": 21.2662, "step": 60230 }, { "epoch": 0.65, "learning_rate": 5.729538773884968e-06, "loss": 21.1211, "step": 60240 }, { "epoch": 0.65, "learning_rate": 5.7263730041415145e-06, "loss": 21.6748, "step": 60250 }, { "epoch": 0.65, "learning_rate": 5.723207758323421e-06, "loss": 20.7566, "step": 60260 }, { "epoch": 0.65, "learning_rate": 5.720043036818733e-06, "loss": 21.365, "step": 60270 }, { "epoch": 0.65, "learning_rate": 5.716878840015432e-06, "loss": 20.5023, "step": 60280 }, { "epoch": 0.65, "learning_rate": 5.713715168301419e-06, "loss": 21.1145, "step": 60290 }, { "epoch": 0.65, "learning_rate": 5.710552022064561e-06, "loss": 20.7996, "step": 60300 }, { "epoch": 0.65, "learning_rate": 5.7073894016926355e-06, "loss": 21.5152, "step": 60310 }, { "epoch": 0.65, "learning_rate": 5.704227307573365e-06, "loss": 21.0415, "step": 60320 }, { "epoch": 0.65, "learning_rate": 5.701065740094411e-06, "loss": 21.1621, "step": 60330 }, { "epoch": 0.65, "learning_rate": 5.697904699643355e-06, "loss": 20.5021, "step": 60340 }, { "epoch": 0.65, "learning_rate": 5.694744186607737e-06, "loss": 21.4535, "step": 60350 }, { "epoch": 0.65, "learning_rate": 5.691584201375013e-06, "loss": 21.3207, "step": 60360 }, { "epoch": 0.65, "learning_rate": 5.688424744332584e-06, "loss": 21.1828, "step": 60370 }, { "epoch": 0.65, "learning_rate": 5.685265815867782e-06, "loss": 21.8023, "step": 60380 }, { "epoch": 0.65, "learning_rate": 5.682107416367879e-06, "loss": 20.4205, "step": 60390 }, { "epoch": 0.65, "learning_rate": 5.678949546220076e-06, "loss": 20.7626, "step": 60400 }, { "epoch": 0.65, "learning_rate": 5.675792205811512e-06, "loss": 21.2572, "step": 60410 }, { "epoch": 0.65, "learning_rate": 5.672635395529265e-06, "loss": 21.6185, "step": 60420 }, { "epoch": 0.65, "learning_rate": 5.669479115760339e-06, "loss": 20.8674, "step": 60430 }, { "epoch": 0.65, "learning_rate": 5.6663233668916815e-06, "loss": 20.7233, "step": 60440 }, { "epoch": 0.65, "learning_rate": 5.6631681493101706e-06, "loss": 20.829, "step": 60450 }, { "epoch": 0.65, "learning_rate": 5.6600134634026204e-06, "loss": 20.955, "step": 60460 }, { "epoch": 0.65, "learning_rate": 5.65685930955578e-06, "loss": 21.0852, "step": 60470 }, { "epoch": 0.65, "learning_rate": 5.653705688156333e-06, "loss": 21.229, "step": 60480 }, { "epoch": 0.65, "learning_rate": 5.650552599590896e-06, "loss": 21.2028, "step": 60490 }, { "epoch": 0.65, "learning_rate": 5.647400044246023e-06, "loss": 20.8313, "step": 60500 }, { "epoch": 0.65, "learning_rate": 5.644248022508203e-06, "loss": 21.3184, "step": 60510 }, { "epoch": 0.65, "learning_rate": 5.641096534763857e-06, "loss": 21.2396, "step": 60520 }, { "epoch": 0.65, "learning_rate": 5.63794558139934e-06, "loss": 20.2638, "step": 60530 }, { "epoch": 0.65, "learning_rate": 5.634795162800946e-06, "loss": 21.528, "step": 60540 }, { "epoch": 0.65, "learning_rate": 5.631645279354899e-06, "loss": 21.2678, "step": 60550 }, { "epoch": 0.65, "learning_rate": 5.62849593144736e-06, "loss": 21.034, "step": 60560 }, { "epoch": 0.65, "learning_rate": 5.625347119464422e-06, "loss": 21.7324, "step": 60570 }, { "epoch": 0.65, "learning_rate": 5.622198843792115e-06, "loss": 20.9829, "step": 60580 }, { "epoch": 0.66, "learning_rate": 5.6190511048164e-06, "loss": 21.5214, "step": 60590 }, { "epoch": 0.66, "learning_rate": 5.615903902923177e-06, "loss": 21.1712, "step": 60600 }, { "epoch": 0.66, "learning_rate": 5.612757238498274e-06, "loss": 21.1035, "step": 60610 }, { "epoch": 0.66, "learning_rate": 5.6096111119274585e-06, "loss": 20.6633, "step": 60620 }, { "epoch": 0.66, "learning_rate": 5.60646552359643e-06, "loss": 20.45, "step": 60630 }, { "epoch": 0.66, "learning_rate": 5.6033204738908206e-06, "loss": 20.8124, "step": 60640 }, { "epoch": 0.66, "learning_rate": 5.6001759631961994e-06, "loss": 20.6916, "step": 60650 }, { "epoch": 0.66, "learning_rate": 5.5970319918980655e-06, "loss": 20.7656, "step": 60660 }, { "epoch": 0.66, "learning_rate": 5.593888560381857e-06, "loss": 21.4318, "step": 60670 }, { "epoch": 0.66, "learning_rate": 5.5907456690329395e-06, "loss": 21.278, "step": 60680 }, { "epoch": 0.66, "learning_rate": 5.5876033182366196e-06, "loss": 21.1296, "step": 60690 }, { "epoch": 0.66, "learning_rate": 5.584461508378131e-06, "loss": 21.1729, "step": 60700 }, { "epoch": 0.66, "learning_rate": 5.581320239842645e-06, "loss": 21.2134, "step": 60710 }, { "epoch": 0.66, "learning_rate": 5.578179513015265e-06, "loss": 21.18, "step": 60720 }, { "epoch": 0.66, "learning_rate": 5.575039328281029e-06, "loss": 21.4319, "step": 60730 }, { "epoch": 0.66, "learning_rate": 5.571899686024906e-06, "loss": 21.4396, "step": 60740 }, { "epoch": 0.66, "learning_rate": 5.568760586631805e-06, "loss": 21.2541, "step": 60750 }, { "epoch": 0.66, "learning_rate": 5.56562203048656e-06, "loss": 21.2589, "step": 60760 }, { "epoch": 0.66, "learning_rate": 5.562484017973943e-06, "loss": 20.8686, "step": 60770 }, { "epoch": 0.66, "learning_rate": 5.559346549478659e-06, "loss": 21.4851, "step": 60780 }, { "epoch": 0.66, "learning_rate": 5.556209625385347e-06, "loss": 20.9727, "step": 60790 }, { "epoch": 0.66, "learning_rate": 5.5530732460785775e-06, "loss": 21.0437, "step": 60800 }, { "epoch": 0.66, "learning_rate": 5.54993741194285e-06, "loss": 20.9318, "step": 60810 }, { "epoch": 0.66, "learning_rate": 5.546802123362616e-06, "loss": 20.8534, "step": 60820 }, { "epoch": 0.66, "learning_rate": 5.543667380722232e-06, "loss": 20.786, "step": 60830 }, { "epoch": 0.66, "learning_rate": 5.540533184406007e-06, "loss": 21.5477, "step": 60840 }, { "epoch": 0.66, "learning_rate": 5.537399534798179e-06, "loss": 20.7458, "step": 60850 }, { "epoch": 0.66, "learning_rate": 5.534266432282912e-06, "loss": 21.7308, "step": 60860 }, { "epoch": 0.66, "learning_rate": 5.531133877244321e-06, "loss": 20.9416, "step": 60870 }, { "epoch": 0.66, "learning_rate": 5.528001870066432e-06, "loss": 20.8044, "step": 60880 }, { "epoch": 0.66, "learning_rate": 5.524870411133214e-06, "loss": 21.5606, "step": 60890 }, { "epoch": 0.66, "learning_rate": 5.52173950082857e-06, "loss": 21.6706, "step": 60900 }, { "epoch": 0.66, "learning_rate": 5.5186091395363305e-06, "loss": 20.8953, "step": 60910 }, { "epoch": 0.66, "learning_rate": 5.515479327640269e-06, "loss": 22.0043, "step": 60920 }, { "epoch": 0.66, "learning_rate": 5.512350065524085e-06, "loss": 21.239, "step": 60930 }, { "epoch": 0.66, "learning_rate": 5.509221353571404e-06, "loss": 21.6029, "step": 60940 }, { "epoch": 0.66, "learning_rate": 5.506093192165791e-06, "loss": 20.8584, "step": 60950 }, { "epoch": 0.66, "learning_rate": 5.502965581690743e-06, "loss": 20.9032, "step": 60960 }, { "epoch": 0.66, "learning_rate": 5.499838522529695e-06, "loss": 21.9113, "step": 60970 }, { "epoch": 0.66, "learning_rate": 5.4967120150660104e-06, "loss": 21.3663, "step": 60980 }, { "epoch": 0.66, "learning_rate": 5.493586059682973e-06, "loss": 21.8007, "step": 60990 }, { "epoch": 0.66, "learning_rate": 5.490460656763816e-06, "loss": 20.5948, "step": 61000 }, { "epoch": 0.66, "learning_rate": 5.487335806691693e-06, "loss": 21.625, "step": 61010 }, { "epoch": 0.66, "learning_rate": 5.484211509849703e-06, "loss": 20.7254, "step": 61020 }, { "epoch": 0.66, "learning_rate": 5.48108776662087e-06, "loss": 20.5034, "step": 61030 }, { "epoch": 0.66, "learning_rate": 5.47796457738814e-06, "loss": 21.114, "step": 61040 }, { "epoch": 0.66, "learning_rate": 5.4748419425344045e-06, "loss": 21.2948, "step": 61050 }, { "epoch": 0.66, "learning_rate": 5.471719862442481e-06, "loss": 20.9928, "step": 61060 }, { "epoch": 0.66, "learning_rate": 5.468598337495125e-06, "loss": 20.4568, "step": 61070 }, { "epoch": 0.66, "learning_rate": 5.465477368075021e-06, "loss": 21.0296, "step": 61080 }, { "epoch": 0.66, "learning_rate": 5.462356954564786e-06, "loss": 21.2265, "step": 61090 }, { "epoch": 0.66, "learning_rate": 5.459237097346958e-06, "loss": 20.9616, "step": 61100 }, { "epoch": 0.66, "learning_rate": 5.456117796804017e-06, "loss": 21.0603, "step": 61110 }, { "epoch": 0.66, "learning_rate": 5.452999053318381e-06, "loss": 21.4807, "step": 61120 }, { "epoch": 0.66, "learning_rate": 5.449880867272389e-06, "loss": 21.0711, "step": 61130 }, { "epoch": 0.66, "learning_rate": 5.446763239048318e-06, "loss": 21.6578, "step": 61140 }, { "epoch": 0.66, "learning_rate": 5.44364616902837e-06, "loss": 20.6223, "step": 61150 }, { "epoch": 0.66, "learning_rate": 5.440529657594676e-06, "loss": 21.6472, "step": 61160 }, { "epoch": 0.66, "learning_rate": 5.4374137051293155e-06, "loss": 21.1665, "step": 61170 }, { "epoch": 0.66, "learning_rate": 5.434298312014286e-06, "loss": 21.8069, "step": 61180 }, { "epoch": 0.66, "learning_rate": 5.431183478631519e-06, "loss": 21.2441, "step": 61190 }, { "epoch": 0.66, "learning_rate": 5.428069205362878e-06, "loss": 21.3675, "step": 61200 }, { "epoch": 0.66, "learning_rate": 5.4249554925901495e-06, "loss": 21.126, "step": 61210 }, { "epoch": 0.66, "learning_rate": 5.4218423406950695e-06, "loss": 21.302, "step": 61220 }, { "epoch": 0.66, "learning_rate": 5.418729750059291e-06, "loss": 20.8301, "step": 61230 }, { "epoch": 0.66, "learning_rate": 5.415617721064402e-06, "loss": 21.9442, "step": 61240 }, { "epoch": 0.66, "learning_rate": 5.412506254091927e-06, "loss": 20.4144, "step": 61250 }, { "epoch": 0.66, "learning_rate": 5.4093953495233006e-06, "loss": 21.3571, "step": 61260 }, { "epoch": 0.66, "learning_rate": 5.406285007739922e-06, "loss": 21.1608, "step": 61270 }, { "epoch": 0.66, "learning_rate": 5.403175229123094e-06, "loss": 22.0142, "step": 61280 }, { "epoch": 0.66, "learning_rate": 5.400066014054063e-06, "loss": 22.278, "step": 61290 }, { "epoch": 0.66, "learning_rate": 5.396957362914006e-06, "loss": 21.7093, "step": 61300 }, { "epoch": 0.66, "learning_rate": 5.3938492760840176e-06, "loss": 20.4782, "step": 61310 }, { "epoch": 0.66, "learning_rate": 5.390741753945146e-06, "loss": 20.8178, "step": 61320 }, { "epoch": 0.66, "learning_rate": 5.387634796878351e-06, "loss": 21.6044, "step": 61330 }, { "epoch": 0.66, "learning_rate": 5.38452840526453e-06, "loss": 21.6385, "step": 61340 }, { "epoch": 0.66, "learning_rate": 5.381422579484517e-06, "loss": 20.5199, "step": 61350 }, { "epoch": 0.66, "learning_rate": 5.378317319919064e-06, "loss": 21.177, "step": 61360 }, { "epoch": 0.66, "learning_rate": 5.375212626948865e-06, "loss": 21.3747, "step": 61370 }, { "epoch": 0.66, "learning_rate": 5.372108500954536e-06, "loss": 20.8586, "step": 61380 }, { "epoch": 0.66, "learning_rate": 5.369004942316631e-06, "loss": 21.6287, "step": 61390 }, { "epoch": 0.66, "learning_rate": 5.365901951415629e-06, "loss": 21.1819, "step": 61400 }, { "epoch": 0.66, "learning_rate": 5.362799528631939e-06, "loss": 21.3951, "step": 61410 }, { "epoch": 0.66, "learning_rate": 5.3596976743459074e-06, "loss": 21.0575, "step": 61420 }, { "epoch": 0.66, "learning_rate": 5.356596388937802e-06, "loss": 21.6501, "step": 61430 }, { "epoch": 0.66, "learning_rate": 5.353495672787827e-06, "loss": 20.8421, "step": 61440 }, { "epoch": 0.66, "learning_rate": 5.3503955262761155e-06, "loss": 21.6149, "step": 61450 }, { "epoch": 0.66, "learning_rate": 5.347295949782727e-06, "loss": 21.1949, "step": 61460 }, { "epoch": 0.66, "learning_rate": 5.344196943687656e-06, "loss": 20.6928, "step": 61470 }, { "epoch": 0.66, "learning_rate": 5.341098508370826e-06, "loss": 21.8538, "step": 61480 }, { "epoch": 0.66, "learning_rate": 5.338000644212088e-06, "loss": 20.4104, "step": 61490 }, { "epoch": 0.66, "learning_rate": 5.334903351591225e-06, "loss": 21.0198, "step": 61500 }, { "epoch": 0.66, "learning_rate": 5.3318066308879515e-06, "loss": 21.647, "step": 61510 }, { "epoch": 0.67, "learning_rate": 5.328710482481907e-06, "loss": 20.8615, "step": 61520 }, { "epoch": 0.67, "learning_rate": 5.3256149067526675e-06, "loss": 20.894, "step": 61530 }, { "epoch": 0.67, "learning_rate": 5.322519904079732e-06, "loss": 21.5598, "step": 61540 }, { "epoch": 0.67, "learning_rate": 5.319425474842532e-06, "loss": 20.7238, "step": 61550 }, { "epoch": 0.67, "learning_rate": 5.316331619420433e-06, "loss": 20.3187, "step": 61560 }, { "epoch": 0.67, "learning_rate": 5.313238338192723e-06, "loss": 21.3956, "step": 61570 }, { "epoch": 0.67, "learning_rate": 5.310145631538623e-06, "loss": 21.2869, "step": 61580 }, { "epoch": 0.67, "learning_rate": 5.307053499837285e-06, "loss": 20.6653, "step": 61590 }, { "epoch": 0.67, "learning_rate": 5.303961943467788e-06, "loss": 21.4452, "step": 61600 }, { "epoch": 0.67, "learning_rate": 5.300870962809142e-06, "loss": 20.7699, "step": 61610 }, { "epoch": 0.67, "learning_rate": 5.297780558240284e-06, "loss": 21.3159, "step": 61620 }, { "epoch": 0.67, "learning_rate": 5.294690730140084e-06, "loss": 21.0938, "step": 61630 }, { "epoch": 0.67, "learning_rate": 5.291601478887338e-06, "loss": 20.8303, "step": 61640 }, { "epoch": 0.67, "learning_rate": 5.288512804860776e-06, "loss": 21.0901, "step": 61650 }, { "epoch": 0.67, "learning_rate": 5.285424708439051e-06, "loss": 21.1992, "step": 61660 }, { "epoch": 0.67, "learning_rate": 5.282337190000748e-06, "loss": 21.0165, "step": 61670 }, { "epoch": 0.67, "learning_rate": 5.279250249924384e-06, "loss": 21.155, "step": 61680 }, { "epoch": 0.67, "learning_rate": 5.276163888588399e-06, "loss": 21.6779, "step": 61690 }, { "epoch": 0.67, "learning_rate": 5.273078106371168e-06, "loss": 21.2726, "step": 61700 }, { "epoch": 0.67, "learning_rate": 5.269992903650992e-06, "loss": 20.8179, "step": 61710 }, { "epoch": 0.67, "learning_rate": 5.2669082808061025e-06, "loss": 20.7573, "step": 61720 }, { "epoch": 0.67, "learning_rate": 5.263824238214656e-06, "loss": 20.7386, "step": 61730 }, { "epoch": 0.67, "learning_rate": 5.2607407762547435e-06, "loss": 21.148, "step": 61740 }, { "epoch": 0.67, "learning_rate": 5.25765789530438e-06, "loss": 20.764, "step": 61750 }, { "epoch": 0.67, "learning_rate": 5.254575595741513e-06, "loss": 21.3881, "step": 61760 }, { "epoch": 0.67, "learning_rate": 5.2514938779440175e-06, "loss": 20.8693, "step": 61770 }, { "epoch": 0.67, "learning_rate": 5.248412742289691e-06, "loss": 21.038, "step": 61780 }, { "epoch": 0.67, "learning_rate": 5.245332189156278e-06, "loss": 21.5887, "step": 61790 }, { "epoch": 0.67, "learning_rate": 5.242252218921426e-06, "loss": 20.7125, "step": 61800 }, { "epoch": 0.67, "learning_rate": 5.23917283196273e-06, "loss": 21.2872, "step": 61810 }, { "epoch": 0.67, "learning_rate": 5.2360940286577055e-06, "loss": 21.6003, "step": 61820 }, { "epoch": 0.67, "learning_rate": 5.233015809383797e-06, "loss": 21.2188, "step": 61830 }, { "epoch": 0.67, "learning_rate": 5.229938174518388e-06, "loss": 21.2254, "step": 61840 }, { "epoch": 0.67, "learning_rate": 5.2268611244387714e-06, "loss": 21.058, "step": 61850 }, { "epoch": 0.67, "learning_rate": 5.22378465952218e-06, "loss": 20.9742, "step": 61860 }, { "epoch": 0.67, "learning_rate": 5.220708780145776e-06, "loss": 21.5046, "step": 61870 }, { "epoch": 0.67, "learning_rate": 5.21763348668664e-06, "loss": 21.7948, "step": 61880 }, { "epoch": 0.67, "learning_rate": 5.2145587795217965e-06, "loss": 20.7293, "step": 61890 }, { "epoch": 0.67, "learning_rate": 5.21148465902819e-06, "loss": 20.2695, "step": 61900 }, { "epoch": 0.67, "learning_rate": 5.2084111255826845e-06, "loss": 21.8137, "step": 61910 }, { "epoch": 0.67, "learning_rate": 5.205338179562081e-06, "loss": 22.2354, "step": 61920 }, { "epoch": 0.67, "learning_rate": 5.202265821343109e-06, "loss": 20.7089, "step": 61930 }, { "epoch": 0.67, "learning_rate": 5.199194051302426e-06, "loss": 21.364, "step": 61940 }, { "epoch": 0.67, "learning_rate": 5.19612286981662e-06, "loss": 21.8653, "step": 61950 }, { "epoch": 0.67, "learning_rate": 5.193052277262194e-06, "loss": 21.4436, "step": 61960 }, { "epoch": 0.67, "learning_rate": 5.189982274015588e-06, "loss": 21.5151, "step": 61970 }, { "epoch": 0.67, "learning_rate": 5.18691286045317e-06, "loss": 20.3424, "step": 61980 }, { "epoch": 0.67, "learning_rate": 5.18384403695124e-06, "loss": 21.6839, "step": 61990 }, { "epoch": 0.67, "learning_rate": 5.18077580388602e-06, "loss": 21.3446, "step": 62000 }, { "epoch": 0.67, "learning_rate": 5.177708161633653e-06, "loss": 20.6142, "step": 62010 }, { "epoch": 0.67, "learning_rate": 5.174641110570222e-06, "loss": 21.9667, "step": 62020 }, { "epoch": 0.67, "learning_rate": 5.1715746510717244e-06, "loss": 21.2794, "step": 62030 }, { "epoch": 0.67, "learning_rate": 5.168508783514106e-06, "loss": 21.48, "step": 62040 }, { "epoch": 0.67, "learning_rate": 5.165443508273218e-06, "loss": 21.3659, "step": 62050 }, { "epoch": 0.67, "learning_rate": 5.162378825724854e-06, "loss": 21.3671, "step": 62060 }, { "epoch": 0.67, "learning_rate": 5.159314736244721e-06, "loss": 21.3944, "step": 62070 }, { "epoch": 0.67, "learning_rate": 5.156251240208462e-06, "loss": 21.0819, "step": 62080 }, { "epoch": 0.67, "learning_rate": 5.153188337991652e-06, "loss": 21.3362, "step": 62090 }, { "epoch": 0.67, "learning_rate": 5.1501260299697844e-06, "loss": 21.2491, "step": 62100 }, { "epoch": 0.67, "learning_rate": 5.147064316518288e-06, "loss": 21.2485, "step": 62110 }, { "epoch": 0.67, "learning_rate": 5.144003198012504e-06, "loss": 21.9009, "step": 62120 }, { "epoch": 0.67, "learning_rate": 5.140942674827713e-06, "loss": 20.3606, "step": 62130 }, { "epoch": 0.67, "learning_rate": 5.137882747339125e-06, "loss": 20.7777, "step": 62140 }, { "epoch": 0.67, "learning_rate": 5.134823415921867e-06, "loss": 21.3235, "step": 62150 }, { "epoch": 0.67, "learning_rate": 5.131764680951005e-06, "loss": 21.7632, "step": 62160 }, { "epoch": 0.67, "learning_rate": 5.128706542801515e-06, "loss": 20.8707, "step": 62170 }, { "epoch": 0.67, "learning_rate": 5.125649001848309e-06, "loss": 20.4472, "step": 62180 }, { "epoch": 0.67, "learning_rate": 5.122592058466237e-06, "loss": 21.2767, "step": 62190 }, { "epoch": 0.67, "learning_rate": 5.119535713030057e-06, "loss": 21.3521, "step": 62200 }, { "epoch": 0.67, "learning_rate": 5.1164799659144645e-06, "loss": 21.0067, "step": 62210 }, { "epoch": 0.67, "learning_rate": 5.1134248174940825e-06, "loss": 21.5194, "step": 62220 }, { "epoch": 0.67, "learning_rate": 5.110370268143445e-06, "loss": 21.1658, "step": 62230 }, { "epoch": 0.67, "learning_rate": 5.107316318237034e-06, "loss": 21.2218, "step": 62240 }, { "epoch": 0.67, "learning_rate": 5.104262968149248e-06, "loss": 20.9874, "step": 62250 }, { "epoch": 0.67, "learning_rate": 5.101210218254411e-06, "loss": 21.4227, "step": 62260 }, { "epoch": 0.67, "learning_rate": 5.09815806892678e-06, "loss": 20.9769, "step": 62270 }, { "epoch": 0.67, "learning_rate": 5.0951065205405185e-06, "loss": 20.88, "step": 62280 }, { "epoch": 0.67, "learning_rate": 5.0920555734697454e-06, "loss": 21.3129, "step": 62290 }, { "epoch": 0.67, "learning_rate": 5.0890052280884885e-06, "loss": 21.1022, "step": 62300 }, { "epoch": 0.67, "learning_rate": 5.085955484770702e-06, "loss": 21.3988, "step": 62310 }, { "epoch": 0.67, "learning_rate": 5.0829063438902705e-06, "loss": 21.0531, "step": 62320 }, { "epoch": 0.67, "learning_rate": 5.079857805821005e-06, "loss": 21.244, "step": 62330 }, { "epoch": 0.67, "learning_rate": 5.076809870936639e-06, "loss": 20.5119, "step": 62340 }, { "epoch": 0.67, "learning_rate": 5.0737625396108355e-06, "loss": 21.5885, "step": 62350 }, { "epoch": 0.67, "learning_rate": 5.070715812217181e-06, "loss": 20.1273, "step": 62360 }, { "epoch": 0.67, "learning_rate": 5.06766968912919e-06, "loss": 21.3247, "step": 62370 }, { "epoch": 0.67, "learning_rate": 5.064624170720301e-06, "loss": 21.9503, "step": 62380 }, { "epoch": 0.67, "learning_rate": 5.06157925736388e-06, "loss": 21.368, "step": 62390 }, { "epoch": 0.67, "learning_rate": 5.05853494943322e-06, "loss": 21.9011, "step": 62400 }, { "epoch": 0.67, "learning_rate": 5.055491247301534e-06, "loss": 21.6208, "step": 62410 }, { "epoch": 0.67, "learning_rate": 5.0524481513419675e-06, "loss": 21.0103, "step": 62420 }, { "epoch": 0.67, "learning_rate": 5.049405661927589e-06, "loss": 21.1812, "step": 62430 }, { "epoch": 0.68, "learning_rate": 5.046363779431391e-06, "loss": 21.7082, "step": 62440 }, { "epoch": 0.68, "learning_rate": 5.043322504226294e-06, "loss": 21.7668, "step": 62450 }, { "epoch": 0.68, "learning_rate": 5.040281836685143e-06, "loss": 20.8863, "step": 62460 }, { "epoch": 0.68, "learning_rate": 5.03724177718071e-06, "loss": 20.8172, "step": 62470 }, { "epoch": 0.68, "learning_rate": 5.034202326085689e-06, "loss": 21.0423, "step": 62480 }, { "epoch": 0.68, "learning_rate": 5.031163483772703e-06, "loss": 21.3178, "step": 62490 }, { "epoch": 0.68, "learning_rate": 5.028125250614297e-06, "loss": 21.0759, "step": 62500 }, { "epoch": 0.68, "learning_rate": 5.025087626982946e-06, "loss": 21.4172, "step": 62510 }, { "epoch": 0.68, "learning_rate": 5.022050613251046e-06, "loss": 21.8618, "step": 62520 }, { "epoch": 0.68, "learning_rate": 5.01901420979092e-06, "loss": 20.6303, "step": 62530 }, { "epoch": 0.68, "learning_rate": 5.015978416974815e-06, "loss": 21.0593, "step": 62540 }, { "epoch": 0.68, "learning_rate": 5.012943235174905e-06, "loss": 20.8108, "step": 62550 }, { "epoch": 0.68, "learning_rate": 5.009908664763288e-06, "loss": 21.5004, "step": 62560 }, { "epoch": 0.68, "learning_rate": 5.0068747061119886e-06, "loss": 20.9634, "step": 62570 }, { "epoch": 0.68, "learning_rate": 5.003841359592951e-06, "loss": 21.0777, "step": 62580 }, { "epoch": 0.68, "learning_rate": 5.000808625578048e-06, "loss": 21.2329, "step": 62590 }, { "epoch": 0.68, "learning_rate": 4.99777650443909e-06, "loss": 20.8515, "step": 62600 }, { "epoch": 0.68, "learning_rate": 4.9947449965477855e-06, "loss": 20.5957, "step": 62610 }, { "epoch": 0.68, "learning_rate": 4.991714102275788e-06, "loss": 22.1578, "step": 62620 }, { "epoch": 0.68, "learning_rate": 4.988683821994669e-06, "loss": 20.8996, "step": 62630 }, { "epoch": 0.68, "learning_rate": 4.985654156075922e-06, "loss": 22.4648, "step": 62640 }, { "epoch": 0.68, "learning_rate": 4.982625104890981e-06, "loss": 20.9852, "step": 62650 }, { "epoch": 0.68, "learning_rate": 4.9795966688111805e-06, "loss": 21.3571, "step": 62660 }, { "epoch": 0.68, "learning_rate": 4.976568848207795e-06, "loss": 21.211, "step": 62670 }, { "epoch": 0.68, "learning_rate": 4.973541643452022e-06, "loss": 21.2732, "step": 62680 }, { "epoch": 0.68, "learning_rate": 4.9705150549149776e-06, "loss": 20.8296, "step": 62690 }, { "epoch": 0.68, "learning_rate": 4.967489082967717e-06, "loss": 21.5597, "step": 62700 }, { "epoch": 0.68, "learning_rate": 4.964463727981197e-06, "loss": 21.1976, "step": 62710 }, { "epoch": 0.68, "learning_rate": 4.961438990326316e-06, "loss": 21.396, "step": 62720 }, { "epoch": 0.68, "learning_rate": 4.958414870373892e-06, "loss": 21.7997, "step": 62730 }, { "epoch": 0.68, "learning_rate": 4.9553913684946664e-06, "loss": 21.1057, "step": 62740 }, { "epoch": 0.68, "learning_rate": 4.952368485059303e-06, "loss": 21.7225, "step": 62750 }, { "epoch": 0.68, "learning_rate": 4.949346220438401e-06, "loss": 21.3243, "step": 62760 }, { "epoch": 0.68, "learning_rate": 4.946324575002466e-06, "loss": 21.2569, "step": 62770 }, { "epoch": 0.68, "learning_rate": 4.9433035491219395e-06, "loss": 21.232, "step": 62780 }, { "epoch": 0.68, "learning_rate": 4.9402831431671834e-06, "loss": 21.0501, "step": 62790 }, { "epoch": 0.68, "learning_rate": 4.9372633575084824e-06, "loss": 21.6993, "step": 62800 }, { "epoch": 0.68, "learning_rate": 4.934244192516058e-06, "loss": 21.3766, "step": 62810 }, { "epoch": 0.68, "learning_rate": 4.931225648560032e-06, "loss": 21.2218, "step": 62820 }, { "epoch": 0.68, "learning_rate": 4.9282077260104684e-06, "loss": 21.5133, "step": 62830 }, { "epoch": 0.68, "learning_rate": 4.925190425237348e-06, "loss": 20.6413, "step": 62840 }, { "epoch": 0.68, "learning_rate": 4.922173746610575e-06, "loss": 21.1001, "step": 62850 }, { "epoch": 0.68, "learning_rate": 4.919157690499985e-06, "loss": 21.0607, "step": 62860 }, { "epoch": 0.68, "learning_rate": 4.916142257275331e-06, "loss": 20.6448, "step": 62870 }, { "epoch": 0.68, "learning_rate": 4.913127447306285e-06, "loss": 21.2265, "step": 62880 }, { "epoch": 0.68, "learning_rate": 4.910113260962449e-06, "loss": 21.3564, "step": 62890 }, { "epoch": 0.68, "learning_rate": 4.9070996986133446e-06, "loss": 20.8897, "step": 62900 }, { "epoch": 0.68, "learning_rate": 4.904086760628427e-06, "loss": 21.6395, "step": 62910 }, { "epoch": 0.68, "learning_rate": 4.901074447377067e-06, "loss": 21.4914, "step": 62920 }, { "epoch": 0.68, "learning_rate": 4.898062759228551e-06, "loss": 21.2297, "step": 62930 }, { "epoch": 0.68, "learning_rate": 4.895051696552102e-06, "loss": 21.6739, "step": 62940 }, { "epoch": 0.68, "learning_rate": 4.892041259716857e-06, "loss": 20.7151, "step": 62950 }, { "epoch": 0.68, "learning_rate": 4.889031449091889e-06, "loss": 21.251, "step": 62960 }, { "epoch": 0.68, "learning_rate": 4.886022265046185e-06, "loss": 21.1784, "step": 62970 }, { "epoch": 0.68, "learning_rate": 4.883013707948648e-06, "loss": 20.4723, "step": 62980 }, { "epoch": 0.68, "learning_rate": 4.880005778168115e-06, "loss": 21.1856, "step": 62990 }, { "epoch": 0.68, "learning_rate": 4.876998476073342e-06, "loss": 21.1074, "step": 63000 }, { "epoch": 0.68, "learning_rate": 4.873991802033015e-06, "loss": 20.8021, "step": 63010 }, { "epoch": 0.68, "learning_rate": 4.870985756415734e-06, "loss": 20.9461, "step": 63020 }, { "epoch": 0.68, "learning_rate": 4.8679803395900285e-06, "loss": 21.5886, "step": 63030 }, { "epoch": 0.68, "learning_rate": 4.864975551924342e-06, "loss": 20.65, "step": 63040 }, { "epoch": 0.68, "learning_rate": 4.861971393787043e-06, "loss": 21.1957, "step": 63050 }, { "epoch": 0.68, "learning_rate": 4.8589678655464355e-06, "loss": 20.9854, "step": 63060 }, { "epoch": 0.68, "learning_rate": 4.8559649675707344e-06, "loss": 21.7283, "step": 63070 }, { "epoch": 0.68, "learning_rate": 4.852962700228083e-06, "loss": 21.2877, "step": 63080 }, { "epoch": 0.68, "learning_rate": 4.849961063886537e-06, "loss": 21.7778, "step": 63090 }, { "epoch": 0.68, "learning_rate": 4.846960058914082e-06, "loss": 21.1505, "step": 63100 }, { "epoch": 0.68, "learning_rate": 4.843959685678633e-06, "loss": 20.6416, "step": 63110 }, { "epoch": 0.68, "learning_rate": 4.840959944548017e-06, "loss": 21.9861, "step": 63120 }, { "epoch": 0.68, "learning_rate": 4.837960835889993e-06, "loss": 21.3341, "step": 63130 }, { "epoch": 0.68, "learning_rate": 4.8349623600722275e-06, "loss": 21.615, "step": 63140 }, { "epoch": 0.68, "learning_rate": 4.831964517462319e-06, "loss": 20.9304, "step": 63150 }, { "epoch": 0.68, "learning_rate": 4.828967308427795e-06, "loss": 20.6232, "step": 63160 }, { "epoch": 0.68, "learning_rate": 4.825970733336096e-06, "loss": 22.0297, "step": 63170 }, { "epoch": 0.68, "learning_rate": 4.822974792554587e-06, "loss": 20.7496, "step": 63180 }, { "epoch": 0.68, "learning_rate": 4.819979486450558e-06, "loss": 21.6647, "step": 63190 }, { "epoch": 0.68, "learning_rate": 4.816984815391207e-06, "loss": 21.5068, "step": 63200 }, { "epoch": 0.68, "learning_rate": 4.813990779743679e-06, "loss": 21.2295, "step": 63210 }, { "epoch": 0.68, "learning_rate": 4.810997379875023e-06, "loss": 21.8675, "step": 63220 }, { "epoch": 0.68, "learning_rate": 4.8080046161522145e-06, "loss": 21.0162, "step": 63230 }, { "epoch": 0.68, "learning_rate": 4.805012488942157e-06, "loss": 20.5837, "step": 63240 }, { "epoch": 0.68, "learning_rate": 4.802020998611656e-06, "loss": 21.2646, "step": 63250 }, { "epoch": 0.68, "learning_rate": 4.799030145527467e-06, "loss": 21.0996, "step": 63260 }, { "epoch": 0.68, "learning_rate": 4.796039930056249e-06, "loss": 20.1672, "step": 63270 }, { "epoch": 0.68, "learning_rate": 4.7930503525645875e-06, "loss": 20.896, "step": 63280 }, { "epoch": 0.68, "learning_rate": 4.7900614134189906e-06, "loss": 21.0954, "step": 63290 }, { "epoch": 0.68, "learning_rate": 4.787073112985886e-06, "loss": 21.3847, "step": 63300 }, { "epoch": 0.68, "learning_rate": 4.784085451631626e-06, "loss": 21.9464, "step": 63310 }, { "epoch": 0.68, "learning_rate": 4.781098429722482e-06, "loss": 20.6036, "step": 63320 }, { "epoch": 0.68, "learning_rate": 4.778112047624648e-06, "loss": 21.5737, "step": 63330 }, { "epoch": 0.68, "learning_rate": 4.7751263057042396e-06, "loss": 21.09, "step": 63340 }, { "epoch": 0.68, "learning_rate": 4.772141204327294e-06, "loss": 20.6836, "step": 63350 }, { "epoch": 0.68, "learning_rate": 4.769156743859769e-06, "loss": 20.5852, "step": 63360 }, { "epoch": 0.69, "learning_rate": 4.766172924667547e-06, "loss": 21.2286, "step": 63370 }, { "epoch": 0.69, "learning_rate": 4.763189747116427e-06, "loss": 21.2873, "step": 63380 }, { "epoch": 0.69, "learning_rate": 4.760207211572132e-06, "loss": 21.0553, "step": 63390 }, { "epoch": 0.69, "learning_rate": 4.757225318400306e-06, "loss": 21.0321, "step": 63400 }, { "epoch": 0.69, "learning_rate": 4.754244067966515e-06, "loss": 21.1015, "step": 63410 }, { "epoch": 0.69, "learning_rate": 4.751263460636245e-06, "loss": 21.022, "step": 63420 }, { "epoch": 0.69, "learning_rate": 4.748283496774904e-06, "loss": 20.943, "step": 63430 }, { "epoch": 0.69, "learning_rate": 4.745304176747819e-06, "loss": 21.5455, "step": 63440 }, { "epoch": 0.69, "learning_rate": 4.742325500920242e-06, "loss": 22.2426, "step": 63450 }, { "epoch": 0.69, "learning_rate": 4.739347469657343e-06, "loss": 21.6632, "step": 63460 }, { "epoch": 0.69, "learning_rate": 4.736370083324213e-06, "loss": 20.7178, "step": 63470 }, { "epoch": 0.69, "learning_rate": 4.733393342285866e-06, "loss": 20.4001, "step": 63480 }, { "epoch": 0.69, "learning_rate": 4.7304172469072355e-06, "loss": 20.9418, "step": 63490 }, { "epoch": 0.69, "learning_rate": 4.727441797553174e-06, "loss": 21.6009, "step": 63500 }, { "epoch": 0.69, "learning_rate": 4.724466994588459e-06, "loss": 21.5726, "step": 63510 }, { "epoch": 0.69, "learning_rate": 4.721492838377786e-06, "loss": 21.3147, "step": 63520 }, { "epoch": 0.69, "learning_rate": 4.718519329285771e-06, "loss": 21.0813, "step": 63530 }, { "epoch": 0.69, "learning_rate": 4.715546467676952e-06, "loss": 20.8025, "step": 63540 }, { "epoch": 0.69, "learning_rate": 4.712574253915787e-06, "loss": 21.6442, "step": 63550 }, { "epoch": 0.69, "learning_rate": 4.70960268836665e-06, "loss": 21.4697, "step": 63560 }, { "epoch": 0.69, "learning_rate": 4.706631771393853e-06, "loss": 21.7529, "step": 63570 }, { "epoch": 0.69, "learning_rate": 4.703661503361603e-06, "loss": 21.9905, "step": 63580 }, { "epoch": 0.69, "learning_rate": 4.700691884634044e-06, "loss": 20.8367, "step": 63590 }, { "epoch": 0.69, "learning_rate": 4.697722915575237e-06, "loss": 20.8687, "step": 63600 }, { "epoch": 0.69, "learning_rate": 4.694754596549158e-06, "loss": 21.2534, "step": 63610 }, { "epoch": 0.69, "learning_rate": 4.691786927919721e-06, "loss": 20.7372, "step": 63620 }, { "epoch": 0.69, "learning_rate": 4.688819910050735e-06, "loss": 21.2674, "step": 63630 }, { "epoch": 0.69, "learning_rate": 4.685853543305945e-06, "loss": 21.4345, "step": 63640 }, { "epoch": 0.69, "learning_rate": 4.682887828049014e-06, "loss": 21.1812, "step": 63650 }, { "epoch": 0.69, "learning_rate": 4.679922764643519e-06, "loss": 21.0239, "step": 63660 }, { "epoch": 0.69, "learning_rate": 4.676958353452974e-06, "loss": 21.6564, "step": 63670 }, { "epoch": 0.69, "learning_rate": 4.67399459484079e-06, "loss": 21.4331, "step": 63680 }, { "epoch": 0.69, "learning_rate": 4.67103148917031e-06, "loss": 21.1229, "step": 63690 }, { "epoch": 0.69, "learning_rate": 4.6680690368048e-06, "loss": 21.1462, "step": 63700 }, { "epoch": 0.69, "learning_rate": 4.665107238107437e-06, "loss": 21.3204, "step": 63710 }, { "epoch": 0.69, "learning_rate": 4.662146093441329e-06, "loss": 20.9756, "step": 63720 }, { "epoch": 0.69, "learning_rate": 4.659185603169497e-06, "loss": 21.6478, "step": 63730 }, { "epoch": 0.69, "learning_rate": 4.656225767654877e-06, "loss": 21.3323, "step": 63740 }, { "epoch": 0.69, "learning_rate": 4.653266587260333e-06, "loss": 21.1403, "step": 63750 }, { "epoch": 0.69, "learning_rate": 4.650308062348642e-06, "loss": 21.5434, "step": 63760 }, { "epoch": 0.69, "learning_rate": 4.6473501932825116e-06, "loss": 21.4892, "step": 63770 }, { "epoch": 0.69, "learning_rate": 4.644392980424562e-06, "loss": 21.5068, "step": 63780 }, { "epoch": 0.69, "learning_rate": 4.641436424137325e-06, "loss": 20.7188, "step": 63790 }, { "epoch": 0.69, "learning_rate": 4.638480524783264e-06, "loss": 21.006, "step": 63800 }, { "epoch": 0.69, "learning_rate": 4.635525282724754e-06, "loss": 21.4278, "step": 63810 }, { "epoch": 0.69, "learning_rate": 4.632570698324099e-06, "loss": 20.9771, "step": 63820 }, { "epoch": 0.69, "learning_rate": 4.629616771943518e-06, "loss": 20.3681, "step": 63830 }, { "epoch": 0.69, "learning_rate": 4.626663503945138e-06, "loss": 20.6763, "step": 63840 }, { "epoch": 0.69, "learning_rate": 4.6237108946910216e-06, "loss": 21.507, "step": 63850 }, { "epoch": 0.69, "learning_rate": 4.620758944543137e-06, "loss": 20.6518, "step": 63860 }, { "epoch": 0.69, "learning_rate": 4.617807653863389e-06, "loss": 21.0091, "step": 63870 }, { "epoch": 0.69, "learning_rate": 4.614857023013585e-06, "loss": 22.0095, "step": 63880 }, { "epoch": 0.69, "learning_rate": 4.611907052355463e-06, "loss": 21.3988, "step": 63890 }, { "epoch": 0.69, "learning_rate": 4.608957742250667e-06, "loss": 21.5354, "step": 63900 }, { "epoch": 0.69, "learning_rate": 4.606009093060767e-06, "loss": 20.8986, "step": 63910 }, { "epoch": 0.69, "learning_rate": 4.603061105147261e-06, "loss": 21.4192, "step": 63920 }, { "epoch": 0.69, "learning_rate": 4.600113778871552e-06, "loss": 21.0066, "step": 63930 }, { "epoch": 0.69, "learning_rate": 4.5971671145949734e-06, "loss": 20.683, "step": 63940 }, { "epoch": 0.69, "learning_rate": 4.594221112678764e-06, "loss": 20.5137, "step": 63950 }, { "epoch": 0.69, "learning_rate": 4.5912757734840875e-06, "loss": 21.6755, "step": 63960 }, { "epoch": 0.69, "learning_rate": 4.588331097372037e-06, "loss": 21.0847, "step": 63970 }, { "epoch": 0.69, "learning_rate": 4.5853870847036094e-06, "loss": 21.307, "step": 63980 }, { "epoch": 0.69, "learning_rate": 4.582443735839728e-06, "loss": 21.062, "step": 63990 }, { "epoch": 0.69, "learning_rate": 4.579501051141234e-06, "loss": 21.7876, "step": 64000 }, { "epoch": 0.69, "learning_rate": 4.576559030968877e-06, "loss": 21.5935, "step": 64010 }, { "epoch": 0.69, "learning_rate": 4.573617675683344e-06, "loss": 21.1344, "step": 64020 }, { "epoch": 0.69, "learning_rate": 4.570676985645227e-06, "loss": 21.1471, "step": 64030 }, { "epoch": 0.69, "learning_rate": 4.5677369612150405e-06, "loss": 21.1665, "step": 64040 }, { "epoch": 0.69, "learning_rate": 4.56479760275322e-06, "loss": 20.9258, "step": 64050 }, { "epoch": 0.69, "learning_rate": 4.561858910620105e-06, "loss": 21.7291, "step": 64060 }, { "epoch": 0.69, "learning_rate": 4.558920885175976e-06, "loss": 21.7757, "step": 64070 }, { "epoch": 0.69, "learning_rate": 4.555983526781015e-06, "loss": 21.066, "step": 64080 }, { "epoch": 0.69, "learning_rate": 4.553046835795329e-06, "loss": 21.3014, "step": 64090 }, { "epoch": 0.69, "learning_rate": 4.5501108125789476e-06, "loss": 21.8039, "step": 64100 }, { "epoch": 0.69, "learning_rate": 4.547175457491796e-06, "loss": 21.3177, "step": 64110 }, { "epoch": 0.69, "learning_rate": 4.54424077089375e-06, "loss": 21.5192, "step": 64120 }, { "epoch": 0.69, "learning_rate": 4.541306753144582e-06, "loss": 21.4434, "step": 64130 }, { "epoch": 0.69, "learning_rate": 4.538373404603987e-06, "loss": 21.7512, "step": 64140 }, { "epoch": 0.69, "learning_rate": 4.535440725631582e-06, "loss": 20.9163, "step": 64150 }, { "epoch": 0.69, "learning_rate": 4.532508716586898e-06, "loss": 21.1103, "step": 64160 }, { "epoch": 0.69, "learning_rate": 4.529577377829378e-06, "loss": 21.5258, "step": 64170 }, { "epoch": 0.69, "learning_rate": 4.526646709718397e-06, "loss": 21.2461, "step": 64180 }, { "epoch": 0.69, "learning_rate": 4.52371671261324e-06, "loss": 21.1137, "step": 64190 }, { "epoch": 0.69, "learning_rate": 4.520787386873107e-06, "loss": 21.2128, "step": 64200 }, { "epoch": 0.69, "learning_rate": 4.517858732857125e-06, "loss": 20.9871, "step": 64210 }, { "epoch": 0.69, "learning_rate": 4.514930750924318e-06, "loss": 20.5678, "step": 64220 }, { "epoch": 0.69, "learning_rate": 4.5120034414336566e-06, "loss": 20.9457, "step": 64230 }, { "epoch": 0.69, "learning_rate": 4.509076804744009e-06, "loss": 21.7514, "step": 64240 }, { "epoch": 0.69, "learning_rate": 4.506150841214166e-06, "loss": 21.186, "step": 64250 }, { "epoch": 0.69, "learning_rate": 4.503225551202837e-06, "loss": 22.4171, "step": 64260 }, { "epoch": 0.69, "learning_rate": 4.500300935068647e-06, "loss": 21.3038, "step": 64270 }, { "epoch": 0.69, "learning_rate": 4.49737699317014e-06, "loss": 21.7801, "step": 64280 }, { "epoch": 0.7, "learning_rate": 4.4944537258657774e-06, "loss": 21.363, "step": 64290 }, { "epoch": 0.7, "learning_rate": 4.491531133513936e-06, "loss": 21.0924, "step": 64300 }, { "epoch": 0.7, "learning_rate": 4.488609216472911e-06, "loss": 21.0737, "step": 64310 }, { "epoch": 0.7, "learning_rate": 4.4856879751009166e-06, "loss": 21.6313, "step": 64320 }, { "epoch": 0.7, "learning_rate": 4.482767409756079e-06, "loss": 20.6199, "step": 64330 }, { "epoch": 0.7, "learning_rate": 4.4798475207964484e-06, "loss": 21.3535, "step": 64340 }, { "epoch": 0.7, "learning_rate": 4.476928308579987e-06, "loss": 21.7273, "step": 64350 }, { "epoch": 0.7, "learning_rate": 4.474009773464576e-06, "loss": 20.9656, "step": 64360 }, { "epoch": 0.7, "learning_rate": 4.471091915808013e-06, "loss": 21.2117, "step": 64370 }, { "epoch": 0.7, "learning_rate": 4.468174735968014e-06, "loss": 20.9547, "step": 64380 }, { "epoch": 0.7, "learning_rate": 4.465258234302209e-06, "loss": 21.8765, "step": 64390 }, { "epoch": 0.7, "learning_rate": 4.4623424111681465e-06, "loss": 21.1978, "step": 64400 }, { "epoch": 0.7, "learning_rate": 4.459427266923293e-06, "loss": 21.2606, "step": 64410 }, { "epoch": 0.7, "learning_rate": 4.456512801925032e-06, "loss": 20.907, "step": 64420 }, { "epoch": 0.7, "learning_rate": 4.453599016530658e-06, "loss": 21.4383, "step": 64430 }, { "epoch": 0.7, "learning_rate": 4.450685911097391e-06, "loss": 20.5256, "step": 64440 }, { "epoch": 0.7, "learning_rate": 4.44777348598236e-06, "loss": 21.2423, "step": 64450 }, { "epoch": 0.7, "learning_rate": 4.4448617415426165e-06, "loss": 21.0695, "step": 64460 }, { "epoch": 0.7, "learning_rate": 4.4419506781351255e-06, "loss": 21.743, "step": 64470 }, { "epoch": 0.7, "learning_rate": 4.439040296116766e-06, "loss": 21.9907, "step": 64480 }, { "epoch": 0.7, "learning_rate": 4.436130595844339e-06, "loss": 20.5856, "step": 64490 }, { "epoch": 0.7, "learning_rate": 4.4332215776745575e-06, "loss": 21.3673, "step": 64500 }, { "epoch": 0.7, "learning_rate": 4.430313241964056e-06, "loss": 21.2479, "step": 64510 }, { "epoch": 0.7, "learning_rate": 4.427405589069378e-06, "loss": 20.8131, "step": 64520 }, { "epoch": 0.7, "learning_rate": 4.424498619346985e-06, "loss": 22.2523, "step": 64530 }, { "epoch": 0.7, "learning_rate": 4.421592333153268e-06, "loss": 21.3233, "step": 64540 }, { "epoch": 0.7, "learning_rate": 4.4186867308445135e-06, "loss": 21.6575, "step": 64550 }, { "epoch": 0.7, "learning_rate": 4.415781812776936e-06, "loss": 20.9243, "step": 64560 }, { "epoch": 0.7, "learning_rate": 4.412877579306664e-06, "loss": 21.7302, "step": 64570 }, { "epoch": 0.7, "learning_rate": 4.409974030789739e-06, "loss": 21.4457, "step": 64580 }, { "epoch": 0.7, "learning_rate": 4.407071167582132e-06, "loss": 20.8557, "step": 64590 }, { "epoch": 0.7, "learning_rate": 4.4041689900397086e-06, "loss": 20.6721, "step": 64600 }, { "epoch": 0.7, "learning_rate": 4.401267498518266e-06, "loss": 21.2953, "step": 64610 }, { "epoch": 0.7, "learning_rate": 4.398366693373511e-06, "loss": 21.4462, "step": 64620 }, { "epoch": 0.7, "learning_rate": 4.395466574961066e-06, "loss": 21.2062, "step": 64630 }, { "epoch": 0.7, "learning_rate": 4.39256714363648e-06, "loss": 21.376, "step": 64640 }, { "epoch": 0.7, "learning_rate": 4.389668399755199e-06, "loss": 21.4615, "step": 64650 }, { "epoch": 0.7, "learning_rate": 4.386770343672598e-06, "loss": 21.2441, "step": 64660 }, { "epoch": 0.7, "learning_rate": 4.3838729757439655e-06, "loss": 22.2432, "step": 64670 }, { "epoch": 0.7, "learning_rate": 4.380976296324499e-06, "loss": 21.5643, "step": 64680 }, { "epoch": 0.7, "learning_rate": 4.378080305769324e-06, "loss": 21.2129, "step": 64690 }, { "epoch": 0.7, "learning_rate": 4.375185004433476e-06, "loss": 20.9261, "step": 64700 }, { "epoch": 0.7, "learning_rate": 4.3722903926718965e-06, "loss": 21.1384, "step": 64710 }, { "epoch": 0.7, "learning_rate": 4.369396470839453e-06, "loss": 21.4875, "step": 64720 }, { "epoch": 0.7, "learning_rate": 4.3665032392909245e-06, "loss": 20.3151, "step": 64730 }, { "epoch": 0.7, "learning_rate": 4.363610698381014e-06, "loss": 20.8806, "step": 64740 }, { "epoch": 0.7, "learning_rate": 4.360718848464329e-06, "loss": 20.5701, "step": 64750 }, { "epoch": 0.7, "learning_rate": 4.357827689895392e-06, "loss": 21.4671, "step": 64760 }, { "epoch": 0.7, "learning_rate": 4.354937223028648e-06, "loss": 20.6589, "step": 64770 }, { "epoch": 0.7, "learning_rate": 4.352047448218448e-06, "loss": 21.0568, "step": 64780 }, { "epoch": 0.7, "learning_rate": 4.3491583658190735e-06, "loss": 20.9586, "step": 64790 }, { "epoch": 0.7, "learning_rate": 4.346269976184711e-06, "loss": 21.3864, "step": 64800 }, { "epoch": 0.7, "learning_rate": 4.343382279669457e-06, "loss": 20.7823, "step": 64810 }, { "epoch": 0.7, "learning_rate": 4.340495276627329e-06, "loss": 20.9516, "step": 64820 }, { "epoch": 0.7, "learning_rate": 4.337608967412257e-06, "loss": 21.4004, "step": 64830 }, { "epoch": 0.7, "learning_rate": 4.334723352378095e-06, "loss": 20.0968, "step": 64840 }, { "epoch": 0.7, "learning_rate": 4.3318384318786035e-06, "loss": 21.138, "step": 64850 }, { "epoch": 0.7, "learning_rate": 4.3289542062674605e-06, "loss": 20.6943, "step": 64860 }, { "epoch": 0.7, "learning_rate": 4.326070675898252e-06, "loss": 20.3861, "step": 64870 }, { "epoch": 0.7, "learning_rate": 4.323187841124483e-06, "loss": 20.6303, "step": 64880 }, { "epoch": 0.7, "learning_rate": 4.320305702299583e-06, "loss": 21.0086, "step": 64890 }, { "epoch": 0.7, "learning_rate": 4.317424259776884e-06, "loss": 21.2827, "step": 64900 }, { "epoch": 0.7, "learning_rate": 4.314543513909639e-06, "loss": 21.4213, "step": 64910 }, { "epoch": 0.7, "learning_rate": 4.311663465051008e-06, "loss": 21.2901, "step": 64920 }, { "epoch": 0.7, "learning_rate": 4.30878411355407e-06, "loss": 21.0751, "step": 64930 }, { "epoch": 0.7, "learning_rate": 4.305905459771825e-06, "loss": 21.1106, "step": 64940 }, { "epoch": 0.7, "learning_rate": 4.303027504057179e-06, "loss": 21.6284, "step": 64950 }, { "epoch": 0.7, "learning_rate": 4.300150246762955e-06, "loss": 20.9641, "step": 64960 }, { "epoch": 0.7, "learning_rate": 4.297273688241895e-06, "loss": 20.8321, "step": 64970 }, { "epoch": 0.7, "learning_rate": 4.294397828846637e-06, "loss": 20.8813, "step": 64980 }, { "epoch": 0.7, "learning_rate": 4.291522668929759e-06, "loss": 21.3896, "step": 64990 }, { "epoch": 0.7, "learning_rate": 4.288648208843741e-06, "loss": 21.7304, "step": 65000 }, { "epoch": 0.7, "learning_rate": 4.2857744489409725e-06, "loss": 20.7359, "step": 65010 }, { "epoch": 0.7, "learning_rate": 4.282901389573769e-06, "loss": 21.3406, "step": 65020 }, { "epoch": 0.7, "learning_rate": 4.280029031094341e-06, "loss": 21.4267, "step": 65030 }, { "epoch": 0.7, "learning_rate": 4.277157373854838e-06, "loss": 21.0941, "step": 65040 }, { "epoch": 0.7, "learning_rate": 4.274286418207305e-06, "loss": 21.3128, "step": 65050 }, { "epoch": 0.7, "learning_rate": 4.271416164503708e-06, "loss": 21.3179, "step": 65060 }, { "epoch": 0.7, "learning_rate": 4.268546613095928e-06, "loss": 21.197, "step": 65070 }, { "epoch": 0.7, "learning_rate": 4.2656777643357485e-06, "loss": 21.473, "step": 65080 }, { "epoch": 0.7, "learning_rate": 4.262809618574887e-06, "loss": 20.8964, "step": 65090 }, { "epoch": 0.7, "learning_rate": 4.259942176164958e-06, "loss": 21.063, "step": 65100 }, { "epoch": 0.7, "learning_rate": 4.257075437457499e-06, "loss": 21.233, "step": 65110 }, { "epoch": 0.7, "learning_rate": 4.254209402803956e-06, "loss": 21.0737, "step": 65120 }, { "epoch": 0.7, "learning_rate": 4.25134407255569e-06, "loss": 20.6278, "step": 65130 }, { "epoch": 0.7, "learning_rate": 4.248479447063977e-06, "loss": 21.4354, "step": 65140 }, { "epoch": 0.7, "learning_rate": 4.245615526680006e-06, "loss": 21.2609, "step": 65150 }, { "epoch": 0.7, "learning_rate": 4.242752311754879e-06, "loss": 20.6679, "step": 65160 }, { "epoch": 0.7, "learning_rate": 4.239889802639611e-06, "loss": 21.4668, "step": 65170 }, { "epoch": 0.7, "learning_rate": 4.237027999685133e-06, "loss": 20.8487, "step": 65180 }, { "epoch": 0.7, "learning_rate": 4.234166903242287e-06, "loss": 22.1163, "step": 65190 }, { "epoch": 0.7, "learning_rate": 4.231306513661829e-06, "loss": 21.0526, "step": 65200 }, { "epoch": 0.7, "learning_rate": 4.22844683129443e-06, "loss": 21.7053, "step": 65210 }, { "epoch": 0.71, "learning_rate": 4.225587856490669e-06, "loss": 21.6719, "step": 65220 }, { "epoch": 0.71, "learning_rate": 4.222729589601047e-06, "loss": 21.4435, "step": 65230 }, { "epoch": 0.71, "learning_rate": 4.219872030975969e-06, "loss": 21.5067, "step": 65240 }, { "epoch": 0.71, "learning_rate": 4.21701518096576e-06, "loss": 21.7388, "step": 65250 }, { "epoch": 0.71, "learning_rate": 4.214159039920654e-06, "loss": 20.5011, "step": 65260 }, { "epoch": 0.71, "learning_rate": 4.211303608190802e-06, "loss": 21.6496, "step": 65270 }, { "epoch": 0.71, "learning_rate": 4.208448886126264e-06, "loss": 20.5073, "step": 65280 }, { "epoch": 0.71, "learning_rate": 4.205594874077014e-06, "loss": 21.3422, "step": 65290 }, { "epoch": 0.71, "learning_rate": 4.202741572392941e-06, "loss": 21.68, "step": 65300 }, { "epoch": 0.71, "learning_rate": 4.199888981423845e-06, "loss": 21.0569, "step": 65310 }, { "epoch": 0.71, "learning_rate": 4.197037101519439e-06, "loss": 20.9267, "step": 65320 }, { "epoch": 0.71, "learning_rate": 4.19418593302935e-06, "loss": 21.0604, "step": 65330 }, { "epoch": 0.71, "learning_rate": 4.191335476303118e-06, "loss": 21.7358, "step": 65340 }, { "epoch": 0.71, "learning_rate": 4.188485731690192e-06, "loss": 20.8981, "step": 65350 }, { "epoch": 0.71, "learning_rate": 4.185636699539939e-06, "loss": 21.2391, "step": 65360 }, { "epoch": 0.71, "learning_rate": 4.182788380201634e-06, "loss": 21.0493, "step": 65370 }, { "epoch": 0.71, "learning_rate": 4.179940774024469e-06, "loss": 21.1605, "step": 65380 }, { "epoch": 0.71, "learning_rate": 4.177093881357545e-06, "loss": 21.4989, "step": 65390 }, { "epoch": 0.71, "learning_rate": 4.174247702549877e-06, "loss": 20.3191, "step": 65400 }, { "epoch": 0.71, "learning_rate": 4.171402237950393e-06, "loss": 21.0045, "step": 65410 }, { "epoch": 0.71, "learning_rate": 4.168557487907932e-06, "loss": 20.5612, "step": 65420 }, { "epoch": 0.71, "learning_rate": 4.165713452771245e-06, "loss": 21.2025, "step": 65430 }, { "epoch": 0.71, "learning_rate": 4.162870132888998e-06, "loss": 22.5184, "step": 65440 }, { "epoch": 0.71, "learning_rate": 4.1600275286097704e-06, "loss": 21.1038, "step": 65450 }, { "epoch": 0.71, "learning_rate": 4.157185640282047e-06, "loss": 20.8929, "step": 65460 }, { "epoch": 0.71, "learning_rate": 4.15434446825423e-06, "loss": 21.403, "step": 65470 }, { "epoch": 0.71, "learning_rate": 4.151504012874634e-06, "loss": 20.9284, "step": 65480 }, { "epoch": 0.71, "learning_rate": 4.148664274491485e-06, "loss": 21.5856, "step": 65490 }, { "epoch": 0.71, "learning_rate": 4.145825253452921e-06, "loss": 21.0896, "step": 65500 }, { "epoch": 0.71, "learning_rate": 4.14298695010699e-06, "loss": 21.118, "step": 65510 }, { "epoch": 0.71, "learning_rate": 4.140149364801654e-06, "loss": 21.1383, "step": 65520 }, { "epoch": 0.71, "learning_rate": 4.137312497884789e-06, "loss": 20.9513, "step": 65530 }, { "epoch": 0.71, "learning_rate": 4.134476349704179e-06, "loss": 21.5909, "step": 65540 }, { "epoch": 0.71, "learning_rate": 4.131640920607518e-06, "loss": 21.2061, "step": 65550 }, { "epoch": 0.71, "learning_rate": 4.128806210942426e-06, "loss": 22.1944, "step": 65560 }, { "epoch": 0.71, "learning_rate": 4.125972221056416e-06, "loss": 21.5858, "step": 65570 }, { "epoch": 0.71, "learning_rate": 4.123138951296921e-06, "loss": 21.153, "step": 65580 }, { "epoch": 0.71, "learning_rate": 4.120306402011288e-06, "loss": 21.4352, "step": 65590 }, { "epoch": 0.71, "learning_rate": 4.11747457354677e-06, "loss": 21.2333, "step": 65600 }, { "epoch": 0.71, "learning_rate": 4.114643466250544e-06, "loss": 21.2597, "step": 65610 }, { "epoch": 0.71, "learning_rate": 4.111813080469681e-06, "loss": 21.6252, "step": 65620 }, { "epoch": 0.71, "learning_rate": 4.1089834165511744e-06, "loss": 21.3054, "step": 65630 }, { "epoch": 0.71, "learning_rate": 4.106154474841928e-06, "loss": 20.8589, "step": 65640 }, { "epoch": 0.71, "learning_rate": 4.103326255688751e-06, "loss": 21.3481, "step": 65650 }, { "epoch": 0.71, "learning_rate": 4.100498759438376e-06, "loss": 21.5563, "step": 65660 }, { "epoch": 0.71, "learning_rate": 4.097671986437441e-06, "loss": 20.6664, "step": 65670 }, { "epoch": 0.71, "learning_rate": 4.094845937032488e-06, "loss": 21.7577, "step": 65680 }, { "epoch": 0.71, "learning_rate": 4.092020611569978e-06, "loss": 21.0341, "step": 65690 }, { "epoch": 0.71, "learning_rate": 4.0891960103962804e-06, "loss": 20.6825, "step": 65700 }, { "epoch": 0.71, "learning_rate": 4.086372133857681e-06, "loss": 21.0723, "step": 65710 }, { "epoch": 0.71, "learning_rate": 4.083548982300377e-06, "loss": 21.8208, "step": 65720 }, { "epoch": 0.71, "learning_rate": 4.080726556070464e-06, "loss": 21.4808, "step": 65730 }, { "epoch": 0.71, "learning_rate": 4.077904855513959e-06, "loss": 20.7147, "step": 65740 }, { "epoch": 0.71, "learning_rate": 4.0750838809767875e-06, "loss": 21.6268, "step": 65750 }, { "epoch": 0.71, "learning_rate": 4.0722636328047924e-06, "loss": 21.0947, "step": 65760 }, { "epoch": 0.71, "learning_rate": 4.069444111343723e-06, "loss": 20.4908, "step": 65770 }, { "epoch": 0.71, "learning_rate": 4.066625316939233e-06, "loss": 21.4963, "step": 65780 }, { "epoch": 0.71, "learning_rate": 4.063807249936892e-06, "loss": 21.8584, "step": 65790 }, { "epoch": 0.71, "learning_rate": 4.060989910682181e-06, "loss": 20.7471, "step": 65800 }, { "epoch": 0.71, "learning_rate": 4.058173299520496e-06, "loss": 21.0582, "step": 65810 }, { "epoch": 0.71, "learning_rate": 4.055357416797139e-06, "loss": 20.8402, "step": 65820 }, { "epoch": 0.71, "learning_rate": 4.052542262857324e-06, "loss": 21.3977, "step": 65830 }, { "epoch": 0.71, "learning_rate": 4.04972783804617e-06, "loss": 21.4037, "step": 65840 }, { "epoch": 0.71, "learning_rate": 4.04691414270871e-06, "loss": 20.7726, "step": 65850 }, { "epoch": 0.71, "learning_rate": 4.044101177189897e-06, "loss": 21.1123, "step": 65860 }, { "epoch": 0.71, "learning_rate": 4.041288941834581e-06, "loss": 21.1458, "step": 65870 }, { "epoch": 0.71, "learning_rate": 4.038477436987535e-06, "loss": 21.0732, "step": 65880 }, { "epoch": 0.71, "learning_rate": 4.0356666629934245e-06, "loss": 21.3154, "step": 65890 }, { "epoch": 0.71, "learning_rate": 4.03285662019684e-06, "loss": 21.6181, "step": 65900 }, { "epoch": 0.71, "learning_rate": 4.030047308942283e-06, "loss": 21.2813, "step": 65910 }, { "epoch": 0.71, "learning_rate": 4.02723872957416e-06, "loss": 21.573, "step": 65920 }, { "epoch": 0.71, "learning_rate": 4.024430882436786e-06, "loss": 20.9981, "step": 65930 }, { "epoch": 0.71, "learning_rate": 4.021623767874396e-06, "loss": 21.1156, "step": 65940 }, { "epoch": 0.71, "learning_rate": 4.018817386231114e-06, "loss": 21.7601, "step": 65950 }, { "epoch": 0.71, "learning_rate": 4.016011737851001e-06, "loss": 21.1411, "step": 65960 }, { "epoch": 0.71, "learning_rate": 4.013206823078013e-06, "loss": 20.9655, "step": 65970 }, { "epoch": 0.71, "learning_rate": 4.010402642256016e-06, "loss": 21.3161, "step": 65980 }, { "epoch": 0.71, "learning_rate": 4.007599195728794e-06, "loss": 21.3259, "step": 65990 }, { "epoch": 0.71, "learning_rate": 4.004796483840023e-06, "loss": 21.288, "step": 66000 }, { "epoch": 0.71, "learning_rate": 4.001994506933315e-06, "loss": 22.1284, "step": 66010 }, { "epoch": 0.71, "learning_rate": 3.999193265352174e-06, "loss": 21.0111, "step": 66020 }, { "epoch": 0.71, "learning_rate": 3.996392759440015e-06, "loss": 20.8311, "step": 66030 }, { "epoch": 0.71, "learning_rate": 3.993592989540175e-06, "loss": 21.6714, "step": 66040 }, { "epoch": 0.71, "learning_rate": 3.990793955995876e-06, "loss": 21.4659, "step": 66050 }, { "epoch": 0.71, "learning_rate": 3.98799565915028e-06, "loss": 21.3718, "step": 66060 }, { "epoch": 0.71, "learning_rate": 3.9851980993464386e-06, "loss": 21.248, "step": 66070 }, { "epoch": 0.71, "learning_rate": 3.98240127692732e-06, "loss": 21.8956, "step": 66080 }, { "epoch": 0.71, "learning_rate": 3.979605192235799e-06, "loss": 20.8987, "step": 66090 }, { "epoch": 0.71, "learning_rate": 3.9768098456146645e-06, "loss": 21.6532, "step": 66100 }, { "epoch": 0.71, "learning_rate": 3.9740152374066085e-06, "loss": 20.7754, "step": 66110 }, { "epoch": 0.71, "learning_rate": 3.971221367954239e-06, "loss": 20.7693, "step": 66120 }, { "epoch": 0.71, "learning_rate": 3.9684282376000685e-06, "loss": 20.6277, "step": 66130 }, { "epoch": 0.72, "learning_rate": 3.965635846686521e-06, "loss": 21.2775, "step": 66140 }, { "epoch": 0.72, "learning_rate": 3.962844195555931e-06, "loss": 21.2332, "step": 66150 }, { "epoch": 0.72, "learning_rate": 3.96005328455054e-06, "loss": 21.4765, "step": 66160 }, { "epoch": 0.72, "learning_rate": 3.9572631140125005e-06, "loss": 21.4112, "step": 66170 }, { "epoch": 0.72, "learning_rate": 3.954473684283873e-06, "loss": 21.1134, "step": 66180 }, { "epoch": 0.72, "learning_rate": 3.951684995706628e-06, "loss": 20.7852, "step": 66190 }, { "epoch": 0.72, "learning_rate": 3.9488970486226445e-06, "loss": 20.5856, "step": 66200 }, { "epoch": 0.72, "learning_rate": 3.94610984337371e-06, "loss": 21.1566, "step": 66210 }, { "epoch": 0.72, "learning_rate": 3.943323380301524e-06, "loss": 21.3131, "step": 66220 }, { "epoch": 0.72, "learning_rate": 3.9405376597476905e-06, "loss": 21.1396, "step": 66230 }, { "epoch": 0.72, "learning_rate": 3.937752682053728e-06, "loss": 21.2339, "step": 66240 }, { "epoch": 0.72, "learning_rate": 3.9349684475610585e-06, "loss": 21.3642, "step": 66250 }, { "epoch": 0.72, "learning_rate": 3.932184956611016e-06, "loss": 20.7219, "step": 66260 }, { "epoch": 0.72, "learning_rate": 3.929402209544843e-06, "loss": 20.7933, "step": 66270 }, { "epoch": 0.72, "learning_rate": 3.926620206703689e-06, "loss": 20.8951, "step": 66280 }, { "epoch": 0.72, "learning_rate": 3.9238389484286155e-06, "loss": 21.3394, "step": 66290 }, { "epoch": 0.72, "learning_rate": 3.9210584350605905e-06, "loss": 21.1139, "step": 66300 }, { "epoch": 0.72, "learning_rate": 3.91827866694049e-06, "loss": 20.6219, "step": 66310 }, { "epoch": 0.72, "learning_rate": 3.915499644409101e-06, "loss": 21.0529, "step": 66320 }, { "epoch": 0.72, "learning_rate": 3.9127213678071165e-06, "loss": 21.6343, "step": 66330 }, { "epoch": 0.72, "learning_rate": 3.909943837475141e-06, "loss": 20.9549, "step": 66340 }, { "epoch": 0.72, "learning_rate": 3.907167053753683e-06, "loss": 20.5956, "step": 66350 }, { "epoch": 0.72, "learning_rate": 3.904391016983165e-06, "loss": 20.7415, "step": 66360 }, { "epoch": 0.72, "learning_rate": 3.901615727503916e-06, "loss": 21.3893, "step": 66370 }, { "epoch": 0.72, "learning_rate": 3.898841185656171e-06, "loss": 21.1375, "step": 66380 }, { "epoch": 0.72, "learning_rate": 3.896067391780074e-06, "loss": 21.0374, "step": 66390 }, { "epoch": 0.72, "learning_rate": 3.89329434621568e-06, "loss": 20.8116, "step": 66400 }, { "epoch": 0.72, "learning_rate": 3.890522049302949e-06, "loss": 21.8525, "step": 66410 }, { "epoch": 0.72, "learning_rate": 3.887750501381754e-06, "loss": 21.4239, "step": 66420 }, { "epoch": 0.72, "learning_rate": 3.884979702791869e-06, "loss": 20.6914, "step": 66430 }, { "epoch": 0.72, "learning_rate": 3.882209653872983e-06, "loss": 21.5402, "step": 66440 }, { "epoch": 0.72, "learning_rate": 3.879440354964688e-06, "loss": 20.723, "step": 66450 }, { "epoch": 0.72, "learning_rate": 3.876671806406488e-06, "loss": 21.2382, "step": 66460 }, { "epoch": 0.72, "learning_rate": 3.873904008537792e-06, "loss": 21.2282, "step": 66470 }, { "epoch": 0.72, "learning_rate": 3.8711369616979185e-06, "loss": 21.2569, "step": 66480 }, { "epoch": 0.72, "learning_rate": 3.8683706662260945e-06, "loss": 21.5477, "step": 66490 }, { "epoch": 0.72, "learning_rate": 3.865605122461453e-06, "loss": 21.5073, "step": 66500 }, { "epoch": 0.72, "learning_rate": 3.862840330743038e-06, "loss": 21.2336, "step": 66510 }, { "epoch": 0.72, "learning_rate": 3.860076291409792e-06, "loss": 21.7125, "step": 66520 }, { "epoch": 0.72, "learning_rate": 3.8573130048005855e-06, "loss": 21.3069, "step": 66530 }, { "epoch": 0.72, "learning_rate": 3.8545504712541725e-06, "loss": 21.2005, "step": 66540 }, { "epoch": 0.72, "learning_rate": 3.85178869110923e-06, "loss": 21.7788, "step": 66550 }, { "epoch": 0.72, "learning_rate": 3.849027664704337e-06, "loss": 20.921, "step": 66560 }, { "epoch": 0.72, "learning_rate": 3.846267392377979e-06, "loss": 21.2221, "step": 66570 }, { "epoch": 0.72, "learning_rate": 3.843507874468563e-06, "loss": 21.3206, "step": 66580 }, { "epoch": 0.72, "learning_rate": 3.84074911131438e-06, "loss": 20.6837, "step": 66590 }, { "epoch": 0.72, "learning_rate": 3.837991103253646e-06, "loss": 20.9075, "step": 66600 }, { "epoch": 0.72, "learning_rate": 3.835233850624476e-06, "loss": 21.8526, "step": 66610 }, { "epoch": 0.72, "learning_rate": 3.832477353764895e-06, "loss": 20.7729, "step": 66620 }, { "epoch": 0.72, "learning_rate": 3.829721613012841e-06, "loss": 21.4664, "step": 66630 }, { "epoch": 0.72, "learning_rate": 3.826966628706155e-06, "loss": 21.2838, "step": 66640 }, { "epoch": 0.72, "learning_rate": 3.824212401182576e-06, "loss": 21.8546, "step": 66650 }, { "epoch": 0.72, "learning_rate": 3.821458930779765e-06, "loss": 21.6433, "step": 66660 }, { "epoch": 0.72, "learning_rate": 3.818706217835277e-06, "loss": 20.8518, "step": 66670 }, { "epoch": 0.72, "learning_rate": 3.8159542626865895e-06, "loss": 20.9197, "step": 66680 }, { "epoch": 0.72, "learning_rate": 3.813203065671078e-06, "loss": 21.1963, "step": 66690 }, { "epoch": 0.72, "learning_rate": 3.810452627126019e-06, "loss": 21.6534, "step": 66700 }, { "epoch": 0.72, "learning_rate": 3.807702947388605e-06, "loss": 20.914, "step": 66710 }, { "epoch": 0.72, "learning_rate": 3.8049540267959305e-06, "loss": 21.3788, "step": 66720 }, { "epoch": 0.72, "learning_rate": 3.8022058656850068e-06, "loss": 21.1977, "step": 66730 }, { "epoch": 0.72, "learning_rate": 3.7994584643927445e-06, "loss": 21.4413, "step": 66740 }, { "epoch": 0.72, "learning_rate": 3.796711823255953e-06, "loss": 21.2098, "step": 66750 }, { "epoch": 0.72, "learning_rate": 3.7939659426113616e-06, "loss": 21.7925, "step": 66760 }, { "epoch": 0.72, "learning_rate": 3.791220822795597e-06, "loss": 21.5208, "step": 66770 }, { "epoch": 0.72, "learning_rate": 3.7884764641452064e-06, "loss": 22.0815, "step": 66780 }, { "epoch": 0.72, "learning_rate": 3.7857328669966287e-06, "loss": 21.1524, "step": 66790 }, { "epoch": 0.72, "learning_rate": 3.782990031686219e-06, "loss": 20.8428, "step": 66800 }, { "epoch": 0.72, "learning_rate": 3.7802479585502296e-06, "loss": 21.0945, "step": 66810 }, { "epoch": 0.72, "learning_rate": 3.7775066479248248e-06, "loss": 21.1948, "step": 66820 }, { "epoch": 0.72, "learning_rate": 3.774766100146081e-06, "loss": 20.5541, "step": 66830 }, { "epoch": 0.72, "learning_rate": 3.7720263155499737e-06, "loss": 21.3245, "step": 66840 }, { "epoch": 0.72, "learning_rate": 3.769287294472389e-06, "loss": 21.2641, "step": 66850 }, { "epoch": 0.72, "learning_rate": 3.766549037249112e-06, "loss": 20.932, "step": 66860 }, { "epoch": 0.72, "learning_rate": 3.7638115442158374e-06, "loss": 21.5031, "step": 66870 }, { "epoch": 0.72, "learning_rate": 3.7610748157081777e-06, "loss": 21.101, "step": 66880 }, { "epoch": 0.72, "learning_rate": 3.758338852061636e-06, "loss": 21.4875, "step": 66890 }, { "epoch": 0.72, "learning_rate": 3.755603653611629e-06, "loss": 21.4747, "step": 66900 }, { "epoch": 0.72, "learning_rate": 3.7528692206934826e-06, "loss": 20.2967, "step": 66910 }, { "epoch": 0.72, "learning_rate": 3.7501355536424135e-06, "loss": 21.8482, "step": 66920 }, { "epoch": 0.72, "learning_rate": 3.747402652793566e-06, "loss": 21.2633, "step": 66930 }, { "epoch": 0.72, "learning_rate": 3.7446705184819765e-06, "loss": 21.5528, "step": 66940 }, { "epoch": 0.72, "learning_rate": 3.7419391510425905e-06, "loss": 21.2488, "step": 66950 }, { "epoch": 0.72, "learning_rate": 3.739208550810265e-06, "loss": 21.4327, "step": 66960 }, { "epoch": 0.72, "learning_rate": 3.736478718119747e-06, "loss": 21.3602, "step": 66970 }, { "epoch": 0.72, "learning_rate": 3.7337496533057107e-06, "loss": 20.9521, "step": 66980 }, { "epoch": 0.72, "learning_rate": 3.731021356702722e-06, "loss": 21.1352, "step": 66990 }, { "epoch": 0.72, "learning_rate": 3.728293828645256e-06, "loss": 21.5463, "step": 67000 }, { "epoch": 0.72, "learning_rate": 3.7255670694676992e-06, "loss": 21.9949, "step": 67010 }, { "epoch": 0.72, "learning_rate": 3.722841079504327e-06, "loss": 20.8235, "step": 67020 }, { "epoch": 0.72, "learning_rate": 3.7201158590893427e-06, "loss": 21.2373, "step": 67030 }, { "epoch": 0.72, "learning_rate": 3.717391408556842e-06, "loss": 20.2928, "step": 67040 }, { "epoch": 0.72, "learning_rate": 3.7146677282408284e-06, "loss": 21.0504, "step": 67050 }, { "epoch": 0.72, "learning_rate": 3.7119448184752106e-06, "loss": 21.5112, "step": 67060 }, { "epoch": 0.73, "learning_rate": 3.709222679593806e-06, "loss": 20.6555, "step": 67070 }, { "epoch": 0.73, "learning_rate": 3.706501311930333e-06, "loss": 21.0902, "step": 67080 }, { "epoch": 0.73, "learning_rate": 3.703780715818419e-06, "loss": 21.0088, "step": 67090 }, { "epoch": 0.73, "learning_rate": 3.7010608915915946e-06, "loss": 21.5784, "step": 67100 }, { "epoch": 0.73, "learning_rate": 3.6983418395832983e-06, "loss": 20.8438, "step": 67110 }, { "epoch": 0.73, "learning_rate": 3.695623560126871e-06, "loss": 21.7833, "step": 67120 }, { "epoch": 0.73, "learning_rate": 3.6929060535555592e-06, "loss": 21.6531, "step": 67130 }, { "epoch": 0.73, "learning_rate": 3.6901893202025184e-06, "loss": 21.6692, "step": 67140 }, { "epoch": 0.73, "learning_rate": 3.687473360400805e-06, "loss": 21.2372, "step": 67150 }, { "epoch": 0.73, "learning_rate": 3.6847581744833818e-06, "loss": 21.3496, "step": 67160 }, { "epoch": 0.73, "learning_rate": 3.6820437627831173e-06, "loss": 21.5407, "step": 67170 }, { "epoch": 0.73, "learning_rate": 3.6793301256327853e-06, "loss": 21.3495, "step": 67180 }, { "epoch": 0.73, "learning_rate": 3.676617263365064e-06, "loss": 21.2701, "step": 67190 }, { "epoch": 0.73, "learning_rate": 3.6739051763125368e-06, "loss": 21.5598, "step": 67200 }, { "epoch": 0.73, "learning_rate": 3.6711938648076915e-06, "loss": 20.388, "step": 67210 }, { "epoch": 0.73, "learning_rate": 3.6684833291829224e-06, "loss": 21.0635, "step": 67220 }, { "epoch": 0.73, "learning_rate": 3.6657735697705267e-06, "loss": 21.7669, "step": 67230 }, { "epoch": 0.73, "learning_rate": 3.663064586902708e-06, "loss": 22.0583, "step": 67240 }, { "epoch": 0.73, "learning_rate": 3.6603563809115738e-06, "loss": 21.541, "step": 67250 }, { "epoch": 0.73, "learning_rate": 3.657648952129137e-06, "loss": 21.0229, "step": 67260 }, { "epoch": 0.73, "learning_rate": 3.654942300887314e-06, "loss": 21.3396, "step": 67270 }, { "epoch": 0.73, "learning_rate": 3.6522364275179277e-06, "loss": 21.5152, "step": 67280 }, { "epoch": 0.73, "learning_rate": 3.6495313323527038e-06, "loss": 20.7008, "step": 67290 }, { "epoch": 0.73, "learning_rate": 3.6468270157232745e-06, "loss": 20.7906, "step": 67300 }, { "epoch": 0.73, "learning_rate": 3.6441234779611744e-06, "loss": 21.5555, "step": 67310 }, { "epoch": 0.73, "learning_rate": 3.6414207193978457e-06, "loss": 21.0142, "step": 67320 }, { "epoch": 0.73, "learning_rate": 3.6387187403646276e-06, "loss": 21.814, "step": 67330 }, { "epoch": 0.73, "learning_rate": 3.63601754119278e-06, "loss": 20.8451, "step": 67340 }, { "epoch": 0.73, "learning_rate": 3.633317122213447e-06, "loss": 20.8154, "step": 67350 }, { "epoch": 0.73, "learning_rate": 3.630617483757688e-06, "loss": 21.0641, "step": 67360 }, { "epoch": 0.73, "learning_rate": 3.627918626156468e-06, "loss": 21.8936, "step": 67370 }, { "epoch": 0.73, "learning_rate": 3.625220549740649e-06, "loss": 21.981, "step": 67380 }, { "epoch": 0.73, "learning_rate": 3.6225232548410105e-06, "loss": 21.1126, "step": 67390 }, { "epoch": 0.73, "learning_rate": 3.619826741788219e-06, "loss": 21.2849, "step": 67400 }, { "epoch": 0.73, "learning_rate": 3.6171310109128564e-06, "loss": 20.7498, "step": 67410 }, { "epoch": 0.73, "learning_rate": 3.6144360625454056e-06, "loss": 21.0041, "step": 67420 }, { "epoch": 0.73, "learning_rate": 3.61174189701625e-06, "loss": 21.0572, "step": 67430 }, { "epoch": 0.73, "learning_rate": 3.609048514655692e-06, "loss": 21.1995, "step": 67440 }, { "epoch": 0.73, "learning_rate": 3.6063559157939165e-06, "loss": 21.1284, "step": 67450 }, { "epoch": 0.73, "learning_rate": 3.603664100761026e-06, "loss": 21.1865, "step": 67460 }, { "epoch": 0.73, "learning_rate": 3.600973069887024e-06, "loss": 21.1115, "step": 67470 }, { "epoch": 0.73, "learning_rate": 3.598282823501812e-06, "loss": 21.261, "step": 67480 }, { "epoch": 0.73, "learning_rate": 3.5955933619352102e-06, "loss": 21.3991, "step": 67490 }, { "epoch": 0.73, "learning_rate": 3.5929046855169314e-06, "loss": 21.0677, "step": 67500 }, { "epoch": 0.73, "learning_rate": 3.5902167945765885e-06, "loss": 21.383, "step": 67510 }, { "epoch": 0.73, "learning_rate": 3.5875296894437063e-06, "loss": 20.6923, "step": 67520 }, { "epoch": 0.73, "learning_rate": 3.584843370447707e-06, "loss": 21.6484, "step": 67530 }, { "epoch": 0.73, "learning_rate": 3.5821578379179267e-06, "loss": 20.9245, "step": 67540 }, { "epoch": 0.73, "learning_rate": 3.5794730921835974e-06, "loss": 20.9725, "step": 67550 }, { "epoch": 0.73, "learning_rate": 3.5767891335738513e-06, "loss": 21.393, "step": 67560 }, { "epoch": 0.73, "learning_rate": 3.5741059624177287e-06, "loss": 21.396, "step": 67570 }, { "epoch": 0.73, "learning_rate": 3.571423579044175e-06, "loss": 21.3826, "step": 67580 }, { "epoch": 0.73, "learning_rate": 3.5687419837820335e-06, "loss": 21.4545, "step": 67590 }, { "epoch": 0.73, "learning_rate": 3.5660611769600604e-06, "loss": 20.8824, "step": 67600 }, { "epoch": 0.73, "learning_rate": 3.5633811589069102e-06, "loss": 21.9783, "step": 67610 }, { "epoch": 0.73, "learning_rate": 3.5607019299511326e-06, "loss": 21.3866, "step": 67620 }, { "epoch": 0.73, "learning_rate": 3.5580234904211896e-06, "loss": 21.9611, "step": 67630 }, { "epoch": 0.73, "learning_rate": 3.5553458406454433e-06, "loss": 21.106, "step": 67640 }, { "epoch": 0.73, "learning_rate": 3.5526689809521663e-06, "loss": 20.7303, "step": 67650 }, { "epoch": 0.73, "learning_rate": 3.5499929116695276e-06, "loss": 21.9224, "step": 67660 }, { "epoch": 0.73, "learning_rate": 3.5473176331255945e-06, "loss": 21.5987, "step": 67670 }, { "epoch": 0.73, "learning_rate": 3.5446431456483445e-06, "loss": 21.182, "step": 67680 }, { "epoch": 0.73, "learning_rate": 3.5419694495656543e-06, "loss": 21.6851, "step": 67690 }, { "epoch": 0.73, "learning_rate": 3.5392965452053117e-06, "loss": 20.7387, "step": 67700 }, { "epoch": 0.73, "learning_rate": 3.5366244328950015e-06, "loss": 22.046, "step": 67710 }, { "epoch": 0.73, "learning_rate": 3.5339531129623062e-06, "loss": 20.5941, "step": 67720 }, { "epoch": 0.73, "learning_rate": 3.531282585734718e-06, "loss": 21.3091, "step": 67730 }, { "epoch": 0.73, "learning_rate": 3.5286128515396257e-06, "loss": 21.7525, "step": 67740 }, { "epoch": 0.73, "learning_rate": 3.5259439107043357e-06, "loss": 20.6575, "step": 67750 }, { "epoch": 0.73, "learning_rate": 3.52327576355604e-06, "loss": 21.176, "step": 67760 }, { "epoch": 0.73, "learning_rate": 3.520608410421846e-06, "loss": 21.0933, "step": 67770 }, { "epoch": 0.73, "learning_rate": 3.51794185162875e-06, "loss": 21.2546, "step": 67780 }, { "epoch": 0.73, "learning_rate": 3.5152760875036583e-06, "loss": 21.884, "step": 67790 }, { "epoch": 0.73, "learning_rate": 3.512611118373388e-06, "loss": 20.7156, "step": 67800 }, { "epoch": 0.73, "learning_rate": 3.509946944564647e-06, "loss": 21.0202, "step": 67810 }, { "epoch": 0.73, "learning_rate": 3.507283566404054e-06, "loss": 21.5445, "step": 67820 }, { "epoch": 0.73, "learning_rate": 3.504620984218118e-06, "loss": 21.1155, "step": 67830 }, { "epoch": 0.73, "learning_rate": 3.501959198333259e-06, "loss": 21.4972, "step": 67840 }, { "epoch": 0.73, "learning_rate": 3.4992982090758055e-06, "loss": 20.5904, "step": 67850 }, { "epoch": 0.73, "learning_rate": 3.496638016771978e-06, "loss": 21.6061, "step": 67860 }, { "epoch": 0.73, "learning_rate": 3.4939786217479023e-06, "loss": 21.2107, "step": 67870 }, { "epoch": 0.73, "learning_rate": 3.4913200243296107e-06, "loss": 21.1138, "step": 67880 }, { "epoch": 0.73, "learning_rate": 3.4886622248430247e-06, "loss": 21.4953, "step": 67890 }, { "epoch": 0.73, "learning_rate": 3.4860052236139864e-06, "loss": 21.8037, "step": 67900 }, { "epoch": 0.73, "learning_rate": 3.4833490209682274e-06, "loss": 21.626, "step": 67910 }, { "epoch": 0.73, "learning_rate": 3.4806936172313853e-06, "loss": 22.1131, "step": 67920 }, { "epoch": 0.73, "learning_rate": 3.478039012729002e-06, "loss": 21.2713, "step": 67930 }, { "epoch": 0.73, "learning_rate": 3.4753852077865103e-06, "loss": 21.5401, "step": 67940 }, { "epoch": 0.73, "learning_rate": 3.472732202729263e-06, "loss": 21.6602, "step": 67950 }, { "epoch": 0.73, "learning_rate": 3.4700799978825005e-06, "loss": 21.4282, "step": 67960 }, { "epoch": 0.73, "learning_rate": 3.4674285935713715e-06, "loss": 21.1549, "step": 67970 }, { "epoch": 0.73, "learning_rate": 3.4647779901209278e-06, "loss": 20.6487, "step": 67980 }, { "epoch": 0.74, "learning_rate": 3.46212818785611e-06, "loss": 21.1088, "step": 67990 }, { "epoch": 0.74, "learning_rate": 3.4594791871017796e-06, "loss": 20.7309, "step": 68000 }, { "epoch": 0.74, "learning_rate": 3.45683098818269e-06, "loss": 21.3746, "step": 68010 }, { "epoch": 0.74, "learning_rate": 3.4541835914234955e-06, "loss": 21.527, "step": 68020 }, { "epoch": 0.74, "learning_rate": 3.451536997148753e-06, "loss": 21.6323, "step": 68030 }, { "epoch": 0.74, "learning_rate": 3.448891205682925e-06, "loss": 22.0005, "step": 68040 }, { "epoch": 0.74, "learning_rate": 3.4462462173503684e-06, "loss": 21.6702, "step": 68050 }, { "epoch": 0.74, "learning_rate": 3.4436020324753482e-06, "loss": 20.9438, "step": 68060 }, { "epoch": 0.74, "learning_rate": 3.440958651382027e-06, "loss": 21.1884, "step": 68070 }, { "epoch": 0.74, "learning_rate": 3.438316074394471e-06, "loss": 21.1445, "step": 68080 }, { "epoch": 0.74, "learning_rate": 3.435674301836647e-06, "loss": 21.0289, "step": 68090 }, { "epoch": 0.74, "learning_rate": 3.433033334032422e-06, "loss": 21.3653, "step": 68100 }, { "epoch": 0.74, "learning_rate": 3.430393171305566e-06, "loss": 20.9163, "step": 68110 }, { "epoch": 0.74, "learning_rate": 3.4277538139797504e-06, "loss": 22.0107, "step": 68120 }, { "epoch": 0.74, "learning_rate": 3.4251152623785468e-06, "loss": 20.8406, "step": 68130 }, { "epoch": 0.74, "learning_rate": 3.4224775168254285e-06, "loss": 21.2612, "step": 68140 }, { "epoch": 0.74, "learning_rate": 3.419840577643769e-06, "loss": 21.5029, "step": 68150 }, { "epoch": 0.74, "learning_rate": 3.4172044451568464e-06, "loss": 21.1767, "step": 68160 }, { "epoch": 0.74, "learning_rate": 3.414569119687835e-06, "loss": 21.3092, "step": 68170 }, { "epoch": 0.74, "learning_rate": 3.4119346015598133e-06, "loss": 21.4098, "step": 68180 }, { "epoch": 0.74, "learning_rate": 3.4093008910957605e-06, "loss": 20.4053, "step": 68190 }, { "epoch": 0.74, "learning_rate": 3.4066679886185562e-06, "loss": 21.3601, "step": 68200 }, { "epoch": 0.74, "learning_rate": 3.404035894450981e-06, "loss": 21.313, "step": 68210 }, { "epoch": 0.74, "learning_rate": 3.401404608915716e-06, "loss": 21.378, "step": 68220 }, { "epoch": 0.74, "learning_rate": 3.398774132335344e-06, "loss": 21.5508, "step": 68230 }, { "epoch": 0.74, "learning_rate": 3.3961444650323493e-06, "loss": 20.4637, "step": 68240 }, { "epoch": 0.74, "learning_rate": 3.3935156073291144e-06, "loss": 20.8936, "step": 68250 }, { "epoch": 0.74, "learning_rate": 3.390887559547925e-06, "loss": 21.4788, "step": 68260 }, { "epoch": 0.74, "learning_rate": 3.388260322010968e-06, "loss": 21.827, "step": 68270 }, { "epoch": 0.74, "learning_rate": 3.385633895040327e-06, "loss": 20.6928, "step": 68280 }, { "epoch": 0.74, "learning_rate": 3.38300827895799e-06, "loss": 21.2788, "step": 68290 }, { "epoch": 0.74, "learning_rate": 3.380383474085841e-06, "loss": 20.9277, "step": 68300 }, { "epoch": 0.74, "learning_rate": 3.377759480745679e-06, "loss": 20.4992, "step": 68310 }, { "epoch": 0.74, "learning_rate": 3.375136299259181e-06, "loss": 20.859, "step": 68320 }, { "epoch": 0.74, "learning_rate": 3.3725139299479403e-06, "loss": 20.7881, "step": 68330 }, { "epoch": 0.74, "learning_rate": 3.3698923731334453e-06, "loss": 21.6154, "step": 68340 }, { "epoch": 0.74, "learning_rate": 3.3672716291370845e-06, "loss": 21.2004, "step": 68350 }, { "epoch": 0.74, "learning_rate": 3.364651698280156e-06, "loss": 21.0729, "step": 68360 }, { "epoch": 0.74, "learning_rate": 3.3620325808838405e-06, "loss": 20.3241, "step": 68370 }, { "epoch": 0.74, "learning_rate": 3.359414277269232e-06, "loss": 21.5151, "step": 68380 }, { "epoch": 0.74, "learning_rate": 3.3567967877573225e-06, "loss": 21.2685, "step": 68390 }, { "epoch": 0.74, "learning_rate": 3.354180112669e-06, "loss": 21.2307, "step": 68400 }, { "epoch": 0.74, "learning_rate": 3.3515642523250647e-06, "loss": 21.0006, "step": 68410 }, { "epoch": 0.74, "learning_rate": 3.348949207046198e-06, "loss": 21.4359, "step": 68420 }, { "epoch": 0.74, "learning_rate": 3.3463349771529964e-06, "loss": 21.8306, "step": 68430 }, { "epoch": 0.74, "learning_rate": 3.343721562965949e-06, "loss": 21.041, "step": 68440 }, { "epoch": 0.74, "learning_rate": 3.3411089648054453e-06, "loss": 21.1966, "step": 68450 }, { "epoch": 0.74, "learning_rate": 3.3384971829917846e-06, "loss": 21.4881, "step": 68460 }, { "epoch": 0.74, "learning_rate": 3.3358862178451555e-06, "loss": 21.5452, "step": 68470 }, { "epoch": 0.74, "learning_rate": 3.333276069685646e-06, "loss": 21.2753, "step": 68480 }, { "epoch": 0.74, "learning_rate": 3.330666738833248e-06, "loss": 21.7209, "step": 68490 }, { "epoch": 0.74, "learning_rate": 3.32805822560785e-06, "loss": 21.143, "step": 68500 }, { "epoch": 0.74, "learning_rate": 3.3254505303292494e-06, "loss": 22.1457, "step": 68510 }, { "epoch": 0.74, "learning_rate": 3.322843653317136e-06, "loss": 21.1187, "step": 68520 }, { "epoch": 0.74, "learning_rate": 3.320237594891095e-06, "loss": 21.3942, "step": 68530 }, { "epoch": 0.74, "learning_rate": 3.317632355370618e-06, "loss": 21.3133, "step": 68540 }, { "epoch": 0.74, "learning_rate": 3.3150279350750914e-06, "loss": 20.4364, "step": 68550 }, { "epoch": 0.74, "learning_rate": 3.3124243343238103e-06, "loss": 21.3619, "step": 68560 }, { "epoch": 0.74, "learning_rate": 3.3098215534359613e-06, "loss": 21.0578, "step": 68570 }, { "epoch": 0.74, "learning_rate": 3.307219592730635e-06, "loss": 22.0657, "step": 68580 }, { "epoch": 0.74, "learning_rate": 3.304618452526811e-06, "loss": 21.3035, "step": 68590 }, { "epoch": 0.74, "learning_rate": 3.3020181331433776e-06, "loss": 21.2504, "step": 68600 }, { "epoch": 0.74, "learning_rate": 3.2994186348991265e-06, "loss": 20.718, "step": 68610 }, { "epoch": 0.74, "learning_rate": 3.29681995811274e-06, "loss": 21.398, "step": 68620 }, { "epoch": 0.74, "learning_rate": 3.2942221031028077e-06, "loss": 20.4066, "step": 68630 }, { "epoch": 0.74, "learning_rate": 3.291625070187806e-06, "loss": 21.1276, "step": 68640 }, { "epoch": 0.74, "learning_rate": 3.2890288596861187e-06, "loss": 21.3403, "step": 68650 }, { "epoch": 0.74, "learning_rate": 3.286433471916033e-06, "loss": 21.0434, "step": 68660 }, { "epoch": 0.74, "learning_rate": 3.28383890719573e-06, "loss": 21.4202, "step": 68670 }, { "epoch": 0.74, "learning_rate": 3.281245165843291e-06, "loss": 21.172, "step": 68680 }, { "epoch": 0.74, "learning_rate": 3.2786522481766915e-06, "loss": 21.1958, "step": 68690 }, { "epoch": 0.74, "learning_rate": 3.2760601545138093e-06, "loss": 21.5176, "step": 68700 }, { "epoch": 0.74, "learning_rate": 3.2734688851724273e-06, "loss": 20.9035, "step": 68710 }, { "epoch": 0.74, "learning_rate": 3.270878440470222e-06, "loss": 21.1907, "step": 68720 }, { "epoch": 0.74, "learning_rate": 3.2682888207247665e-06, "loss": 20.9505, "step": 68730 }, { "epoch": 0.74, "learning_rate": 3.2657000262535388e-06, "loss": 20.9836, "step": 68740 }, { "epoch": 0.74, "learning_rate": 3.263112057373904e-06, "loss": 22.1461, "step": 68750 }, { "epoch": 0.74, "learning_rate": 3.2605249144031427e-06, "loss": 21.9401, "step": 68760 }, { "epoch": 0.74, "learning_rate": 3.2579385976584223e-06, "loss": 21.2534, "step": 68770 }, { "epoch": 0.74, "learning_rate": 3.2553531074568125e-06, "loss": 20.7712, "step": 68780 }, { "epoch": 0.74, "learning_rate": 3.2527684441152853e-06, "loss": 21.1401, "step": 68790 }, { "epoch": 0.74, "learning_rate": 3.2501846079506983e-06, "loss": 21.3583, "step": 68800 }, { "epoch": 0.74, "learning_rate": 3.247601599279825e-06, "loss": 20.7239, "step": 68810 }, { "epoch": 0.74, "learning_rate": 3.2450194184193264e-06, "loss": 20.7775, "step": 68820 }, { "epoch": 0.74, "learning_rate": 3.2424380656857655e-06, "loss": 21.5743, "step": 68830 }, { "epoch": 0.74, "learning_rate": 3.2398575413956048e-06, "loss": 20.7993, "step": 68840 }, { "epoch": 0.74, "learning_rate": 3.237277845865201e-06, "loss": 21.5376, "step": 68850 }, { "epoch": 0.74, "learning_rate": 3.2346989794108143e-06, "loss": 21.0376, "step": 68860 }, { "epoch": 0.74, "learning_rate": 3.232120942348599e-06, "loss": 21.295, "step": 68870 }, { "epoch": 0.74, "learning_rate": 3.22954373499461e-06, "loss": 21.9701, "step": 68880 }, { "epoch": 0.74, "learning_rate": 3.226967357664801e-06, "loss": 21.0669, "step": 68890 }, { "epoch": 0.74, "learning_rate": 3.2243918106750215e-06, "loss": 21.089, "step": 68900 }, { "epoch": 0.74, "learning_rate": 3.2218170943410233e-06, "loss": 21.3541, "step": 68910 }, { "epoch": 0.75, "learning_rate": 3.219243208978451e-06, "loss": 21.0194, "step": 68920 }, { "epoch": 0.75, "learning_rate": 3.216670154902851e-06, "loss": 20.7138, "step": 68930 }, { "epoch": 0.75, "learning_rate": 3.214097932429667e-06, "loss": 21.5231, "step": 68940 }, { "epoch": 0.75, "learning_rate": 3.2115265418742415e-06, "loss": 21.6901, "step": 68950 }, { "epoch": 0.75, "learning_rate": 3.208955983551814e-06, "loss": 21.0647, "step": 68960 }, { "epoch": 0.75, "learning_rate": 3.2063862577775194e-06, "loss": 19.9668, "step": 68970 }, { "epoch": 0.75, "learning_rate": 3.2038173648663974e-06, "loss": 20.7807, "step": 68980 }, { "epoch": 0.75, "learning_rate": 3.2012493051333793e-06, "loss": 21.0435, "step": 68990 }, { "epoch": 0.75, "learning_rate": 3.198682078893296e-06, "loss": 21.2433, "step": 69000 }, { "epoch": 0.75, "learning_rate": 3.1961156864608767e-06, "loss": 21.1712, "step": 69010 }, { "epoch": 0.75, "learning_rate": 3.1935501281507496e-06, "loss": 21.4332, "step": 69020 }, { "epoch": 0.75, "learning_rate": 3.190985404277439e-06, "loss": 21.3496, "step": 69030 }, { "epoch": 0.75, "learning_rate": 3.1884215151553666e-06, "loss": 20.6534, "step": 69040 }, { "epoch": 0.75, "learning_rate": 3.185858461098853e-06, "loss": 21.1611, "step": 69050 }, { "epoch": 0.75, "learning_rate": 3.183296242422115e-06, "loss": 21.6336, "step": 69060 }, { "epoch": 0.75, "learning_rate": 3.1807348594392686e-06, "loss": 20.6947, "step": 69070 }, { "epoch": 0.75, "learning_rate": 3.178174312464326e-06, "loss": 21.5274, "step": 69080 }, { "epoch": 0.75, "learning_rate": 3.1756146018111976e-06, "loss": 21.1686, "step": 69090 }, { "epoch": 0.75, "learning_rate": 3.1730557277936925e-06, "loss": 21.201, "step": 69100 }, { "epoch": 0.75, "learning_rate": 3.1704976907255136e-06, "loss": 20.9729, "step": 69110 }, { "epoch": 0.75, "learning_rate": 3.167940490920266e-06, "loss": 21.1569, "step": 69120 }, { "epoch": 0.75, "learning_rate": 3.1653841286914476e-06, "loss": 20.9091, "step": 69130 }, { "epoch": 0.75, "learning_rate": 3.1628286043524568e-06, "loss": 20.6354, "step": 69140 }, { "epoch": 0.75, "learning_rate": 3.1602739182165877e-06, "loss": 21.6269, "step": 69150 }, { "epoch": 0.75, "learning_rate": 3.157720070597031e-06, "loss": 20.8024, "step": 69160 }, { "epoch": 0.75, "learning_rate": 3.1551670618068786e-06, "loss": 21.6259, "step": 69170 }, { "epoch": 0.75, "learning_rate": 3.1526148921591138e-06, "loss": 20.9687, "step": 69180 }, { "epoch": 0.75, "learning_rate": 3.150063561966621e-06, "loss": 21.0274, "step": 69190 }, { "epoch": 0.75, "learning_rate": 3.1475130715421807e-06, "loss": 20.9066, "step": 69200 }, { "epoch": 0.75, "learning_rate": 3.14496342119847e-06, "loss": 21.6445, "step": 69210 }, { "epoch": 0.75, "learning_rate": 3.1424146112480637e-06, "loss": 21.889, "step": 69220 }, { "epoch": 0.75, "learning_rate": 3.139866642003433e-06, "loss": 22.2785, "step": 69230 }, { "epoch": 0.75, "learning_rate": 3.137319513776945e-06, "loss": 20.7274, "step": 69240 }, { "epoch": 0.75, "learning_rate": 3.1347732268808674e-06, "loss": 21.6677, "step": 69250 }, { "epoch": 0.75, "learning_rate": 3.1322277816273606e-06, "loss": 21.1562, "step": 69260 }, { "epoch": 0.75, "learning_rate": 3.1296831783284807e-06, "loss": 21.4078, "step": 69270 }, { "epoch": 0.75, "learning_rate": 3.1271394172961933e-06, "loss": 20.675, "step": 69280 }, { "epoch": 0.75, "learning_rate": 3.1245964988423394e-06, "loss": 21.2601, "step": 69290 }, { "epoch": 0.75, "learning_rate": 3.1220544232786744e-06, "loss": 21.5494, "step": 69300 }, { "epoch": 0.75, "learning_rate": 3.1195131909168417e-06, "loss": 21.0501, "step": 69310 }, { "epoch": 0.75, "learning_rate": 3.1169728020683807e-06, "loss": 21.3201, "step": 69320 }, { "epoch": 0.75, "learning_rate": 3.114433257044741e-06, "loss": 21.2701, "step": 69330 }, { "epoch": 0.75, "learning_rate": 3.111894556157249e-06, "loss": 20.9201, "step": 69340 }, { "epoch": 0.75, "learning_rate": 3.1093566997171375e-06, "loss": 21.1558, "step": 69350 }, { "epoch": 0.75, "learning_rate": 3.1068196880355384e-06, "loss": 21.5272, "step": 69360 }, { "epoch": 0.75, "learning_rate": 3.1042835214234702e-06, "loss": 21.1877, "step": 69370 }, { "epoch": 0.75, "learning_rate": 3.1017482001918663e-06, "loss": 21.6529, "step": 69380 }, { "epoch": 0.75, "learning_rate": 3.099213724651534e-06, "loss": 20.9105, "step": 69390 }, { "epoch": 0.75, "learning_rate": 3.0966800951131905e-06, "loss": 20.9436, "step": 69400 }, { "epoch": 0.75, "learning_rate": 3.0941473118874452e-06, "loss": 20.8826, "step": 69410 }, { "epoch": 0.75, "learning_rate": 3.091615375284803e-06, "loss": 20.9017, "step": 69420 }, { "epoch": 0.75, "learning_rate": 3.0890842856156734e-06, "loss": 21.5659, "step": 69430 }, { "epoch": 0.75, "learning_rate": 3.086554043190354e-06, "loss": 21.1398, "step": 69440 }, { "epoch": 0.75, "learning_rate": 3.0840246483190338e-06, "loss": 21.1791, "step": 69450 }, { "epoch": 0.75, "learning_rate": 3.081496101311807e-06, "loss": 21.0891, "step": 69460 }, { "epoch": 0.75, "learning_rate": 3.078968402478659e-06, "loss": 20.5848, "step": 69470 }, { "epoch": 0.75, "learning_rate": 3.0764415521294777e-06, "loss": 21.723, "step": 69480 }, { "epoch": 0.75, "learning_rate": 3.0739155505740437e-06, "loss": 21.008, "step": 69490 }, { "epoch": 0.75, "learning_rate": 3.071390398122025e-06, "loss": 20.8761, "step": 69500 }, { "epoch": 0.75, "learning_rate": 3.0688660950829973e-06, "loss": 21.4332, "step": 69510 }, { "epoch": 0.75, "learning_rate": 3.0663426417664223e-06, "loss": 21.2543, "step": 69520 }, { "epoch": 0.75, "learning_rate": 3.0638200384816698e-06, "loss": 20.7606, "step": 69530 }, { "epoch": 0.75, "learning_rate": 3.061298285537997e-06, "loss": 20.7642, "step": 69540 }, { "epoch": 0.75, "learning_rate": 3.058777383244559e-06, "loss": 21.3298, "step": 69550 }, { "epoch": 0.75, "learning_rate": 3.0562573319104005e-06, "loss": 20.7218, "step": 69560 }, { "epoch": 0.75, "learning_rate": 3.053738131844467e-06, "loss": 21.4758, "step": 69570 }, { "epoch": 0.75, "learning_rate": 3.051219783355607e-06, "loss": 21.6201, "step": 69580 }, { "epoch": 0.75, "learning_rate": 3.048702286752553e-06, "loss": 20.4618, "step": 69590 }, { "epoch": 0.75, "learning_rate": 3.046185642343942e-06, "loss": 21.116, "step": 69600 }, { "epoch": 0.75, "learning_rate": 3.0436698504382945e-06, "loss": 21.3384, "step": 69610 }, { "epoch": 0.75, "learning_rate": 3.0411549113440354e-06, "loss": 20.818, "step": 69620 }, { "epoch": 0.75, "learning_rate": 3.0386408253694887e-06, "loss": 21.2933, "step": 69630 }, { "epoch": 0.75, "learning_rate": 3.036127592822866e-06, "loss": 21.3943, "step": 69640 }, { "epoch": 0.75, "learning_rate": 3.033615214012281e-06, "loss": 21.0696, "step": 69650 }, { "epoch": 0.75, "learning_rate": 3.0311036892457325e-06, "loss": 21.1022, "step": 69660 }, { "epoch": 0.75, "learning_rate": 3.0285930188311197e-06, "loss": 21.2767, "step": 69670 }, { "epoch": 0.75, "learning_rate": 3.0260832030762455e-06, "loss": 21.0394, "step": 69680 }, { "epoch": 0.75, "learning_rate": 3.023574242288797e-06, "loss": 21.0521, "step": 69690 }, { "epoch": 0.75, "learning_rate": 3.0210661367763618e-06, "loss": 21.0708, "step": 69700 }, { "epoch": 0.75, "learning_rate": 3.018558886846422e-06, "loss": 21.5525, "step": 69710 }, { "epoch": 0.75, "learning_rate": 3.016052492806346e-06, "loss": 20.8717, "step": 69720 }, { "epoch": 0.75, "learning_rate": 3.0135469549634143e-06, "loss": 21.065, "step": 69730 }, { "epoch": 0.75, "learning_rate": 3.01104227362479e-06, "loss": 21.206, "step": 69740 }, { "epoch": 0.75, "learning_rate": 3.0085384490975355e-06, "loss": 20.9858, "step": 69750 }, { "epoch": 0.75, "learning_rate": 3.0060354816886094e-06, "loss": 21.2765, "step": 69760 }, { "epoch": 0.75, "learning_rate": 3.003533371704853e-06, "loss": 21.0907, "step": 69770 }, { "epoch": 0.75, "learning_rate": 3.0010321194530244e-06, "loss": 20.7485, "step": 69780 }, { "epoch": 0.75, "learning_rate": 2.998531725239758e-06, "loss": 21.0193, "step": 69790 }, { "epoch": 0.75, "learning_rate": 2.9960321893715925e-06, "loss": 21.3623, "step": 69800 }, { "epoch": 0.75, "learning_rate": 2.9935335121549615e-06, "loss": 20.7843, "step": 69810 }, { "epoch": 0.75, "learning_rate": 2.9910356938961782e-06, "loss": 21.0811, "step": 69820 }, { "epoch": 0.75, "learning_rate": 2.988538734901475e-06, "loss": 21.4757, "step": 69830 }, { "epoch": 0.76, "learning_rate": 2.9860426354769635e-06, "loss": 21.2549, "step": 69840 }, { "epoch": 0.76, "learning_rate": 2.983547395928651e-06, "loss": 21.5767, "step": 69850 }, { "epoch": 0.76, "learning_rate": 2.9810530165624417e-06, "loss": 21.471, "step": 69860 }, { "epoch": 0.76, "learning_rate": 2.978559497684136e-06, "loss": 21.6347, "step": 69870 }, { "epoch": 0.76, "learning_rate": 2.976066839599425e-06, "loss": 21.4041, "step": 69880 }, { "epoch": 0.76, "learning_rate": 2.973575042613898e-06, "loss": 21.7531, "step": 69890 }, { "epoch": 0.76, "learning_rate": 2.9710841070330354e-06, "loss": 20.7581, "step": 69900 }, { "epoch": 0.76, "learning_rate": 2.9685940331622133e-06, "loss": 21.2824, "step": 69910 }, { "epoch": 0.76, "learning_rate": 2.9661048213067033e-06, "loss": 22.0812, "step": 69920 }, { "epoch": 0.76, "learning_rate": 2.96361647177167e-06, "loss": 20.5171, "step": 69930 }, { "epoch": 0.76, "learning_rate": 2.9611289848621716e-06, "loss": 21.3358, "step": 69940 }, { "epoch": 0.76, "learning_rate": 2.958642360883164e-06, "loss": 21.5653, "step": 69950 }, { "epoch": 0.76, "learning_rate": 2.9561566001394926e-06, "loss": 21.557, "step": 69960 }, { "epoch": 0.76, "learning_rate": 2.953671702935901e-06, "loss": 20.8047, "step": 69970 }, { "epoch": 0.76, "learning_rate": 2.9511876695770237e-06, "loss": 21.0306, "step": 69980 }, { "epoch": 0.76, "learning_rate": 2.948704500367392e-06, "loss": 21.2063, "step": 69990 }, { "epoch": 0.76, "learning_rate": 2.946222195611429e-06, "loss": 20.9739, "step": 70000 }, { "epoch": 0.76, "learning_rate": 2.9437407556134535e-06, "loss": 21.5459, "step": 70010 }, { "epoch": 0.76, "learning_rate": 2.9412601806776777e-06, "loss": 21.6832, "step": 70020 }, { "epoch": 0.76, "learning_rate": 2.938780471108208e-06, "loss": 21.879, "step": 70030 }, { "epoch": 0.76, "learning_rate": 2.9363016272090437e-06, "loss": 20.6818, "step": 70040 }, { "epoch": 0.76, "learning_rate": 2.9338236492840786e-06, "loss": 21.4156, "step": 70050 }, { "epoch": 0.76, "learning_rate": 2.931346537637102e-06, "loss": 21.0129, "step": 70060 }, { "epoch": 0.76, "learning_rate": 2.928870292571793e-06, "loss": 20.8555, "step": 70070 }, { "epoch": 0.76, "learning_rate": 2.926394914391729e-06, "loss": 21.5222, "step": 70080 }, { "epoch": 0.76, "learning_rate": 2.9239204034003777e-06, "loss": 21.6612, "step": 70090 }, { "epoch": 0.76, "learning_rate": 2.9214467599011033e-06, "loss": 21.5855, "step": 70100 }, { "epoch": 0.76, "learning_rate": 2.918973984197161e-06, "loss": 22.276, "step": 70110 }, { "epoch": 0.76, "learning_rate": 2.9165020765917006e-06, "loss": 21.3808, "step": 70120 }, { "epoch": 0.76, "learning_rate": 2.9140310373877655e-06, "loss": 21.5391, "step": 70130 }, { "epoch": 0.76, "learning_rate": 2.9115608668882944e-06, "loss": 21.0521, "step": 70140 }, { "epoch": 0.76, "learning_rate": 2.909091565396116e-06, "loss": 20.5077, "step": 70150 }, { "epoch": 0.76, "learning_rate": 2.906623133213956e-06, "loss": 21.7416, "step": 70160 }, { "epoch": 0.76, "learning_rate": 2.9041555706444303e-06, "loss": 21.815, "step": 70170 }, { "epoch": 0.76, "learning_rate": 2.901688877990051e-06, "loss": 21.2371, "step": 70180 }, { "epoch": 0.76, "learning_rate": 2.899223055553221e-06, "loss": 21.0307, "step": 70190 }, { "epoch": 0.76, "learning_rate": 2.896758103636239e-06, "loss": 21.1315, "step": 70200 }, { "epoch": 0.76, "learning_rate": 2.8942940225412965e-06, "loss": 20.9109, "step": 70210 }, { "epoch": 0.76, "learning_rate": 2.8918308125704754e-06, "loss": 20.7268, "step": 70220 }, { "epoch": 0.76, "learning_rate": 2.8893684740257545e-06, "loss": 20.9081, "step": 70230 }, { "epoch": 0.76, "learning_rate": 2.886907007209e-06, "loss": 21.3231, "step": 70240 }, { "epoch": 0.76, "learning_rate": 2.8844464124219864e-06, "loss": 20.3083, "step": 70250 }, { "epoch": 0.76, "learning_rate": 2.8819866899663596e-06, "loss": 21.8703, "step": 70260 }, { "epoch": 0.76, "learning_rate": 2.879527840143673e-06, "loss": 20.8531, "step": 70270 }, { "epoch": 0.76, "learning_rate": 2.8770698632553694e-06, "loss": 21.5681, "step": 70280 }, { "epoch": 0.76, "learning_rate": 2.874612759602782e-06, "loss": 21.0298, "step": 70290 }, { "epoch": 0.76, "learning_rate": 2.872156529487147e-06, "loss": 20.9407, "step": 70300 }, { "epoch": 0.76, "learning_rate": 2.869701173209578e-06, "loss": 20.8261, "step": 70310 }, { "epoch": 0.76, "learning_rate": 2.867246691071092e-06, "loss": 20.9938, "step": 70320 }, { "epoch": 0.76, "learning_rate": 2.8647930833725967e-06, "loss": 21.2198, "step": 70330 }, { "epoch": 0.76, "learning_rate": 2.8623403504148883e-06, "loss": 21.2053, "step": 70340 }, { "epoch": 0.76, "learning_rate": 2.8598884924986704e-06, "loss": 20.939, "step": 70350 }, { "epoch": 0.76, "learning_rate": 2.8574375099245178e-06, "loss": 21.357, "step": 70360 }, { "epoch": 0.76, "learning_rate": 2.8549874029929124e-06, "loss": 20.6826, "step": 70370 }, { "epoch": 0.76, "learning_rate": 2.8525381720042256e-06, "loss": 20.9969, "step": 70380 }, { "epoch": 0.76, "learning_rate": 2.8500898172587176e-06, "loss": 20.7901, "step": 70390 }, { "epoch": 0.76, "learning_rate": 2.84764233905655e-06, "loss": 20.8014, "step": 70400 }, { "epoch": 0.76, "learning_rate": 2.8451957376977713e-06, "loss": 21.0039, "step": 70410 }, { "epoch": 0.76, "learning_rate": 2.842750013482317e-06, "loss": 21.6039, "step": 70420 }, { "epoch": 0.76, "learning_rate": 2.8403051667100246e-06, "loss": 21.0858, "step": 70430 }, { "epoch": 0.76, "learning_rate": 2.837861197680615e-06, "loss": 20.8626, "step": 70440 }, { "epoch": 0.76, "learning_rate": 2.8354181066937147e-06, "loss": 21.4299, "step": 70450 }, { "epoch": 0.76, "learning_rate": 2.832975894048833e-06, "loss": 21.55, "step": 70460 }, { "epoch": 0.76, "learning_rate": 2.830534560045368e-06, "loss": 21.0701, "step": 70470 }, { "epoch": 0.76, "learning_rate": 2.8280941049826182e-06, "loss": 20.9331, "step": 70480 }, { "epoch": 0.76, "learning_rate": 2.825654529159767e-06, "loss": 21.5571, "step": 70490 }, { "epoch": 0.76, "learning_rate": 2.8232158328759017e-06, "loss": 20.9758, "step": 70500 }, { "epoch": 0.76, "learning_rate": 2.8207780164299904e-06, "loss": 20.6979, "step": 70510 }, { "epoch": 0.76, "learning_rate": 2.8183410801209e-06, "loss": 21.5427, "step": 70520 }, { "epoch": 0.76, "learning_rate": 2.8159050242473807e-06, "loss": 21.1863, "step": 70530 }, { "epoch": 0.76, "learning_rate": 2.8134698491080827e-06, "loss": 20.8047, "step": 70540 }, { "epoch": 0.76, "learning_rate": 2.811035555001549e-06, "loss": 21.6832, "step": 70550 }, { "epoch": 0.76, "learning_rate": 2.808602142226212e-06, "loss": 21.1807, "step": 70560 }, { "epoch": 0.76, "learning_rate": 2.806169611080398e-06, "loss": 20.9255, "step": 70570 }, { "epoch": 0.76, "learning_rate": 2.8037379618623163e-06, "loss": 21.5633, "step": 70580 }, { "epoch": 0.76, "learning_rate": 2.8013071948700767e-06, "loss": 20.9857, "step": 70590 }, { "epoch": 0.76, "learning_rate": 2.798877310401683e-06, "loss": 21.212, "step": 70600 }, { "epoch": 0.76, "learning_rate": 2.796448308755025e-06, "loss": 20.7781, "step": 70610 }, { "epoch": 0.76, "learning_rate": 2.7940201902278896e-06, "loss": 21.8408, "step": 70620 }, { "epoch": 0.76, "learning_rate": 2.7915929551179456e-06, "loss": 21.6595, "step": 70630 }, { "epoch": 0.76, "learning_rate": 2.7891666037227592e-06, "loss": 21.8592, "step": 70640 }, { "epoch": 0.76, "learning_rate": 2.7867411363397967e-06, "loss": 21.5928, "step": 70650 }, { "epoch": 0.76, "learning_rate": 2.784316553266403e-06, "loss": 20.9558, "step": 70660 }, { "epoch": 0.76, "learning_rate": 2.7818928547998224e-06, "loss": 21.1538, "step": 70670 }, { "epoch": 0.76, "learning_rate": 2.77947004123719e-06, "loss": 20.8624, "step": 70680 }, { "epoch": 0.76, "learning_rate": 2.777048112875521e-06, "loss": 21.3018, "step": 70690 }, { "epoch": 0.76, "learning_rate": 2.774627070011742e-06, "loss": 21.2433, "step": 70700 }, { "epoch": 0.76, "learning_rate": 2.7722069129426566e-06, "loss": 21.3082, "step": 70710 }, { "epoch": 0.76, "learning_rate": 2.769787641964965e-06, "loss": 20.7925, "step": 70720 }, { "epoch": 0.76, "learning_rate": 2.76736925737526e-06, "loss": 21.2665, "step": 70730 }, { "epoch": 0.76, "learning_rate": 2.764951759470016e-06, "loss": 21.1762, "step": 70740 }, { "epoch": 0.76, "learning_rate": 2.762535148545613e-06, "loss": 21.8038, "step": 70750 }, { "epoch": 0.76, "learning_rate": 2.7601194248983134e-06, "loss": 21.0255, "step": 70760 }, { "epoch": 0.77, "learning_rate": 2.7577045888242736e-06, "loss": 21.2689, "step": 70770 }, { "epoch": 0.77, "learning_rate": 2.7552906406195424e-06, "loss": 21.7702, "step": 70780 }, { "epoch": 0.77, "learning_rate": 2.752877580580049e-06, "loss": 21.7804, "step": 70790 }, { "epoch": 0.77, "learning_rate": 2.7504654090016326e-06, "loss": 20.9198, "step": 70800 }, { "epoch": 0.77, "learning_rate": 2.7480541261800096e-06, "loss": 21.0228, "step": 70810 }, { "epoch": 0.77, "learning_rate": 2.745643732410791e-06, "loss": 20.3788, "step": 70820 }, { "epoch": 0.77, "learning_rate": 2.7432342279894785e-06, "loss": 20.768, "step": 70830 }, { "epoch": 0.77, "learning_rate": 2.7408256132114674e-06, "loss": 21.1862, "step": 70840 }, { "epoch": 0.77, "learning_rate": 2.7384178883720393e-06, "loss": 21.3358, "step": 70850 }, { "epoch": 0.77, "learning_rate": 2.736011053766372e-06, "loss": 21.4138, "step": 70860 }, { "epoch": 0.77, "learning_rate": 2.733605109689529e-06, "loss": 20.388, "step": 70870 }, { "epoch": 0.77, "learning_rate": 2.7312000564364684e-06, "loss": 21.4519, "step": 70880 }, { "epoch": 0.77, "learning_rate": 2.7287958943020364e-06, "loss": 21.4463, "step": 70890 }, { "epoch": 0.77, "learning_rate": 2.7263926235809734e-06, "loss": 22.0158, "step": 70900 }, { "epoch": 0.77, "learning_rate": 2.7239902445679066e-06, "loss": 21.1306, "step": 70910 }, { "epoch": 0.77, "learning_rate": 2.7215887575573563e-06, "loss": 21.3291, "step": 70920 }, { "epoch": 0.77, "learning_rate": 2.7191881628437335e-06, "loss": 20.9354, "step": 70930 }, { "epoch": 0.77, "learning_rate": 2.716788460721338e-06, "loss": 21.8934, "step": 70940 }, { "epoch": 0.77, "learning_rate": 2.7143896514843627e-06, "loss": 21.0821, "step": 70950 }, { "epoch": 0.77, "learning_rate": 2.7119917354268875e-06, "loss": 21.3341, "step": 70960 }, { "epoch": 0.77, "learning_rate": 2.709594712842887e-06, "loss": 21.0917, "step": 70970 }, { "epoch": 0.77, "learning_rate": 2.7071985840262238e-06, "loss": 20.8151, "step": 70980 }, { "epoch": 0.77, "learning_rate": 2.7048033492706504e-06, "loss": 21.3773, "step": 70990 }, { "epoch": 0.77, "learning_rate": 2.7024090088698107e-06, "loss": 20.6906, "step": 71000 }, { "epoch": 0.77, "learning_rate": 2.700015563117241e-06, "loss": 21.5746, "step": 71010 }, { "epoch": 0.77, "learning_rate": 2.6976230123063628e-06, "loss": 21.1871, "step": 71020 }, { "epoch": 0.77, "learning_rate": 2.695231356730492e-06, "loss": 20.6741, "step": 71030 }, { "epoch": 0.77, "learning_rate": 2.6928405966828354e-06, "loss": 20.6226, "step": 71040 }, { "epoch": 0.77, "learning_rate": 2.6904507324564867e-06, "loss": 21.4346, "step": 71050 }, { "epoch": 0.77, "learning_rate": 2.6880617643444306e-06, "loss": 20.7316, "step": 71060 }, { "epoch": 0.77, "learning_rate": 2.6856736926395444e-06, "loss": 20.8746, "step": 71070 }, { "epoch": 0.77, "learning_rate": 2.6832865176345923e-06, "loss": 21.6572, "step": 71080 }, { "epoch": 0.77, "learning_rate": 2.6809002396222306e-06, "loss": 20.1102, "step": 71090 }, { "epoch": 0.77, "learning_rate": 2.678514858895006e-06, "loss": 21.0324, "step": 71100 }, { "epoch": 0.77, "learning_rate": 2.676130375745353e-06, "loss": 21.2532, "step": 71110 }, { "epoch": 0.77, "learning_rate": 2.673746790465598e-06, "loss": 20.4411, "step": 71120 }, { "epoch": 0.77, "learning_rate": 2.6713641033479563e-06, "loss": 21.142, "step": 71130 }, { "epoch": 0.77, "learning_rate": 2.668982314684534e-06, "loss": 21.4098, "step": 71140 }, { "epoch": 0.77, "learning_rate": 2.6666014247673256e-06, "loss": 20.6035, "step": 71150 }, { "epoch": 0.77, "learning_rate": 2.6642214338882178e-06, "loss": 21.347, "step": 71160 }, { "epoch": 0.77, "learning_rate": 2.661842342338984e-06, "loss": 21.2585, "step": 71170 }, { "epoch": 0.77, "learning_rate": 2.6594641504112894e-06, "loss": 21.0403, "step": 71180 }, { "epoch": 0.77, "learning_rate": 2.657086858396689e-06, "loss": 20.929, "step": 71190 }, { "epoch": 0.77, "learning_rate": 2.6547104665866265e-06, "loss": 20.7135, "step": 71200 }, { "epoch": 0.77, "learning_rate": 2.6523349752724337e-06, "loss": 20.7215, "step": 71210 }, { "epoch": 0.77, "learning_rate": 2.6499603847453415e-06, "loss": 21.4392, "step": 71220 }, { "epoch": 0.77, "learning_rate": 2.6475866952964547e-06, "loss": 21.8439, "step": 71230 }, { "epoch": 0.77, "learning_rate": 2.645213907216778e-06, "loss": 20.6769, "step": 71240 }, { "epoch": 0.77, "learning_rate": 2.642842020797205e-06, "loss": 20.832, "step": 71250 }, { "epoch": 0.77, "learning_rate": 2.6404710363285123e-06, "loss": 21.493, "step": 71260 }, { "epoch": 0.77, "learning_rate": 2.6381009541013814e-06, "loss": 21.6086, "step": 71270 }, { "epoch": 0.77, "learning_rate": 2.6357317744063627e-06, "loss": 21.2227, "step": 71280 }, { "epoch": 0.77, "learning_rate": 2.6333634975339083e-06, "loss": 20.4107, "step": 71290 }, { "epoch": 0.77, "learning_rate": 2.6309961237743587e-06, "loss": 20.9841, "step": 71300 }, { "epoch": 0.77, "learning_rate": 2.628629653417938e-06, "loss": 21.1619, "step": 71310 }, { "epoch": 0.77, "learning_rate": 2.6262640867547717e-06, "loss": 22.3196, "step": 71320 }, { "epoch": 0.77, "learning_rate": 2.6238994240748595e-06, "loss": 20.7387, "step": 71330 }, { "epoch": 0.77, "learning_rate": 2.621535665668099e-06, "loss": 21.4668, "step": 71340 }, { "epoch": 0.77, "learning_rate": 2.6191728118242766e-06, "loss": 21.1957, "step": 71350 }, { "epoch": 0.77, "learning_rate": 2.6168108628330615e-06, "loss": 21.0648, "step": 71360 }, { "epoch": 0.77, "learning_rate": 2.6144498189840227e-06, "loss": 20.8176, "step": 71370 }, { "epoch": 0.77, "learning_rate": 2.6120896805666153e-06, "loss": 21.1391, "step": 71380 }, { "epoch": 0.77, "learning_rate": 2.609730447870171e-06, "loss": 21.8212, "step": 71390 }, { "epoch": 0.77, "learning_rate": 2.6073721211839254e-06, "loss": 21.1105, "step": 71400 }, { "epoch": 0.77, "learning_rate": 2.605014700796994e-06, "loss": 22.2934, "step": 71410 }, { "epoch": 0.77, "learning_rate": 2.6026581869983903e-06, "loss": 21.4394, "step": 71420 }, { "epoch": 0.77, "learning_rate": 2.600302580077012e-06, "loss": 20.6801, "step": 71430 }, { "epoch": 0.77, "learning_rate": 2.5979478803216372e-06, "loss": 21.8891, "step": 71440 }, { "epoch": 0.77, "learning_rate": 2.5955940880209453e-06, "loss": 21.2833, "step": 71450 }, { "epoch": 0.77, "learning_rate": 2.593241203463495e-06, "loss": 22.0149, "step": 71460 }, { "epoch": 0.77, "learning_rate": 2.590889226937744e-06, "loss": 21.475, "step": 71470 }, { "epoch": 0.77, "learning_rate": 2.5885381587320347e-06, "loss": 20.9542, "step": 71480 }, { "epoch": 0.77, "learning_rate": 2.5861879991345894e-06, "loss": 21.7554, "step": 71490 }, { "epoch": 0.77, "learning_rate": 2.583838748433528e-06, "loss": 21.4303, "step": 71500 }, { "epoch": 0.77, "learning_rate": 2.5814904069168555e-06, "loss": 21.1708, "step": 71510 }, { "epoch": 0.77, "learning_rate": 2.5791429748724717e-06, "loss": 21.1314, "step": 71520 }, { "epoch": 0.77, "learning_rate": 2.576796452588157e-06, "loss": 21.4415, "step": 71530 }, { "epoch": 0.77, "learning_rate": 2.5744508403515878e-06, "loss": 20.7105, "step": 71540 }, { "epoch": 0.77, "learning_rate": 2.5721061384503165e-06, "loss": 21.0733, "step": 71550 }, { "epoch": 0.77, "learning_rate": 2.5697623471717938e-06, "loss": 21.554, "step": 71560 }, { "epoch": 0.77, "learning_rate": 2.5674194668033615e-06, "loss": 21.7315, "step": 71570 }, { "epoch": 0.77, "learning_rate": 2.5650774976322413e-06, "loss": 21.4855, "step": 71580 }, { "epoch": 0.77, "learning_rate": 2.5627364399455524e-06, "loss": 20.628, "step": 71590 }, { "epoch": 0.77, "learning_rate": 2.5603962940302886e-06, "loss": 21.4785, "step": 71600 }, { "epoch": 0.77, "learning_rate": 2.558057060173342e-06, "loss": 20.5674, "step": 71610 }, { "epoch": 0.77, "learning_rate": 2.555718738661496e-06, "loss": 21.3144, "step": 71620 }, { "epoch": 0.77, "learning_rate": 2.5533813297814124e-06, "loss": 21.2857, "step": 71630 }, { "epoch": 0.77, "learning_rate": 2.5510448338196493e-06, "loss": 20.7497, "step": 71640 }, { "epoch": 0.77, "learning_rate": 2.54870925106265e-06, "loss": 21.0201, "step": 71650 }, { "epoch": 0.77, "learning_rate": 2.546374581796737e-06, "loss": 21.0594, "step": 71660 }, { "epoch": 0.77, "learning_rate": 2.5440408263081385e-06, "loss": 21.1267, "step": 71670 }, { "epoch": 0.77, "learning_rate": 2.5417079848829585e-06, "loss": 21.8952, "step": 71680 }, { "epoch": 0.78, "learning_rate": 2.5393760578071903e-06, "loss": 21.2862, "step": 71690 }, { "epoch": 0.78, "learning_rate": 2.5370450453667206e-06, "loss": 21.5512, "step": 71700 }, { "epoch": 0.78, "learning_rate": 2.534714947847311e-06, "loss": 21.2137, "step": 71710 }, { "epoch": 0.78, "learning_rate": 2.5323857655346286e-06, "loss": 20.9632, "step": 71720 }, { "epoch": 0.78, "learning_rate": 2.5300574987142155e-06, "loss": 21.602, "step": 71730 }, { "epoch": 0.78, "learning_rate": 2.5277301476715075e-06, "loss": 21.3613, "step": 71740 }, { "epoch": 0.78, "learning_rate": 2.5254037126918285e-06, "loss": 21.2428, "step": 71750 }, { "epoch": 0.78, "learning_rate": 2.5230781940603777e-06, "loss": 20.9505, "step": 71760 }, { "epoch": 0.78, "learning_rate": 2.5207535920622627e-06, "loss": 21.6719, "step": 71770 }, { "epoch": 0.78, "learning_rate": 2.518429906982465e-06, "loss": 21.143, "step": 71780 }, { "epoch": 0.78, "learning_rate": 2.5161071391058555e-06, "loss": 20.9402, "step": 71790 }, { "epoch": 0.78, "learning_rate": 2.513785288717194e-06, "loss": 21.5128, "step": 71800 }, { "epoch": 0.78, "learning_rate": 2.5114643561011297e-06, "loss": 21.1862, "step": 71810 }, { "epoch": 0.78, "learning_rate": 2.509144341542197e-06, "loss": 20.7605, "step": 71820 }, { "epoch": 0.78, "learning_rate": 2.5068252453248154e-06, "loss": 21.5142, "step": 71830 }, { "epoch": 0.78, "learning_rate": 2.5045070677332974e-06, "loss": 21.0975, "step": 71840 }, { "epoch": 0.78, "learning_rate": 2.5021898090518394e-06, "loss": 21.114, "step": 71850 }, { "epoch": 0.78, "learning_rate": 2.4998734695645244e-06, "loss": 21.2715, "step": 71860 }, { "epoch": 0.78, "learning_rate": 2.497558049555325e-06, "loss": 21.104, "step": 71870 }, { "epoch": 0.78, "learning_rate": 2.4952435493081016e-06, "loss": 21.7593, "step": 71880 }, { "epoch": 0.78, "learning_rate": 2.492929969106598e-06, "loss": 21.6565, "step": 71890 }, { "epoch": 0.78, "learning_rate": 2.490617309234449e-06, "loss": 20.6015, "step": 71900 }, { "epoch": 0.78, "learning_rate": 2.4883055699751748e-06, "loss": 20.9079, "step": 71910 }, { "epoch": 0.78, "learning_rate": 2.4859947516121818e-06, "loss": 21.7016, "step": 71920 }, { "epoch": 0.78, "learning_rate": 2.483684854428767e-06, "loss": 21.218, "step": 71930 }, { "epoch": 0.78, "learning_rate": 2.481375878708112e-06, "loss": 21.6385, "step": 71940 }, { "epoch": 0.78, "learning_rate": 2.4790678247332843e-06, "loss": 20.9813, "step": 71950 }, { "epoch": 0.78, "learning_rate": 2.476760692787241e-06, "loss": 20.9671, "step": 71960 }, { "epoch": 0.78, "learning_rate": 2.474454483152825e-06, "loss": 21.256, "step": 71970 }, { "epoch": 0.78, "learning_rate": 2.472149196112764e-06, "loss": 21.5414, "step": 71980 }, { "epoch": 0.78, "learning_rate": 2.4698448319496782e-06, "loss": 20.5979, "step": 71990 }, { "epoch": 0.78, "learning_rate": 2.467541390946069e-06, "loss": 20.8142, "step": 72000 }, { "epoch": 0.78, "learning_rate": 2.465238873384326e-06, "loss": 20.8573, "step": 72010 }, { "epoch": 0.78, "learning_rate": 2.4629372795467276e-06, "loss": 21.2154, "step": 72020 }, { "epoch": 0.78, "learning_rate": 2.4606366097154387e-06, "loss": 21.4665, "step": 72030 }, { "epoch": 0.78, "learning_rate": 2.458336864172508e-06, "loss": 21.4272, "step": 72040 }, { "epoch": 0.78, "learning_rate": 2.4560380431998743e-06, "loss": 20.7833, "step": 72050 }, { "epoch": 0.78, "learning_rate": 2.4537401470793597e-06, "loss": 21.6762, "step": 72060 }, { "epoch": 0.78, "learning_rate": 2.451443176092675e-06, "loss": 20.7148, "step": 72070 }, { "epoch": 0.78, "learning_rate": 2.4491471305214234e-06, "loss": 20.9935, "step": 72080 }, { "epoch": 0.78, "learning_rate": 2.4468520106470807e-06, "loss": 20.8902, "step": 72090 }, { "epoch": 0.78, "learning_rate": 2.44455781675102e-06, "loss": 21.0103, "step": 72100 }, { "epoch": 0.78, "learning_rate": 2.442264549114498e-06, "loss": 21.0212, "step": 72110 }, { "epoch": 0.78, "learning_rate": 2.4399722080186562e-06, "loss": 22.0618, "step": 72120 }, { "epoch": 0.78, "learning_rate": 2.4376807937445314e-06, "loss": 21.0721, "step": 72130 }, { "epoch": 0.78, "learning_rate": 2.43539030657303e-06, "loss": 20.8875, "step": 72140 }, { "epoch": 0.78, "learning_rate": 2.43310074678496e-06, "loss": 21.6103, "step": 72150 }, { "epoch": 0.78, "learning_rate": 2.4308121146610086e-06, "loss": 22.1143, "step": 72160 }, { "epoch": 0.78, "learning_rate": 2.4285244104817474e-06, "loss": 21.0044, "step": 72170 }, { "epoch": 0.78, "learning_rate": 2.4262376345276428e-06, "loss": 21.3217, "step": 72180 }, { "epoch": 0.78, "learning_rate": 2.423951787079044e-06, "loss": 21.8203, "step": 72190 }, { "epoch": 0.78, "learning_rate": 2.4216668684161783e-06, "loss": 21.7266, "step": 72200 }, { "epoch": 0.78, "learning_rate": 2.4193828788191664e-06, "loss": 21.339, "step": 72210 }, { "epoch": 0.78, "learning_rate": 2.4170998185680128e-06, "loss": 21.8391, "step": 72220 }, { "epoch": 0.78, "learning_rate": 2.4148176879426143e-06, "loss": 21.8251, "step": 72230 }, { "epoch": 0.78, "learning_rate": 2.41253648722275e-06, "loss": 20.512, "step": 72240 }, { "epoch": 0.78, "learning_rate": 2.4102562166880762e-06, "loss": 21.3917, "step": 72250 }, { "epoch": 0.78, "learning_rate": 2.4079768766181456e-06, "loss": 20.9543, "step": 72260 }, { "epoch": 0.78, "learning_rate": 2.4056984672923934e-06, "loss": 21.3883, "step": 72270 }, { "epoch": 0.78, "learning_rate": 2.403420988990145e-06, "loss": 21.0125, "step": 72280 }, { "epoch": 0.78, "learning_rate": 2.4011444419906083e-06, "loss": 21.6429, "step": 72290 }, { "epoch": 0.78, "learning_rate": 2.398868826572871e-06, "loss": 21.1271, "step": 72300 }, { "epoch": 0.78, "learning_rate": 2.3965941430159146e-06, "loss": 21.1421, "step": 72310 }, { "epoch": 0.78, "learning_rate": 2.394320391598601e-06, "loss": 20.7343, "step": 72320 }, { "epoch": 0.78, "learning_rate": 2.3920475725996882e-06, "loss": 21.5704, "step": 72330 }, { "epoch": 0.78, "learning_rate": 2.3897756862978084e-06, "loss": 21.3059, "step": 72340 }, { "epoch": 0.78, "learning_rate": 2.387504732971485e-06, "loss": 21.4623, "step": 72350 }, { "epoch": 0.78, "learning_rate": 2.3852347128991227e-06, "loss": 21.2139, "step": 72360 }, { "epoch": 0.78, "learning_rate": 2.3829656263590127e-06, "loss": 20.5559, "step": 72370 }, { "epoch": 0.78, "learning_rate": 2.38069747362934e-06, "loss": 21.0004, "step": 72380 }, { "epoch": 0.78, "learning_rate": 2.3784302549881654e-06, "loss": 20.7748, "step": 72390 }, { "epoch": 0.78, "learning_rate": 2.376163970713442e-06, "loss": 21.1839, "step": 72400 }, { "epoch": 0.78, "learning_rate": 2.3738986210829997e-06, "loss": 21.7636, "step": 72410 }, { "epoch": 0.78, "learning_rate": 2.37163420637456e-06, "loss": 20.9481, "step": 72420 }, { "epoch": 0.78, "learning_rate": 2.3693707268657283e-06, "loss": 20.6555, "step": 72430 }, { "epoch": 0.78, "learning_rate": 2.3671081828340005e-06, "loss": 21.1911, "step": 72440 }, { "epoch": 0.78, "learning_rate": 2.364846574556754e-06, "loss": 21.4458, "step": 72450 }, { "epoch": 0.78, "learning_rate": 2.362585902311244e-06, "loss": 21.8913, "step": 72460 }, { "epoch": 0.78, "learning_rate": 2.36032616637462e-06, "loss": 21.1128, "step": 72470 }, { "epoch": 0.78, "learning_rate": 2.358067367023914e-06, "loss": 20.9087, "step": 72480 }, { "epoch": 0.78, "learning_rate": 2.355809504536046e-06, "loss": 21.4711, "step": 72490 }, { "epoch": 0.78, "learning_rate": 2.353552579187819e-06, "loss": 21.0017, "step": 72500 }, { "epoch": 0.78, "learning_rate": 2.3512965912559203e-06, "loss": 21.6985, "step": 72510 }, { "epoch": 0.78, "learning_rate": 2.349041541016921e-06, "loss": 20.8767, "step": 72520 }, { "epoch": 0.78, "learning_rate": 2.3467874287472748e-06, "loss": 21.0826, "step": 72530 }, { "epoch": 0.78, "learning_rate": 2.344534254723334e-06, "loss": 21.1398, "step": 72540 }, { "epoch": 0.78, "learning_rate": 2.3422820192213213e-06, "loss": 21.704, "step": 72550 }, { "epoch": 0.78, "learning_rate": 2.3400307225173536e-06, "loss": 20.9729, "step": 72560 }, { "epoch": 0.78, "learning_rate": 2.337780364887422e-06, "loss": 21.6356, "step": 72570 }, { "epoch": 0.78, "learning_rate": 2.3355309466074096e-06, "loss": 21.3496, "step": 72580 }, { "epoch": 0.78, "learning_rate": 2.3332824679530897e-06, "loss": 21.2996, "step": 72590 }, { "epoch": 0.78, "learning_rate": 2.331034929200112e-06, "loss": 20.8901, "step": 72600 }, { "epoch": 0.78, "learning_rate": 2.3287883306240124e-06, "loss": 21.5065, "step": 72610 }, { "epoch": 0.79, "learning_rate": 2.3265426725002173e-06, "loss": 22.2101, "step": 72620 }, { "epoch": 0.79, "learning_rate": 2.3242979551040222e-06, "loss": 21.3885, "step": 72630 }, { "epoch": 0.79, "learning_rate": 2.32205417871063e-06, "loss": 21.6106, "step": 72640 }, { "epoch": 0.79, "learning_rate": 2.319811343595111e-06, "loss": 21.894, "step": 72650 }, { "epoch": 0.79, "learning_rate": 2.3175694500324265e-06, "loss": 20.4233, "step": 72660 }, { "epoch": 0.79, "learning_rate": 2.3153284982974245e-06, "loss": 20.8938, "step": 72670 }, { "epoch": 0.79, "learning_rate": 2.3130884886648252e-06, "loss": 21.1921, "step": 72680 }, { "epoch": 0.79, "learning_rate": 2.3108494214092524e-06, "loss": 21.1687, "step": 72690 }, { "epoch": 0.79, "learning_rate": 2.308611296805201e-06, "loss": 21.0231, "step": 72700 }, { "epoch": 0.79, "learning_rate": 2.3063741151270535e-06, "loss": 20.6539, "step": 72710 }, { "epoch": 0.79, "learning_rate": 2.3041378766490808e-06, "loss": 20.953, "step": 72720 }, { "epoch": 0.79, "learning_rate": 2.3019025816454254e-06, "loss": 20.4631, "step": 72730 }, { "epoch": 0.79, "learning_rate": 2.299668230390133e-06, "loss": 20.3539, "step": 72740 }, { "epoch": 0.79, "learning_rate": 2.2974348231571196e-06, "loss": 21.4515, "step": 72750 }, { "epoch": 0.79, "learning_rate": 2.295202360220191e-06, "loss": 21.4518, "step": 72760 }, { "epoch": 0.79, "learning_rate": 2.292970841853036e-06, "loss": 21.2769, "step": 72770 }, { "epoch": 0.79, "learning_rate": 2.2907402683292268e-06, "loss": 20.8285, "step": 72780 }, { "epoch": 0.79, "learning_rate": 2.28851063992222e-06, "loss": 20.7743, "step": 72790 }, { "epoch": 0.79, "learning_rate": 2.2862819569053594e-06, "loss": 21.1933, "step": 72800 }, { "epoch": 0.79, "learning_rate": 2.2840542195518677e-06, "loss": 21.2492, "step": 72810 }, { "epoch": 0.79, "learning_rate": 2.2818274281348564e-06, "loss": 21.2534, "step": 72820 }, { "epoch": 0.79, "learning_rate": 2.279601582927318e-06, "loss": 21.7071, "step": 72830 }, { "epoch": 0.79, "learning_rate": 2.2773766842021306e-06, "loss": 21.6032, "step": 72840 }, { "epoch": 0.79, "learning_rate": 2.2751527322320543e-06, "loss": 21.3568, "step": 72850 }, { "epoch": 0.79, "learning_rate": 2.2729297272897368e-06, "loss": 21.5719, "step": 72860 }, { "epoch": 0.79, "learning_rate": 2.270707669647706e-06, "loss": 21.0404, "step": 72870 }, { "epoch": 0.79, "learning_rate": 2.2684865595783744e-06, "loss": 21.5598, "step": 72880 }, { "epoch": 0.79, "learning_rate": 2.26626639735404e-06, "loss": 21.1832, "step": 72890 }, { "epoch": 0.79, "learning_rate": 2.2640471832468847e-06, "loss": 21.3533, "step": 72900 }, { "epoch": 0.79, "learning_rate": 2.261828917528971e-06, "loss": 20.6612, "step": 72910 }, { "epoch": 0.79, "learning_rate": 2.259611600472248e-06, "loss": 21.3444, "step": 72920 }, { "epoch": 0.79, "learning_rate": 2.2573952323485484e-06, "loss": 20.8718, "step": 72930 }, { "epoch": 0.79, "learning_rate": 2.2551798134295867e-06, "loss": 20.8636, "step": 72940 }, { "epoch": 0.79, "learning_rate": 2.2529653439869624e-06, "loss": 21.1152, "step": 72950 }, { "epoch": 0.79, "learning_rate": 2.25075182429216e-06, "loss": 20.9619, "step": 72960 }, { "epoch": 0.79, "learning_rate": 2.2485392546165443e-06, "loss": 21.0107, "step": 72970 }, { "epoch": 0.79, "learning_rate": 2.2463276352313657e-06, "loss": 21.2394, "step": 72980 }, { "epoch": 0.79, "learning_rate": 2.244116966407759e-06, "loss": 21.1001, "step": 72990 }, { "epoch": 0.79, "learning_rate": 2.241907248416738e-06, "loss": 21.4275, "step": 73000 }, { "epoch": 0.79, "learning_rate": 2.2396984815292065e-06, "loss": 21.2787, "step": 73010 }, { "epoch": 0.79, "learning_rate": 2.2374906660159467e-06, "loss": 20.9037, "step": 73020 }, { "epoch": 0.79, "learning_rate": 2.2352838021476263e-06, "loss": 21.9927, "step": 73030 }, { "epoch": 0.79, "learning_rate": 2.2330778901947912e-06, "loss": 20.7764, "step": 73040 }, { "epoch": 0.79, "learning_rate": 2.2308729304278863e-06, "loss": 21.3873, "step": 73050 }, { "epoch": 0.79, "learning_rate": 2.22866892311722e-06, "loss": 21.1826, "step": 73060 }, { "epoch": 0.79, "learning_rate": 2.226465868532993e-06, "loss": 20.3783, "step": 73070 }, { "epoch": 0.79, "learning_rate": 2.2242637669452906e-06, "loss": 21.7554, "step": 73080 }, { "epoch": 0.79, "learning_rate": 2.222062618624077e-06, "loss": 20.6538, "step": 73090 }, { "epoch": 0.79, "learning_rate": 2.2198624238392088e-06, "loss": 21.4207, "step": 73100 }, { "epoch": 0.79, "learning_rate": 2.2176631828604123e-06, "loss": 21.402, "step": 73110 }, { "epoch": 0.79, "learning_rate": 2.2154648959573057e-06, "loss": 20.9639, "step": 73120 }, { "epoch": 0.79, "learning_rate": 2.213267563399386e-06, "loss": 20.7598, "step": 73130 }, { "epoch": 0.79, "learning_rate": 2.2110711854560365e-06, "loss": 20.8672, "step": 73140 }, { "epoch": 0.79, "learning_rate": 2.2088757623965263e-06, "loss": 21.6796, "step": 73150 }, { "epoch": 0.79, "learning_rate": 2.2066812944899985e-06, "loss": 20.8388, "step": 73160 }, { "epoch": 0.79, "learning_rate": 2.2044877820054843e-06, "loss": 21.369, "step": 73170 }, { "epoch": 0.79, "learning_rate": 2.202295225211898e-06, "loss": 20.6186, "step": 73180 }, { "epoch": 0.79, "learning_rate": 2.2001036243780337e-06, "loss": 21.0991, "step": 73190 }, { "epoch": 0.79, "learning_rate": 2.1979129797725774e-06, "loss": 21.2716, "step": 73200 }, { "epoch": 0.79, "learning_rate": 2.195723291664088e-06, "loss": 21.2374, "step": 73210 }, { "epoch": 0.79, "learning_rate": 2.193534560321008e-06, "loss": 20.7152, "step": 73220 }, { "epoch": 0.79, "learning_rate": 2.191346786011667e-06, "loss": 21.3544, "step": 73230 }, { "epoch": 0.79, "learning_rate": 2.189159969004271e-06, "loss": 21.4633, "step": 73240 }, { "epoch": 0.79, "learning_rate": 2.1869741095669196e-06, "loss": 21.1478, "step": 73250 }, { "epoch": 0.79, "learning_rate": 2.184789207967587e-06, "loss": 21.3062, "step": 73260 }, { "epoch": 0.79, "learning_rate": 2.182605264474128e-06, "loss": 21.3337, "step": 73270 }, { "epoch": 0.79, "learning_rate": 2.180422279354284e-06, "loss": 21.2151, "step": 73280 }, { "epoch": 0.79, "learning_rate": 2.1782402528756763e-06, "loss": 21.3556, "step": 73290 }, { "epoch": 0.79, "learning_rate": 2.1760591853058156e-06, "loss": 20.8794, "step": 73300 }, { "epoch": 0.79, "learning_rate": 2.1738790769120876e-06, "loss": 21.5203, "step": 73310 }, { "epoch": 0.79, "learning_rate": 2.1716999279617646e-06, "loss": 21.2266, "step": 73320 }, { "epoch": 0.79, "learning_rate": 2.169521738721995e-06, "loss": 21.4679, "step": 73330 }, { "epoch": 0.79, "learning_rate": 2.1673445094598122e-06, "loss": 21.2267, "step": 73340 }, { "epoch": 0.79, "learning_rate": 2.1651682404421415e-06, "loss": 21.2943, "step": 73350 }, { "epoch": 0.79, "learning_rate": 2.162992931935778e-06, "loss": 21.6061, "step": 73360 }, { "epoch": 0.79, "learning_rate": 2.160818584207407e-06, "loss": 21.5092, "step": 73370 }, { "epoch": 0.79, "learning_rate": 2.1586451975235866e-06, "loss": 21.3842, "step": 73380 }, { "epoch": 0.79, "learning_rate": 2.156472772150765e-06, "loss": 22.1101, "step": 73390 }, { "epoch": 0.79, "learning_rate": 2.1543013083552744e-06, "loss": 21.2009, "step": 73400 }, { "epoch": 0.79, "learning_rate": 2.1521308064033243e-06, "loss": 21.5604, "step": 73410 }, { "epoch": 0.79, "learning_rate": 2.149961266561008e-06, "loss": 21.1055, "step": 73420 }, { "epoch": 0.79, "learning_rate": 2.147792689094297e-06, "loss": 21.4803, "step": 73430 }, { "epoch": 0.79, "learning_rate": 2.1456250742690464e-06, "loss": 20.4337, "step": 73440 }, { "epoch": 0.79, "learning_rate": 2.143458422351001e-06, "loss": 21.0545, "step": 73450 }, { "epoch": 0.79, "learning_rate": 2.1412927336057797e-06, "loss": 21.047, "step": 73460 }, { "epoch": 0.79, "learning_rate": 2.139128008298884e-06, "loss": 21.2785, "step": 73470 }, { "epoch": 0.79, "learning_rate": 2.1369642466957018e-06, "loss": 21.5073, "step": 73480 }, { "epoch": 0.79, "learning_rate": 2.134801449061491e-06, "loss": 20.7255, "step": 73490 }, { "epoch": 0.79, "learning_rate": 2.132639615661407e-06, "loss": 21.5969, "step": 73500 }, { "epoch": 0.79, "learning_rate": 2.1304787467604793e-06, "loss": 20.8541, "step": 73510 }, { "epoch": 0.79, "learning_rate": 2.128318842623618e-06, "loss": 20.9817, "step": 73520 }, { "epoch": 0.79, "learning_rate": 2.126159903515619e-06, "loss": 21.5137, "step": 73530 }, { "epoch": 0.8, "learning_rate": 2.1240019297011506e-06, "loss": 21.0353, "step": 73540 }, { "epoch": 0.8, "learning_rate": 2.121844921444778e-06, "loss": 20.4086, "step": 73550 }, { "epoch": 0.8, "learning_rate": 2.119688879010935e-06, "loss": 21.0493, "step": 73560 }, { "epoch": 0.8, "learning_rate": 2.1175338026639426e-06, "loss": 20.9756, "step": 73570 }, { "epoch": 0.8, "learning_rate": 2.1153796926680038e-06, "loss": 21.3972, "step": 73580 }, { "epoch": 0.8, "learning_rate": 2.1132265492871997e-06, "loss": 20.3051, "step": 73590 }, { "epoch": 0.8, "learning_rate": 2.1110743727854966e-06, "loss": 21.8559, "step": 73600 }, { "epoch": 0.8, "learning_rate": 2.108923163426739e-06, "loss": 22.1853, "step": 73610 }, { "epoch": 0.8, "learning_rate": 2.106772921474656e-06, "loss": 21.2946, "step": 73620 }, { "epoch": 0.8, "learning_rate": 2.104623647192855e-06, "loss": 21.2945, "step": 73630 }, { "epoch": 0.8, "learning_rate": 2.1024753408448274e-06, "loss": 21.9708, "step": 73640 }, { "epoch": 0.8, "learning_rate": 2.100328002693944e-06, "loss": 21.143, "step": 73650 }, { "epoch": 0.8, "learning_rate": 2.0981816330034587e-06, "loss": 20.8785, "step": 73660 }, { "epoch": 0.8, "learning_rate": 2.096036232036506e-06, "loss": 21.8177, "step": 73670 }, { "epoch": 0.8, "learning_rate": 2.0938918000561006e-06, "loss": 21.3757, "step": 73680 }, { "epoch": 0.8, "learning_rate": 2.091748337325138e-06, "loss": 21.1812, "step": 73690 }, { "epoch": 0.8, "learning_rate": 2.0896058441063982e-06, "loss": 21.6962, "step": 73700 }, { "epoch": 0.8, "learning_rate": 2.087464320662539e-06, "loss": 21.3663, "step": 73710 }, { "epoch": 0.8, "learning_rate": 2.085323767256101e-06, "loss": 20.7049, "step": 73720 }, { "epoch": 0.8, "learning_rate": 2.083184184149506e-06, "loss": 20.9936, "step": 73730 }, { "epoch": 0.8, "learning_rate": 2.0810455716050537e-06, "loss": 21.5305, "step": 73740 }, { "epoch": 0.8, "learning_rate": 2.07890792988493e-06, "loss": 20.8067, "step": 73750 }, { "epoch": 0.8, "learning_rate": 2.076771259251198e-06, "loss": 21.0313, "step": 73760 }, { "epoch": 0.8, "learning_rate": 2.074635559965803e-06, "loss": 21.213, "step": 73770 }, { "epoch": 0.8, "learning_rate": 2.0725008322905714e-06, "loss": 21.1816, "step": 73780 }, { "epoch": 0.8, "learning_rate": 2.0703670764872097e-06, "loss": 20.8541, "step": 73790 }, { "epoch": 0.8, "learning_rate": 2.068234292817305e-06, "loss": 20.9177, "step": 73800 }, { "epoch": 0.8, "learning_rate": 2.066102481542328e-06, "loss": 21.4716, "step": 73810 }, { "epoch": 0.8, "learning_rate": 2.063971642923626e-06, "loss": 21.017, "step": 73820 }, { "epoch": 0.8, "learning_rate": 2.061841777222431e-06, "loss": 21.3492, "step": 73830 }, { "epoch": 0.8, "learning_rate": 2.0597128846998513e-06, "loss": 21.4552, "step": 73840 }, { "epoch": 0.8, "learning_rate": 2.0575849656168822e-06, "loss": 21.8994, "step": 73850 }, { "epoch": 0.8, "learning_rate": 2.0554580202343933e-06, "loss": 21.4231, "step": 73860 }, { "epoch": 0.8, "learning_rate": 2.053332048813138e-06, "loss": 21.4656, "step": 73870 }, { "epoch": 0.8, "learning_rate": 2.0512070516137505e-06, "loss": 21.4089, "step": 73880 }, { "epoch": 0.8, "learning_rate": 2.0490830288967443e-06, "loss": 21.5401, "step": 73890 }, { "epoch": 0.8, "learning_rate": 2.046959980922514e-06, "loss": 21.6002, "step": 73900 }, { "epoch": 0.8, "learning_rate": 2.0448379079513347e-06, "loss": 21.6933, "step": 73910 }, { "epoch": 0.8, "learning_rate": 2.0427168102433625e-06, "loss": 21.4285, "step": 73920 }, { "epoch": 0.8, "learning_rate": 2.0405966880586327e-06, "loss": 21.968, "step": 73930 }, { "epoch": 0.8, "learning_rate": 2.038477541657061e-06, "loss": 21.3975, "step": 73940 }, { "epoch": 0.8, "learning_rate": 2.0363593712984463e-06, "loss": 21.8667, "step": 73950 }, { "epoch": 0.8, "learning_rate": 2.0342421772424635e-06, "loss": 20.4238, "step": 73960 }, { "epoch": 0.8, "learning_rate": 2.032125959748672e-06, "loss": 21.1173, "step": 73970 }, { "epoch": 0.8, "learning_rate": 2.0300107190765083e-06, "loss": 21.3845, "step": 73980 }, { "epoch": 0.8, "learning_rate": 2.027896455485291e-06, "loss": 21.055, "step": 73990 }, { "epoch": 0.8, "learning_rate": 2.025783169234217e-06, "loss": 21.0598, "step": 74000 }, { "epoch": 0.8, "learning_rate": 2.023670860582364e-06, "loss": 20.9647, "step": 74010 }, { "epoch": 0.8, "learning_rate": 2.021559529788697e-06, "loss": 20.5109, "step": 74020 }, { "epoch": 0.8, "learning_rate": 2.019449177112046e-06, "loss": 20.8857, "step": 74030 }, { "epoch": 0.8, "learning_rate": 2.0173398028111347e-06, "loss": 20.1355, "step": 74040 }, { "epoch": 0.8, "learning_rate": 2.0152314071445613e-06, "loss": 21.6676, "step": 74050 }, { "epoch": 0.8, "learning_rate": 2.0131239903708e-06, "loss": 20.7158, "step": 74060 }, { "epoch": 0.8, "learning_rate": 2.011017552748219e-06, "loss": 21.8655, "step": 74070 }, { "epoch": 0.8, "learning_rate": 2.0089120945350495e-06, "loss": 22.1915, "step": 74080 }, { "epoch": 0.8, "learning_rate": 2.0068076159894113e-06, "loss": 21.3286, "step": 74090 }, { "epoch": 0.8, "learning_rate": 2.004704117369304e-06, "loss": 20.9513, "step": 74100 }, { "epoch": 0.8, "learning_rate": 2.002601598932604e-06, "loss": 21.6017, "step": 74110 }, { "epoch": 0.8, "learning_rate": 2.0005000609370763e-06, "loss": 21.064, "step": 74120 }, { "epoch": 0.8, "learning_rate": 1.9983995036403516e-06, "loss": 21.0182, "step": 74130 }, { "epoch": 0.8, "learning_rate": 1.9962999272999506e-06, "loss": 21.2326, "step": 74140 }, { "epoch": 0.8, "learning_rate": 1.99420133217327e-06, "loss": 21.497, "step": 74150 }, { "epoch": 0.8, "learning_rate": 1.9921037185175864e-06, "loss": 20.9357, "step": 74160 }, { "epoch": 0.8, "learning_rate": 1.99000708659006e-06, "loss": 22.1159, "step": 74170 }, { "epoch": 0.8, "learning_rate": 1.9879114366477283e-06, "loss": 21.648, "step": 74180 }, { "epoch": 0.8, "learning_rate": 1.9858167689475016e-06, "loss": 21.1989, "step": 74190 }, { "epoch": 0.8, "learning_rate": 1.9837230837461794e-06, "loss": 21.9061, "step": 74200 }, { "epoch": 0.8, "learning_rate": 1.9816303813004335e-06, "loss": 21.3189, "step": 74210 }, { "epoch": 0.8, "learning_rate": 1.9795386618668245e-06, "loss": 21.139, "step": 74220 }, { "epoch": 0.8, "learning_rate": 1.9774479257017876e-06, "loss": 21.099, "step": 74230 }, { "epoch": 0.8, "learning_rate": 1.97535817306163e-06, "loss": 20.9676, "step": 74240 }, { "epoch": 0.8, "learning_rate": 1.973269404202548e-06, "loss": 20.7339, "step": 74250 }, { "epoch": 0.8, "learning_rate": 1.971181619380611e-06, "loss": 20.9365, "step": 74260 }, { "epoch": 0.8, "learning_rate": 1.9690948188517776e-06, "loss": 21.3356, "step": 74270 }, { "epoch": 0.8, "learning_rate": 1.967009002871877e-06, "loss": 20.7796, "step": 74280 }, { "epoch": 0.8, "learning_rate": 1.9649241716966195e-06, "loss": 21.1664, "step": 74290 }, { "epoch": 0.8, "learning_rate": 1.9628403255815933e-06, "loss": 21.0313, "step": 74300 }, { "epoch": 0.8, "learning_rate": 1.9607574647822648e-06, "loss": 21.3552, "step": 74310 }, { "epoch": 0.8, "learning_rate": 1.958675589553989e-06, "loss": 22.3462, "step": 74320 }, { "epoch": 0.8, "learning_rate": 1.95659470015199e-06, "loss": 21.3757, "step": 74330 }, { "epoch": 0.8, "learning_rate": 1.954514796831378e-06, "loss": 21.445, "step": 74340 }, { "epoch": 0.8, "learning_rate": 1.9524358798471333e-06, "loss": 21.9438, "step": 74350 }, { "epoch": 0.8, "learning_rate": 1.950357949454119e-06, "loss": 20.9335, "step": 74360 }, { "epoch": 0.8, "learning_rate": 1.9482810059070877e-06, "loss": 21.2089, "step": 74370 }, { "epoch": 0.8, "learning_rate": 1.9462050494606564e-06, "loss": 20.6936, "step": 74380 }, { "epoch": 0.8, "learning_rate": 1.9441300803693318e-06, "loss": 20.7745, "step": 74390 }, { "epoch": 0.8, "learning_rate": 1.942056098887489e-06, "loss": 20.7428, "step": 74400 }, { "epoch": 0.8, "learning_rate": 1.939983105269386e-06, "loss": 21.8648, "step": 74410 }, { "epoch": 0.8, "learning_rate": 1.9379110997691697e-06, "loss": 21.3864, "step": 74420 }, { "epoch": 0.8, "learning_rate": 1.935840082640853e-06, "loss": 21.206, "step": 74430 }, { "epoch": 0.8, "learning_rate": 1.933770054138333e-06, "loss": 21.0275, "step": 74440 }, { "epoch": 0.8, "learning_rate": 1.931701014515388e-06, "loss": 20.9642, "step": 74450 }, { "epoch": 0.8, "learning_rate": 1.929632964025663e-06, "loss": 21.0713, "step": 74460 }, { "epoch": 0.81, "learning_rate": 1.9275659029226977e-06, "loss": 20.9457, "step": 74470 }, { "epoch": 0.81, "learning_rate": 1.9254998314599037e-06, "loss": 20.8503, "step": 74480 }, { "epoch": 0.81, "learning_rate": 1.9234347498905694e-06, "loss": 21.4841, "step": 74490 }, { "epoch": 0.81, "learning_rate": 1.921370658467865e-06, "loss": 21.0471, "step": 74500 }, { "epoch": 0.81, "learning_rate": 1.919307557444832e-06, "loss": 21.7458, "step": 74510 }, { "epoch": 0.81, "learning_rate": 1.9172454470744028e-06, "loss": 21.096, "step": 74520 }, { "epoch": 0.81, "learning_rate": 1.915184327609381e-06, "loss": 21.1768, "step": 74530 }, { "epoch": 0.81, "learning_rate": 1.9131241993024464e-06, "loss": 21.9656, "step": 74540 }, { "epoch": 0.81, "learning_rate": 1.911065062406163e-06, "loss": 20.5749, "step": 74550 }, { "epoch": 0.81, "learning_rate": 1.9090069171729708e-06, "loss": 21.5996, "step": 74560 }, { "epoch": 0.81, "learning_rate": 1.906949763855187e-06, "loss": 20.8425, "step": 74570 }, { "epoch": 0.81, "learning_rate": 1.904893602705009e-06, "loss": 21.4364, "step": 74580 }, { "epoch": 0.81, "learning_rate": 1.902838433974511e-06, "loss": 20.3944, "step": 74590 }, { "epoch": 0.81, "learning_rate": 1.9007842579156477e-06, "loss": 22.3281, "step": 74600 }, { "epoch": 0.81, "learning_rate": 1.89873107478025e-06, "loss": 21.2357, "step": 74610 }, { "epoch": 0.81, "learning_rate": 1.896678884820029e-06, "loss": 20.6485, "step": 74620 }, { "epoch": 0.81, "learning_rate": 1.894627688286571e-06, "loss": 21.3076, "step": 74630 }, { "epoch": 0.81, "learning_rate": 1.892577485431344e-06, "loss": 22.1211, "step": 74640 }, { "epoch": 0.81, "learning_rate": 1.890528276505692e-06, "loss": 22.1281, "step": 74650 }, { "epoch": 0.81, "learning_rate": 1.888480061760839e-06, "loss": 21.3948, "step": 74660 }, { "epoch": 0.81, "learning_rate": 1.8864328414478838e-06, "loss": 21.6138, "step": 74670 }, { "epoch": 0.81, "learning_rate": 1.884386615817807e-06, "loss": 21.225, "step": 74680 }, { "epoch": 0.81, "learning_rate": 1.8823413851214656e-06, "loss": 21.26, "step": 74690 }, { "epoch": 0.81, "learning_rate": 1.8802971496095935e-06, "loss": 20.6816, "step": 74700 }, { "epoch": 0.81, "learning_rate": 1.8782539095328056e-06, "loss": 21.2184, "step": 74710 }, { "epoch": 0.81, "learning_rate": 1.8762116651415907e-06, "loss": 21.4431, "step": 74720 }, { "epoch": 0.81, "learning_rate": 1.8741704166863195e-06, "loss": 20.6697, "step": 74730 }, { "epoch": 0.81, "learning_rate": 1.8721301644172385e-06, "loss": 21.7652, "step": 74740 }, { "epoch": 0.81, "learning_rate": 1.8700909085844732e-06, "loss": 21.8443, "step": 74750 }, { "epoch": 0.81, "learning_rate": 1.8680526494380236e-06, "loss": 21.3747, "step": 74760 }, { "epoch": 0.81, "learning_rate": 1.8660153872277731e-06, "loss": 21.1415, "step": 74770 }, { "epoch": 0.81, "learning_rate": 1.8639791222034786e-06, "loss": 21.2047, "step": 74780 }, { "epoch": 0.81, "learning_rate": 1.861943854614775e-06, "loss": 20.8623, "step": 74790 }, { "epoch": 0.81, "learning_rate": 1.8599095847111782e-06, "loss": 20.5721, "step": 74800 }, { "epoch": 0.81, "learning_rate": 1.8578763127420774e-06, "loss": 20.8274, "step": 74810 }, { "epoch": 0.81, "learning_rate": 1.8558440389567434e-06, "loss": 20.9154, "step": 74820 }, { "epoch": 0.81, "learning_rate": 1.8538127636043224e-06, "loss": 20.6003, "step": 74830 }, { "epoch": 0.81, "learning_rate": 1.8517824869338375e-06, "loss": 21.2495, "step": 74840 }, { "epoch": 0.81, "learning_rate": 1.8497532091941906e-06, "loss": 20.5877, "step": 74850 }, { "epoch": 0.81, "learning_rate": 1.8477249306341627e-06, "loss": 20.9814, "step": 74860 }, { "epoch": 0.81, "learning_rate": 1.8456976515024094e-06, "loss": 20.9985, "step": 74870 }, { "epoch": 0.81, "learning_rate": 1.8436713720474653e-06, "loss": 21.1225, "step": 74880 }, { "epoch": 0.81, "learning_rate": 1.8416460925177415e-06, "loss": 21.3673, "step": 74890 }, { "epoch": 0.81, "learning_rate": 1.8396218131615285e-06, "loss": 20.2364, "step": 74900 }, { "epoch": 0.81, "learning_rate": 1.8375985342269919e-06, "loss": 21.207, "step": 74910 }, { "epoch": 0.81, "learning_rate": 1.8355762559621759e-06, "loss": 21.8479, "step": 74920 }, { "epoch": 0.81, "learning_rate": 1.8335549786150008e-06, "loss": 21.4798, "step": 74930 }, { "epoch": 0.81, "learning_rate": 1.8315347024332663e-06, "loss": 21.2742, "step": 74940 }, { "epoch": 0.81, "learning_rate": 1.8295154276646487e-06, "loss": 21.1571, "step": 74950 }, { "epoch": 0.81, "learning_rate": 1.8274971545567e-06, "loss": 20.9014, "step": 74960 }, { "epoch": 0.81, "learning_rate": 1.8254798833568498e-06, "loss": 21.5376, "step": 74970 }, { "epoch": 0.81, "learning_rate": 1.823463614312404e-06, "loss": 20.7632, "step": 74980 }, { "epoch": 0.81, "learning_rate": 1.8214483476705557e-06, "loss": 21.4057, "step": 74990 }, { "epoch": 0.81, "learning_rate": 1.8194340836783565e-06, "loss": 20.8887, "step": 75000 }, { "epoch": 0.81, "learning_rate": 1.8174208225827495e-06, "loss": 20.8371, "step": 75010 }, { "epoch": 0.81, "learning_rate": 1.8154085646305486e-06, "loss": 21.4275, "step": 75020 }, { "epoch": 0.81, "learning_rate": 1.8133973100684465e-06, "loss": 21.5792, "step": 75030 }, { "epoch": 0.81, "learning_rate": 1.8113870591430193e-06, "loss": 21.0499, "step": 75040 }, { "epoch": 0.81, "learning_rate": 1.8093778121007067e-06, "loss": 20.5813, "step": 75050 }, { "epoch": 0.81, "learning_rate": 1.8073695691878335e-06, "loss": 21.4598, "step": 75060 }, { "epoch": 0.81, "learning_rate": 1.8053623306506008e-06, "loss": 20.3491, "step": 75070 }, { "epoch": 0.81, "learning_rate": 1.803356096735085e-06, "loss": 21.2854, "step": 75080 }, { "epoch": 0.81, "learning_rate": 1.8013508676872472e-06, "loss": 21.2461, "step": 75090 }, { "epoch": 0.81, "learning_rate": 1.7993466437529096e-06, "loss": 20.5743, "step": 75100 }, { "epoch": 0.81, "learning_rate": 1.7973434251777833e-06, "loss": 21.2801, "step": 75110 }, { "epoch": 0.81, "learning_rate": 1.7953412122074542e-06, "loss": 21.6195, "step": 75120 }, { "epoch": 0.81, "learning_rate": 1.7933400050873795e-06, "loss": 20.8318, "step": 75130 }, { "epoch": 0.81, "learning_rate": 1.7913398040629027e-06, "loss": 20.9404, "step": 75140 }, { "epoch": 0.81, "learning_rate": 1.7893406093792387e-06, "loss": 20.5661, "step": 75150 }, { "epoch": 0.81, "learning_rate": 1.7873424212814738e-06, "loss": 20.7764, "step": 75160 }, { "epoch": 0.81, "learning_rate": 1.7853452400145788e-06, "loss": 20.5679, "step": 75170 }, { "epoch": 0.81, "learning_rate": 1.7833490658233943e-06, "loss": 21.6306, "step": 75180 }, { "epoch": 0.81, "learning_rate": 1.781353898952648e-06, "loss": 21.5682, "step": 75190 }, { "epoch": 0.81, "learning_rate": 1.7793597396469354e-06, "loss": 21.7773, "step": 75200 }, { "epoch": 0.81, "learning_rate": 1.7773665881507274e-06, "loss": 21.556, "step": 75210 }, { "epoch": 0.81, "learning_rate": 1.7753744447083764e-06, "loss": 21.147, "step": 75220 }, { "epoch": 0.81, "learning_rate": 1.773383309564106e-06, "loss": 21.7682, "step": 75230 }, { "epoch": 0.81, "learning_rate": 1.7713931829620256e-06, "loss": 20.6183, "step": 75240 }, { "epoch": 0.81, "learning_rate": 1.7694040651461108e-06, "loss": 21.3301, "step": 75250 }, { "epoch": 0.81, "learning_rate": 1.7674159563602212e-06, "loss": 21.1182, "step": 75260 }, { "epoch": 0.81, "learning_rate": 1.7654288568480838e-06, "loss": 21.0361, "step": 75270 }, { "epoch": 0.81, "learning_rate": 1.7634427668533072e-06, "loss": 20.7461, "step": 75280 }, { "epoch": 0.81, "learning_rate": 1.761457686619381e-06, "loss": 21.4371, "step": 75290 }, { "epoch": 0.81, "learning_rate": 1.7594736163896632e-06, "loss": 21.0487, "step": 75300 }, { "epoch": 0.81, "learning_rate": 1.757490556407394e-06, "loss": 21.0619, "step": 75310 }, { "epoch": 0.81, "learning_rate": 1.755508506915682e-06, "loss": 21.0112, "step": 75320 }, { "epoch": 0.81, "learning_rate": 1.7535274681575154e-06, "loss": 21.0675, "step": 75330 }, { "epoch": 0.81, "learning_rate": 1.751547440375766e-06, "loss": 20.6612, "step": 75340 }, { "epoch": 0.81, "learning_rate": 1.7495684238131716e-06, "loss": 20.9903, "step": 75350 }, { "epoch": 0.81, "learning_rate": 1.7475904187123528e-06, "loss": 20.7475, "step": 75360 }, { "epoch": 0.81, "learning_rate": 1.7456134253157976e-06, "loss": 20.4802, "step": 75370 }, { "epoch": 0.81, "learning_rate": 1.7436374438658766e-06, "loss": 21.3863, "step": 75380 }, { "epoch": 0.82, "learning_rate": 1.7416624746048404e-06, "loss": 21.074, "step": 75390 }, { "epoch": 0.82, "learning_rate": 1.7396885177748069e-06, "loss": 20.9854, "step": 75400 }, { "epoch": 0.82, "learning_rate": 1.7377155736177741e-06, "loss": 21.6981, "step": 75410 }, { "epoch": 0.82, "learning_rate": 1.7357436423756168e-06, "loss": 20.4858, "step": 75420 }, { "epoch": 0.82, "learning_rate": 1.733772724290077e-06, "loss": 21.4784, "step": 75430 }, { "epoch": 0.82, "learning_rate": 1.7318028196027857e-06, "loss": 21.7517, "step": 75440 }, { "epoch": 0.82, "learning_rate": 1.7298339285552434e-06, "loss": 21.7785, "step": 75450 }, { "epoch": 0.82, "learning_rate": 1.7278660513888245e-06, "loss": 20.3951, "step": 75460 }, { "epoch": 0.82, "learning_rate": 1.725899188344784e-06, "loss": 21.2312, "step": 75470 }, { "epoch": 0.82, "learning_rate": 1.7239333396642422e-06, "loss": 22.5065, "step": 75480 }, { "epoch": 0.82, "learning_rate": 1.7219685055882095e-06, "loss": 21.1989, "step": 75490 }, { "epoch": 0.82, "learning_rate": 1.7200046863575615e-06, "loss": 21.045, "step": 75500 }, { "epoch": 0.82, "learning_rate": 1.718041882213054e-06, "loss": 21.0888, "step": 75510 }, { "epoch": 0.82, "learning_rate": 1.716080093395317e-06, "loss": 21.3104, "step": 75520 }, { "epoch": 0.82, "learning_rate": 1.7141193201448547e-06, "loss": 20.6366, "step": 75530 }, { "epoch": 0.82, "learning_rate": 1.7121595627020482e-06, "loss": 21.398, "step": 75540 }, { "epoch": 0.82, "learning_rate": 1.7102008213071564e-06, "loss": 21.3504, "step": 75550 }, { "epoch": 0.82, "learning_rate": 1.7082430962003083e-06, "loss": 20.8888, "step": 75560 }, { "epoch": 0.82, "learning_rate": 1.7062863876215118e-06, "loss": 21.5294, "step": 75570 }, { "epoch": 0.82, "learning_rate": 1.704330695810652e-06, "loss": 21.2055, "step": 75580 }, { "epoch": 0.82, "learning_rate": 1.7023760210074835e-06, "loss": 21.2831, "step": 75590 }, { "epoch": 0.82, "learning_rate": 1.7004223634516426e-06, "loss": 21.031, "step": 75600 }, { "epoch": 0.82, "learning_rate": 1.6984697233826364e-06, "loss": 21.3919, "step": 75610 }, { "epoch": 0.82, "learning_rate": 1.696518101039849e-06, "loss": 20.7019, "step": 75620 }, { "epoch": 0.82, "learning_rate": 1.6945674966625404e-06, "loss": 21.1657, "step": 75630 }, { "epoch": 0.82, "learning_rate": 1.6926179104898443e-06, "loss": 20.9867, "step": 75640 }, { "epoch": 0.82, "learning_rate": 1.690669342760769e-06, "loss": 20.94, "step": 75650 }, { "epoch": 0.82, "learning_rate": 1.688721793714202e-06, "loss": 21.4, "step": 75660 }, { "epoch": 0.82, "learning_rate": 1.6867752635889012e-06, "loss": 21.2282, "step": 75670 }, { "epoch": 0.82, "learning_rate": 1.6848297526235013e-06, "loss": 20.4212, "step": 75680 }, { "epoch": 0.82, "learning_rate": 1.6828852610565128e-06, "loss": 20.7615, "step": 75690 }, { "epoch": 0.82, "learning_rate": 1.6809417891263214e-06, "loss": 21.144, "step": 75700 }, { "epoch": 0.82, "learning_rate": 1.6789993370711865e-06, "loss": 21.327, "step": 75710 }, { "epoch": 0.82, "learning_rate": 1.6770579051292423e-06, "loss": 21.3387, "step": 75720 }, { "epoch": 0.82, "learning_rate": 1.6751174935384996e-06, "loss": 21.6663, "step": 75730 }, { "epoch": 0.82, "learning_rate": 1.6731781025368422e-06, "loss": 20.8637, "step": 75740 }, { "epoch": 0.82, "learning_rate": 1.671239732362031e-06, "loss": 20.863, "step": 75750 }, { "epoch": 0.82, "learning_rate": 1.6693023832516998e-06, "loss": 20.5659, "step": 75760 }, { "epoch": 0.82, "learning_rate": 1.667366055443358e-06, "loss": 21.1916, "step": 75770 }, { "epoch": 0.82, "learning_rate": 1.6654307491743893e-06, "loss": 20.6481, "step": 75780 }, { "epoch": 0.82, "learning_rate": 1.663496464682054e-06, "loss": 21.3302, "step": 75790 }, { "epoch": 0.82, "learning_rate": 1.6615632022034845e-06, "loss": 21.2154, "step": 75800 }, { "epoch": 0.82, "learning_rate": 1.659630961975689e-06, "loss": 21.2936, "step": 75810 }, { "epoch": 0.82, "learning_rate": 1.6576997442355524e-06, "loss": 21.3263, "step": 75820 }, { "epoch": 0.82, "learning_rate": 1.65576954921983e-06, "loss": 21.326, "step": 75830 }, { "epoch": 0.82, "learning_rate": 1.6538403771651523e-06, "loss": 21.0203, "step": 75840 }, { "epoch": 0.82, "learning_rate": 1.6519122283080347e-06, "loss": 20.5873, "step": 75850 }, { "epoch": 0.82, "learning_rate": 1.649985102884849e-06, "loss": 20.5802, "step": 75860 }, { "epoch": 0.82, "learning_rate": 1.6480590011318565e-06, "loss": 21.144, "step": 75870 }, { "epoch": 0.82, "learning_rate": 1.6461339232851857e-06, "loss": 20.9843, "step": 75880 }, { "epoch": 0.82, "learning_rate": 1.6442098695808418e-06, "loss": 21.501, "step": 75890 }, { "epoch": 0.82, "learning_rate": 1.6422868402547043e-06, "loss": 20.7767, "step": 75900 }, { "epoch": 0.82, "learning_rate": 1.6403648355425272e-06, "loss": 21.6905, "step": 75910 }, { "epoch": 0.82, "learning_rate": 1.6384438556799398e-06, "loss": 21.3911, "step": 75920 }, { "epoch": 0.82, "learning_rate": 1.6365239009024425e-06, "loss": 21.0402, "step": 75930 }, { "epoch": 0.82, "learning_rate": 1.6346049714454126e-06, "loss": 21.5528, "step": 75940 }, { "epoch": 0.82, "learning_rate": 1.632687067544101e-06, "loss": 20.9125, "step": 75950 }, { "epoch": 0.82, "learning_rate": 1.630770189433637e-06, "loss": 21.457, "step": 75960 }, { "epoch": 0.82, "learning_rate": 1.6288543373490162e-06, "loss": 20.7335, "step": 75970 }, { "epoch": 0.82, "learning_rate": 1.626939511525113e-06, "loss": 20.7644, "step": 75980 }, { "epoch": 0.82, "learning_rate": 1.6250257121966762e-06, "loss": 20.5733, "step": 75990 }, { "epoch": 0.82, "learning_rate": 1.6231129395983259e-06, "loss": 21.9156, "step": 76000 }, { "epoch": 0.82, "learning_rate": 1.6212011939645656e-06, "loss": 21.4198, "step": 76010 }, { "epoch": 0.82, "learning_rate": 1.6192904755297579e-06, "loss": 21.0557, "step": 76020 }, { "epoch": 0.82, "learning_rate": 1.6173807845281497e-06, "loss": 21.1706, "step": 76030 }, { "epoch": 0.82, "learning_rate": 1.6154721211938607e-06, "loss": 20.8758, "step": 76040 }, { "epoch": 0.82, "learning_rate": 1.6135644857608811e-06, "loss": 21.3064, "step": 76050 }, { "epoch": 0.82, "learning_rate": 1.6116578784630831e-06, "loss": 21.0961, "step": 76060 }, { "epoch": 0.82, "learning_rate": 1.6097522995342018e-06, "loss": 20.8069, "step": 76070 }, { "epoch": 0.82, "learning_rate": 1.6078477492078525e-06, "loss": 21.7744, "step": 76080 }, { "epoch": 0.82, "learning_rate": 1.6059442277175252e-06, "loss": 20.347, "step": 76090 }, { "epoch": 0.82, "learning_rate": 1.6040417352965777e-06, "loss": 21.5601, "step": 76100 }, { "epoch": 0.82, "learning_rate": 1.602140272178253e-06, "loss": 21.8927, "step": 76110 }, { "epoch": 0.82, "learning_rate": 1.6002398385956607e-06, "loss": 21.3089, "step": 76120 }, { "epoch": 0.82, "learning_rate": 1.5983404347817777e-06, "loss": 20.5855, "step": 76130 }, { "epoch": 0.82, "learning_rate": 1.5964420609694665e-06, "loss": 21.3827, "step": 76140 }, { "epoch": 0.82, "learning_rate": 1.5945447173914542e-06, "loss": 20.5712, "step": 76150 }, { "epoch": 0.82, "learning_rate": 1.5926484042803504e-06, "loss": 21.613, "step": 76160 }, { "epoch": 0.82, "learning_rate": 1.5907531218686346e-06, "loss": 21.6168, "step": 76170 }, { "epoch": 0.82, "learning_rate": 1.5888588703886533e-06, "loss": 21.3037, "step": 76180 }, { "epoch": 0.82, "learning_rate": 1.586965650072635e-06, "loss": 21.9421, "step": 76190 }, { "epoch": 0.82, "learning_rate": 1.5850734611526775e-06, "loss": 20.7707, "step": 76200 }, { "epoch": 0.82, "learning_rate": 1.5831823038607564e-06, "loss": 20.339, "step": 76210 }, { "epoch": 0.82, "learning_rate": 1.5812921784287183e-06, "loss": 21.2085, "step": 76220 }, { "epoch": 0.82, "learning_rate": 1.5794030850882836e-06, "loss": 20.5379, "step": 76230 }, { "epoch": 0.82, "learning_rate": 1.5775150240710424e-06, "loss": 20.8005, "step": 76240 }, { "epoch": 0.82, "learning_rate": 1.5756279956084598e-06, "loss": 20.8528, "step": 76250 }, { "epoch": 0.82, "learning_rate": 1.5737419999318826e-06, "loss": 21.39, "step": 76260 }, { "epoch": 0.82, "learning_rate": 1.5718570372725217e-06, "loss": 21.3964, "step": 76270 }, { "epoch": 0.82, "learning_rate": 1.5699731078614655e-06, "loss": 20.9395, "step": 76280 }, { "epoch": 0.82, "learning_rate": 1.5680902119296704e-06, "loss": 21.3607, "step": 76290 }, { "epoch": 0.82, "learning_rate": 1.5662083497079705e-06, "loss": 21.2975, "step": 76300 }, { "epoch": 0.82, "learning_rate": 1.564327521427077e-06, "loss": 21.2884, "step": 76310 }, { "epoch": 0.83, "learning_rate": 1.5624477273175665e-06, "loss": 21.3429, "step": 76320 }, { "epoch": 0.83, "learning_rate": 1.5605689676098967e-06, "loss": 21.2467, "step": 76330 }, { "epoch": 0.83, "learning_rate": 1.5586912425343893e-06, "loss": 21.2347, "step": 76340 }, { "epoch": 0.83, "learning_rate": 1.5568145523212418e-06, "loss": 20.7535, "step": 76350 }, { "epoch": 0.83, "learning_rate": 1.554938897200534e-06, "loss": 21.8979, "step": 76360 }, { "epoch": 0.83, "learning_rate": 1.5530642774022086e-06, "loss": 20.476, "step": 76370 }, { "epoch": 0.83, "learning_rate": 1.551190693156085e-06, "loss": 21.9815, "step": 76380 }, { "epoch": 0.83, "learning_rate": 1.549318144691858e-06, "loss": 21.165, "step": 76390 }, { "epoch": 0.83, "learning_rate": 1.5474466322390845e-06, "loss": 21.1625, "step": 76400 }, { "epoch": 0.83, "learning_rate": 1.545576156027211e-06, "loss": 20.9626, "step": 76410 }, { "epoch": 0.83, "learning_rate": 1.5437067162855445e-06, "loss": 21.3516, "step": 76420 }, { "epoch": 0.83, "learning_rate": 1.5418383132432712e-06, "loss": 20.7039, "step": 76430 }, { "epoch": 0.83, "learning_rate": 1.539970947129449e-06, "loss": 20.7086, "step": 76440 }, { "epoch": 0.83, "learning_rate": 1.5381046181729997e-06, "loss": 21.0401, "step": 76450 }, { "epoch": 0.83, "learning_rate": 1.5362393266027352e-06, "loss": 20.9049, "step": 76460 }, { "epoch": 0.83, "learning_rate": 1.5343750726473272e-06, "loss": 21.2744, "step": 76470 }, { "epoch": 0.83, "learning_rate": 1.5325118565353237e-06, "loss": 21.7855, "step": 76480 }, { "epoch": 0.83, "learning_rate": 1.5306496784951462e-06, "loss": 21.9309, "step": 76490 }, { "epoch": 0.83, "learning_rate": 1.5287885387550882e-06, "loss": 21.1639, "step": 76500 }, { "epoch": 0.83, "learning_rate": 1.5269284375433169e-06, "loss": 21.1247, "step": 76510 }, { "epoch": 0.83, "learning_rate": 1.525069375087871e-06, "loss": 21.3919, "step": 76520 }, { "epoch": 0.83, "learning_rate": 1.5232113516166625e-06, "loss": 21.1293, "step": 76530 }, { "epoch": 0.83, "learning_rate": 1.521354367357475e-06, "loss": 21.0837, "step": 76540 }, { "epoch": 0.83, "learning_rate": 1.519498422537966e-06, "loss": 21.2038, "step": 76550 }, { "epoch": 0.83, "learning_rate": 1.5176435173856652e-06, "loss": 21.3441, "step": 76560 }, { "epoch": 0.83, "learning_rate": 1.5157896521279747e-06, "loss": 21.1926, "step": 76570 }, { "epoch": 0.83, "learning_rate": 1.5139368269921684e-06, "loss": 21.5652, "step": 76580 }, { "epoch": 0.83, "learning_rate": 1.5120850422053956e-06, "loss": 21.3786, "step": 76590 }, { "epoch": 0.83, "learning_rate": 1.5102342979946727e-06, "loss": 21.5659, "step": 76600 }, { "epoch": 0.83, "learning_rate": 1.5083845945868948e-06, "loss": 21.5667, "step": 76610 }, { "epoch": 0.83, "learning_rate": 1.5065359322088235e-06, "loss": 21.4882, "step": 76620 }, { "epoch": 0.83, "learning_rate": 1.504688311087098e-06, "loss": 21.1765, "step": 76630 }, { "epoch": 0.83, "learning_rate": 1.5028417314482269e-06, "loss": 21.3353, "step": 76640 }, { "epoch": 0.83, "learning_rate": 1.5009961935185902e-06, "loss": 21.0238, "step": 76650 }, { "epoch": 0.83, "learning_rate": 1.4991516975244426e-06, "loss": 20.9532, "step": 76660 }, { "epoch": 0.83, "learning_rate": 1.4973082436919107e-06, "loss": 21.1994, "step": 76670 }, { "epoch": 0.83, "learning_rate": 1.4954658322469917e-06, "loss": 21.192, "step": 76680 }, { "epoch": 0.83, "learning_rate": 1.4936244634155572e-06, "loss": 20.4337, "step": 76690 }, { "epoch": 0.83, "learning_rate": 1.4917841374233488e-06, "loss": 21.6461, "step": 76700 }, { "epoch": 0.83, "learning_rate": 1.4899448544959816e-06, "loss": 20.9743, "step": 76710 }, { "epoch": 0.83, "learning_rate": 1.488106614858943e-06, "loss": 20.1264, "step": 76720 }, { "epoch": 0.83, "learning_rate": 1.4862694187375902e-06, "loss": 21.1781, "step": 76730 }, { "epoch": 0.83, "learning_rate": 1.484433266357157e-06, "loss": 20.7995, "step": 76740 }, { "epoch": 0.83, "learning_rate": 1.4825981579427451e-06, "loss": 20.743, "step": 76750 }, { "epoch": 0.83, "learning_rate": 1.4807640937193302e-06, "loss": 21.0753, "step": 76760 }, { "epoch": 0.83, "learning_rate": 1.478931073911758e-06, "loss": 21.0038, "step": 76770 }, { "epoch": 0.83, "learning_rate": 1.4770990987447488e-06, "loss": 21.2682, "step": 76780 }, { "epoch": 0.83, "learning_rate": 1.4752681684428939e-06, "loss": 21.3978, "step": 76790 }, { "epoch": 0.83, "learning_rate": 1.473438283230655e-06, "loss": 21.2982, "step": 76800 }, { "epoch": 0.83, "learning_rate": 1.4716094433323659e-06, "loss": 20.8695, "step": 76810 }, { "epoch": 0.83, "learning_rate": 1.4697816489722395e-06, "loss": 20.2711, "step": 76820 }, { "epoch": 0.83, "learning_rate": 1.4679549003743475e-06, "loss": 20.9946, "step": 76830 }, { "epoch": 0.83, "learning_rate": 1.4661291977626424e-06, "loss": 21.6542, "step": 76840 }, { "epoch": 0.83, "learning_rate": 1.464304541360946e-06, "loss": 20.9102, "step": 76850 }, { "epoch": 0.83, "learning_rate": 1.46248093139295e-06, "loss": 20.9343, "step": 76860 }, { "epoch": 0.83, "learning_rate": 1.4606583680822272e-06, "loss": 21.1665, "step": 76870 }, { "epoch": 0.83, "learning_rate": 1.4588368516522078e-06, "loss": 20.4491, "step": 76880 }, { "epoch": 0.83, "learning_rate": 1.4570163823262018e-06, "loss": 21.4081, "step": 76890 }, { "epoch": 0.83, "learning_rate": 1.4551969603273908e-06, "loss": 21.1192, "step": 76900 }, { "epoch": 0.83, "learning_rate": 1.453378585878824e-06, "loss": 21.1802, "step": 76910 }, { "epoch": 0.83, "learning_rate": 1.45156125920343e-06, "loss": 21.3007, "step": 76920 }, { "epoch": 0.83, "learning_rate": 1.4497449805240048e-06, "loss": 21.0354, "step": 76930 }, { "epoch": 0.83, "learning_rate": 1.4479297500632084e-06, "loss": 20.8063, "step": 76940 }, { "epoch": 0.83, "learning_rate": 1.4461155680435834e-06, "loss": 21.4405, "step": 76950 }, { "epoch": 0.83, "learning_rate": 1.4443024346875356e-06, "loss": 21.9067, "step": 76960 }, { "epoch": 0.83, "learning_rate": 1.4424903502173515e-06, "loss": 21.3393, "step": 76970 }, { "epoch": 0.83, "learning_rate": 1.4406793148551835e-06, "loss": 21.1604, "step": 76980 }, { "epoch": 0.83, "learning_rate": 1.4388693288230516e-06, "loss": 21.2486, "step": 76990 }, { "epoch": 0.83, "learning_rate": 1.4370603923428517e-06, "loss": 21.2913, "step": 77000 }, { "epoch": 0.83, "learning_rate": 1.4352525056363498e-06, "loss": 20.8767, "step": 77010 }, { "epoch": 0.83, "learning_rate": 1.4334456689251874e-06, "loss": 21.581, "step": 77020 }, { "epoch": 0.83, "learning_rate": 1.4316398824308742e-06, "loss": 20.2051, "step": 77030 }, { "epoch": 0.83, "learning_rate": 1.429835146374785e-06, "loss": 21.2338, "step": 77040 }, { "epoch": 0.83, "learning_rate": 1.4280314609781743e-06, "loss": 20.1417, "step": 77050 }, { "epoch": 0.83, "learning_rate": 1.4262288264621638e-06, "loss": 21.5967, "step": 77060 }, { "epoch": 0.83, "learning_rate": 1.4244272430477512e-06, "loss": 21.4369, "step": 77070 }, { "epoch": 0.83, "learning_rate": 1.422626710955799e-06, "loss": 20.8629, "step": 77080 }, { "epoch": 0.83, "learning_rate": 1.4208272304070458e-06, "loss": 21.2113, "step": 77090 }, { "epoch": 0.83, "learning_rate": 1.4190288016220943e-06, "loss": 20.8675, "step": 77100 }, { "epoch": 0.83, "learning_rate": 1.4172314248214236e-06, "loss": 21.2084, "step": 77110 }, { "epoch": 0.83, "learning_rate": 1.4154351002253875e-06, "loss": 21.3883, "step": 77120 }, { "epoch": 0.83, "learning_rate": 1.4136398280542029e-06, "loss": 21.818, "step": 77130 }, { "epoch": 0.83, "learning_rate": 1.4118456085279652e-06, "loss": 21.4011, "step": 77140 }, { "epoch": 0.83, "learning_rate": 1.4100524418666316e-06, "loss": 21.2267, "step": 77150 }, { "epoch": 0.83, "learning_rate": 1.4082603282900364e-06, "loss": 21.2163, "step": 77160 }, { "epoch": 0.83, "learning_rate": 1.406469268017886e-06, "loss": 21.2934, "step": 77170 }, { "epoch": 0.83, "learning_rate": 1.4046792612697547e-06, "loss": 21.3598, "step": 77180 }, { "epoch": 0.83, "learning_rate": 1.402890308265088e-06, "loss": 21.1473, "step": 77190 }, { "epoch": 0.83, "learning_rate": 1.401102409223205e-06, "loss": 21.0054, "step": 77200 }, { "epoch": 0.83, "learning_rate": 1.3993155643632872e-06, "loss": 21.3292, "step": 77210 }, { "epoch": 0.83, "learning_rate": 1.3975297739043992e-06, "loss": 21.4098, "step": 77220 }, { "epoch": 0.83, "learning_rate": 1.3957450380654658e-06, "loss": 21.0207, "step": 77230 }, { "epoch": 0.84, "learning_rate": 1.39396135706529e-06, "loss": 21.5052, "step": 77240 }, { "epoch": 0.84, "learning_rate": 1.3921787311225422e-06, "loss": 20.4316, "step": 77250 }, { "epoch": 0.84, "learning_rate": 1.3903971604557598e-06, "loss": 20.4719, "step": 77260 }, { "epoch": 0.84, "learning_rate": 1.3886166452833538e-06, "loss": 21.2957, "step": 77270 }, { "epoch": 0.84, "learning_rate": 1.3868371858236117e-06, "loss": 20.8907, "step": 77280 }, { "epoch": 0.84, "learning_rate": 1.3850587822946837e-06, "loss": 21.2783, "step": 77290 }, { "epoch": 0.84, "learning_rate": 1.3832814349145963e-06, "loss": 21.182, "step": 77300 }, { "epoch": 0.84, "learning_rate": 1.3815051439012373e-06, "loss": 20.4876, "step": 77310 }, { "epoch": 0.84, "learning_rate": 1.3797299094723726e-06, "loss": 21.2959, "step": 77320 }, { "epoch": 0.84, "learning_rate": 1.3779557318456404e-06, "loss": 22.1211, "step": 77330 }, { "epoch": 0.84, "learning_rate": 1.3761826112385456e-06, "loss": 21.0122, "step": 77340 }, { "epoch": 0.84, "learning_rate": 1.3744105478684622e-06, "loss": 20.7757, "step": 77350 }, { "epoch": 0.84, "learning_rate": 1.3726395419526395e-06, "loss": 21.3769, "step": 77360 }, { "epoch": 0.84, "learning_rate": 1.3708695937081862e-06, "loss": 21.4402, "step": 77370 }, { "epoch": 0.84, "learning_rate": 1.3691007033520964e-06, "loss": 21.1056, "step": 77380 }, { "epoch": 0.84, "learning_rate": 1.3673328711012257e-06, "loss": 21.9787, "step": 77390 }, { "epoch": 0.84, "learning_rate": 1.3655660971723018e-06, "loss": 21.1763, "step": 77400 }, { "epoch": 0.84, "learning_rate": 1.3638003817819223e-06, "loss": 21.654, "step": 77410 }, { "epoch": 0.84, "learning_rate": 1.362035725146551e-06, "loss": 20.65, "step": 77420 }, { "epoch": 0.84, "learning_rate": 1.3602721274825315e-06, "loss": 21.5774, "step": 77430 }, { "epoch": 0.84, "learning_rate": 1.3585095890060696e-06, "loss": 20.9278, "step": 77440 }, { "epoch": 0.84, "learning_rate": 1.3567481099332435e-06, "loss": 20.8233, "step": 77450 }, { "epoch": 0.84, "learning_rate": 1.3549876904800053e-06, "loss": 21.7194, "step": 77460 }, { "epoch": 0.84, "learning_rate": 1.3532283308621663e-06, "loss": 20.9852, "step": 77470 }, { "epoch": 0.84, "learning_rate": 1.3514700312954221e-06, "loss": 20.8889, "step": 77480 }, { "epoch": 0.84, "learning_rate": 1.349712791995328e-06, "loss": 20.6932, "step": 77490 }, { "epoch": 0.84, "learning_rate": 1.3479566131773148e-06, "loss": 21.1502, "step": 77500 }, { "epoch": 0.84, "learning_rate": 1.3462014950566794e-06, "loss": 21.7103, "step": 77510 }, { "epoch": 0.84, "learning_rate": 1.3444474378485917e-06, "loss": 21.422, "step": 77520 }, { "epoch": 0.84, "learning_rate": 1.3426944417680898e-06, "loss": 21.1284, "step": 77530 }, { "epoch": 0.84, "learning_rate": 1.3409425070300818e-06, "loss": 21.5724, "step": 77540 }, { "epoch": 0.84, "learning_rate": 1.3391916338493482e-06, "loss": 21.1034, "step": 77550 }, { "epoch": 0.84, "learning_rate": 1.337441822440535e-06, "loss": 20.8963, "step": 77560 }, { "epoch": 0.84, "learning_rate": 1.3356930730181616e-06, "loss": 21.3181, "step": 77570 }, { "epoch": 0.84, "learning_rate": 1.3339453857966157e-06, "loss": 21.374, "step": 77580 }, { "epoch": 0.84, "learning_rate": 1.3321987609901553e-06, "loss": 21.0962, "step": 77590 }, { "epoch": 0.84, "learning_rate": 1.3304531988129077e-06, "loss": 21.232, "step": 77600 }, { "epoch": 0.84, "learning_rate": 1.328708699478869e-06, "loss": 21.1215, "step": 77610 }, { "epoch": 0.84, "learning_rate": 1.3269652632019081e-06, "loss": 21.3563, "step": 77620 }, { "epoch": 0.84, "learning_rate": 1.3252228901957608e-06, "loss": 21.3616, "step": 77630 }, { "epoch": 0.84, "learning_rate": 1.323481580674032e-06, "loss": 21.1777, "step": 77640 }, { "epoch": 0.84, "learning_rate": 1.3217413348501996e-06, "loss": 21.1139, "step": 77650 }, { "epoch": 0.84, "learning_rate": 1.3200021529376083e-06, "loss": 21.4005, "step": 77660 }, { "epoch": 0.84, "learning_rate": 1.3182640351494736e-06, "loss": 21.184, "step": 77670 }, { "epoch": 0.84, "learning_rate": 1.316526981698878e-06, "loss": 21.2274, "step": 77680 }, { "epoch": 0.84, "learning_rate": 1.314790992798778e-06, "loss": 20.8519, "step": 77690 }, { "epoch": 0.84, "learning_rate": 1.3130560686619963e-06, "loss": 21.178, "step": 77700 }, { "epoch": 0.84, "learning_rate": 1.3113222095012256e-06, "loss": 21.4663, "step": 77710 }, { "epoch": 0.84, "learning_rate": 1.309589415529029e-06, "loss": 21.4253, "step": 77720 }, { "epoch": 0.84, "learning_rate": 1.3078576869578384e-06, "loss": 21.4288, "step": 77730 }, { "epoch": 0.84, "learning_rate": 1.3061270239999545e-06, "loss": 21.2372, "step": 77740 }, { "epoch": 0.84, "learning_rate": 1.3043974268675474e-06, "loss": 20.1808, "step": 77750 }, { "epoch": 0.84, "learning_rate": 1.3026688957726596e-06, "loss": 21.4267, "step": 77760 }, { "epoch": 0.84, "learning_rate": 1.3009414309271973e-06, "loss": 21.69, "step": 77770 }, { "epoch": 0.84, "learning_rate": 1.2992150325429397e-06, "loss": 21.5444, "step": 77780 }, { "epoch": 0.84, "learning_rate": 1.297489700831539e-06, "loss": 21.623, "step": 77790 }, { "epoch": 0.84, "learning_rate": 1.2957654360045057e-06, "loss": 21.4471, "step": 77800 }, { "epoch": 0.84, "learning_rate": 1.294042238273231e-06, "loss": 21.7163, "step": 77810 }, { "epoch": 0.84, "learning_rate": 1.2923201078489666e-06, "loss": 21.4852, "step": 77820 }, { "epoch": 0.84, "learning_rate": 1.2905990449428384e-06, "loss": 20.8611, "step": 77830 }, { "epoch": 0.84, "learning_rate": 1.2888790497658444e-06, "loss": 21.8326, "step": 77840 }, { "epoch": 0.84, "learning_rate": 1.2871601225288411e-06, "loss": 21.2292, "step": 77850 }, { "epoch": 0.84, "learning_rate": 1.2854422634425634e-06, "loss": 21.6685, "step": 77860 }, { "epoch": 0.84, "learning_rate": 1.2837254727176118e-06, "loss": 21.2432, "step": 77870 }, { "epoch": 0.84, "learning_rate": 1.2820097505644536e-06, "loss": 21.853, "step": 77880 }, { "epoch": 0.84, "learning_rate": 1.2802950971934337e-06, "loss": 20.8531, "step": 77890 }, { "epoch": 0.84, "learning_rate": 1.2785815128147582e-06, "loss": 21.287, "step": 77900 }, { "epoch": 0.84, "learning_rate": 1.2768689976385007e-06, "loss": 21.3895, "step": 77910 }, { "epoch": 0.84, "learning_rate": 1.2751575518746095e-06, "loss": 20.5766, "step": 77920 }, { "epoch": 0.84, "learning_rate": 1.273447175732896e-06, "loss": 21.0401, "step": 77930 }, { "epoch": 0.84, "learning_rate": 1.2717378694230498e-06, "loss": 21.6707, "step": 77940 }, { "epoch": 0.84, "learning_rate": 1.2700296331546214e-06, "loss": 21.4639, "step": 77950 }, { "epoch": 0.84, "learning_rate": 1.2683224671370286e-06, "loss": 21.3937, "step": 77960 }, { "epoch": 0.84, "learning_rate": 1.2666163715795644e-06, "loss": 20.929, "step": 77970 }, { "epoch": 0.84, "learning_rate": 1.2649113466913843e-06, "loss": 21.903, "step": 77980 }, { "epoch": 0.84, "learning_rate": 1.2632073926815203e-06, "loss": 20.9997, "step": 77990 }, { "epoch": 0.84, "learning_rate": 1.2615045097588685e-06, "loss": 20.9995, "step": 78000 }, { "epoch": 0.84, "learning_rate": 1.259802698132191e-06, "loss": 21.2363, "step": 78010 }, { "epoch": 0.84, "learning_rate": 1.2581019580101216e-06, "loss": 20.9693, "step": 78020 }, { "epoch": 0.84, "learning_rate": 1.2564022896011618e-06, "loss": 21.7437, "step": 78030 }, { "epoch": 0.84, "learning_rate": 1.2547036931136868e-06, "loss": 21.2357, "step": 78040 }, { "epoch": 0.84, "learning_rate": 1.2530061687559325e-06, "loss": 21.2637, "step": 78050 }, { "epoch": 0.84, "learning_rate": 1.2513097167360099e-06, "loss": 21.2, "step": 78060 }, { "epoch": 0.84, "learning_rate": 1.249614337261893e-06, "loss": 20.9009, "step": 78070 }, { "epoch": 0.84, "learning_rate": 1.247920030541424e-06, "loss": 21.7434, "step": 78080 }, { "epoch": 0.84, "learning_rate": 1.2462267967823216e-06, "loss": 21.4583, "step": 78090 }, { "epoch": 0.84, "learning_rate": 1.2445346361921661e-06, "loss": 21.3131, "step": 78100 }, { "epoch": 0.84, "learning_rate": 1.2428435489784107e-06, "loss": 21.0066, "step": 78110 }, { "epoch": 0.84, "learning_rate": 1.2411535353483694e-06, "loss": 20.7907, "step": 78120 }, { "epoch": 0.84, "learning_rate": 1.2394645955092287e-06, "loss": 21.0676, "step": 78130 }, { "epoch": 0.84, "learning_rate": 1.2377767296680498e-06, "loss": 20.9166, "step": 78140 }, { "epoch": 0.84, "learning_rate": 1.2360899380317536e-06, "loss": 20.7059, "step": 78150 }, { "epoch": 0.84, "learning_rate": 1.2344042208071327e-06, "loss": 20.9368, "step": 78160 }, { "epoch": 0.85, "learning_rate": 1.2327195782008495e-06, "loss": 20.3435, "step": 78170 }, { "epoch": 0.85, "learning_rate": 1.2310360104194263e-06, "loss": 22.1794, "step": 78180 }, { "epoch": 0.85, "learning_rate": 1.2293535176692673e-06, "loss": 21.3251, "step": 78190 }, { "epoch": 0.85, "learning_rate": 1.227672100156635e-06, "loss": 21.4675, "step": 78200 }, { "epoch": 0.85, "learning_rate": 1.2259917580876624e-06, "loss": 20.8316, "step": 78210 }, { "epoch": 0.85, "learning_rate": 1.2243124916683534e-06, "loss": 21.0542, "step": 78220 }, { "epoch": 0.85, "learning_rate": 1.2226343011045717e-06, "loss": 20.9521, "step": 78230 }, { "epoch": 0.85, "learning_rate": 1.220957186602062e-06, "loss": 20.3041, "step": 78240 }, { "epoch": 0.85, "learning_rate": 1.2192811483664268e-06, "loss": 22.0027, "step": 78250 }, { "epoch": 0.85, "learning_rate": 1.2176061866031408e-06, "loss": 21.388, "step": 78260 }, { "epoch": 0.85, "learning_rate": 1.2159323015175473e-06, "loss": 21.3566, "step": 78270 }, { "epoch": 0.85, "learning_rate": 1.2142594933148511e-06, "loss": 21.4816, "step": 78280 }, { "epoch": 0.85, "learning_rate": 1.2125877622001358e-06, "loss": 21.5307, "step": 78290 }, { "epoch": 0.85, "learning_rate": 1.2109171083783443e-06, "loss": 21.1761, "step": 78300 }, { "epoch": 0.85, "learning_rate": 1.209247532054293e-06, "loss": 20.709, "step": 78310 }, { "epoch": 0.85, "learning_rate": 1.207579033432661e-06, "loss": 21.1263, "step": 78320 }, { "epoch": 0.85, "learning_rate": 1.2059116127179993e-06, "loss": 20.7171, "step": 78330 }, { "epoch": 0.85, "learning_rate": 1.2042452701147244e-06, "loss": 20.915, "step": 78340 }, { "epoch": 0.85, "learning_rate": 1.2025800058271232e-06, "loss": 21.3296, "step": 78350 }, { "epoch": 0.85, "learning_rate": 1.2009158200593463e-06, "loss": 21.2086, "step": 78360 }, { "epoch": 0.85, "learning_rate": 1.1992527130154175e-06, "loss": 21.0366, "step": 78370 }, { "epoch": 0.85, "learning_rate": 1.1975906848992236e-06, "loss": 21.843, "step": 78380 }, { "epoch": 0.85, "learning_rate": 1.1959297359145205e-06, "loss": 20.6589, "step": 78390 }, { "epoch": 0.85, "learning_rate": 1.1942698662649344e-06, "loss": 21.2726, "step": 78400 }, { "epoch": 0.85, "learning_rate": 1.1926110761539556e-06, "loss": 21.0172, "step": 78410 }, { "epoch": 0.85, "learning_rate": 1.1909533657849425e-06, "loss": 21.9927, "step": 78420 }, { "epoch": 0.85, "learning_rate": 1.189296735361124e-06, "loss": 21.4219, "step": 78430 }, { "epoch": 0.85, "learning_rate": 1.187641185085595e-06, "loss": 21.1558, "step": 78440 }, { "epoch": 0.85, "learning_rate": 1.1859867151613159e-06, "loss": 20.9901, "step": 78450 }, { "epoch": 0.85, "learning_rate": 1.1843333257911172e-06, "loss": 21.8804, "step": 78460 }, { "epoch": 0.85, "learning_rate": 1.1826810171776958e-06, "loss": 20.933, "step": 78470 }, { "epoch": 0.85, "learning_rate": 1.1810297895236177e-06, "loss": 21.5552, "step": 78480 }, { "epoch": 0.85, "learning_rate": 1.1793796430313142e-06, "loss": 20.9844, "step": 78490 }, { "epoch": 0.85, "learning_rate": 1.1777305779030845e-06, "loss": 21.8679, "step": 78500 }, { "epoch": 0.85, "learning_rate": 1.176082594341098e-06, "loss": 21.9327, "step": 78510 }, { "epoch": 0.85, "learning_rate": 1.1744356925473866e-06, "loss": 21.8918, "step": 78520 }, { "epoch": 0.85, "learning_rate": 1.172789872723854e-06, "loss": 20.9862, "step": 78530 }, { "epoch": 0.85, "learning_rate": 1.171145135072269e-06, "loss": 20.9065, "step": 78540 }, { "epoch": 0.85, "learning_rate": 1.1695014797942682e-06, "loss": 21.0405, "step": 78550 }, { "epoch": 0.85, "learning_rate": 1.1678589070913559e-06, "loss": 21.5824, "step": 78560 }, { "epoch": 0.85, "learning_rate": 1.1662174171649022e-06, "loss": 21.8082, "step": 78570 }, { "epoch": 0.85, "learning_rate": 1.1645770102161468e-06, "loss": 20.6315, "step": 78580 }, { "epoch": 0.85, "learning_rate": 1.162937686446195e-06, "loss": 21.5734, "step": 78590 }, { "epoch": 0.85, "learning_rate": 1.1612994460560201e-06, "loss": 20.8421, "step": 78600 }, { "epoch": 0.85, "learning_rate": 1.1596622892464603e-06, "loss": 20.6526, "step": 78610 }, { "epoch": 0.85, "learning_rate": 1.1580262162182253e-06, "loss": 22.1106, "step": 78620 }, { "epoch": 0.85, "learning_rate": 1.1563912271718891e-06, "loss": 21.0929, "step": 78630 }, { "epoch": 0.85, "learning_rate": 1.1547573223078924e-06, "loss": 21.0422, "step": 78640 }, { "epoch": 0.85, "learning_rate": 1.1531245018265435e-06, "loss": 21.2662, "step": 78650 }, { "epoch": 0.85, "learning_rate": 1.1514927659280184e-06, "loss": 21.2269, "step": 78660 }, { "epoch": 0.85, "learning_rate": 1.1498621148123611e-06, "loss": 21.6868, "step": 78670 }, { "epoch": 0.85, "learning_rate": 1.1482325486794788e-06, "loss": 20.5665, "step": 78680 }, { "epoch": 0.85, "learning_rate": 1.14660406772915e-06, "loss": 21.2188, "step": 78690 }, { "epoch": 0.85, "learning_rate": 1.144976672161019e-06, "loss": 20.977, "step": 78700 }, { "epoch": 0.85, "learning_rate": 1.1433503621745935e-06, "loss": 21.0352, "step": 78710 }, { "epoch": 0.85, "learning_rate": 1.141725137969254e-06, "loss": 20.8765, "step": 78720 }, { "epoch": 0.85, "learning_rate": 1.1401009997442436e-06, "loss": 20.9617, "step": 78730 }, { "epoch": 0.85, "learning_rate": 1.138477947698673e-06, "loss": 21.5914, "step": 78740 }, { "epoch": 0.85, "learning_rate": 1.1368559820315194e-06, "loss": 21.6248, "step": 78750 }, { "epoch": 0.85, "learning_rate": 1.135235102941633e-06, "loss": 21.3699, "step": 78760 }, { "epoch": 0.85, "learning_rate": 1.1336153106277193e-06, "loss": 21.1554, "step": 78770 }, { "epoch": 0.85, "learning_rate": 1.1319966052883603e-06, "loss": 20.4861, "step": 78780 }, { "epoch": 0.85, "learning_rate": 1.1303789871219983e-06, "loss": 20.6426, "step": 78790 }, { "epoch": 0.85, "learning_rate": 1.1287624563269461e-06, "loss": 21.9874, "step": 78800 }, { "epoch": 0.85, "learning_rate": 1.1271470131013872e-06, "loss": 21.2308, "step": 78810 }, { "epoch": 0.85, "learning_rate": 1.1255326576433612e-06, "loss": 21.1582, "step": 78820 }, { "epoch": 0.85, "learning_rate": 1.1239193901507805e-06, "loss": 21.7666, "step": 78830 }, { "epoch": 0.85, "learning_rate": 1.1223072108214262e-06, "loss": 21.8135, "step": 78840 }, { "epoch": 0.85, "learning_rate": 1.1206961198529386e-06, "loss": 21.2484, "step": 78850 }, { "epoch": 0.85, "learning_rate": 1.1190861174428358e-06, "loss": 21.2866, "step": 78860 }, { "epoch": 0.85, "learning_rate": 1.117477203788495e-06, "loss": 20.9704, "step": 78870 }, { "epoch": 0.85, "learning_rate": 1.1158693790871578e-06, "loss": 21.8415, "step": 78880 }, { "epoch": 0.85, "learning_rate": 1.1142626435359361e-06, "loss": 21.1724, "step": 78890 }, { "epoch": 0.85, "learning_rate": 1.1126569973318069e-06, "loss": 20.7245, "step": 78900 }, { "epoch": 0.85, "learning_rate": 1.1110524406716182e-06, "loss": 21.4541, "step": 78910 }, { "epoch": 0.85, "learning_rate": 1.1094489737520797e-06, "loss": 21.0033, "step": 78920 }, { "epoch": 0.85, "learning_rate": 1.107846596769766e-06, "loss": 21.6881, "step": 78930 }, { "epoch": 0.85, "learning_rate": 1.1062453099211213e-06, "loss": 21.7243, "step": 78940 }, { "epoch": 0.85, "learning_rate": 1.1046451134024527e-06, "loss": 20.7014, "step": 78950 }, { "epoch": 0.85, "learning_rate": 1.1030460074099425e-06, "loss": 21.8879, "step": 78960 }, { "epoch": 0.85, "learning_rate": 1.1014479921396315e-06, "loss": 22.0752, "step": 78970 }, { "epoch": 0.85, "learning_rate": 1.0998510677874252e-06, "loss": 20.9857, "step": 78980 }, { "epoch": 0.85, "learning_rate": 1.0982552345491005e-06, "loss": 20.664, "step": 78990 }, { "epoch": 0.85, "learning_rate": 1.0966604926202963e-06, "loss": 21.5855, "step": 79000 }, { "epoch": 0.85, "learning_rate": 1.0950668421965238e-06, "loss": 20.0627, "step": 79010 }, { "epoch": 0.85, "learning_rate": 1.093474283473155e-06, "loss": 21.0241, "step": 79020 }, { "epoch": 0.85, "learning_rate": 1.0918828166454321e-06, "loss": 21.4325, "step": 79030 }, { "epoch": 0.85, "learning_rate": 1.090292441908456e-06, "loss": 21.061, "step": 79040 }, { "epoch": 0.85, "learning_rate": 1.0887031594571985e-06, "loss": 20.9604, "step": 79050 }, { "epoch": 0.85, "learning_rate": 1.0871149694865024e-06, "loss": 21.1907, "step": 79060 }, { "epoch": 0.85, "learning_rate": 1.08552787219107e-06, "loss": 21.1371, "step": 79070 }, { "epoch": 0.85, "learning_rate": 1.0839418677654745e-06, "loss": 21.2684, "step": 79080 }, { "epoch": 0.86, "learning_rate": 1.0823569564041458e-06, "loss": 21.5964, "step": 79090 }, { "epoch": 0.86, "learning_rate": 1.0807731383013875e-06, "loss": 21.2589, "step": 79100 }, { "epoch": 0.86, "learning_rate": 1.079190413651371e-06, "loss": 21.5233, "step": 79110 }, { "epoch": 0.86, "learning_rate": 1.0776087826481297e-06, "loss": 21.5784, "step": 79120 }, { "epoch": 0.86, "learning_rate": 1.0760282454855653e-06, "loss": 20.9981, "step": 79130 }, { "epoch": 0.86, "learning_rate": 1.0744488023574395e-06, "loss": 20.898, "step": 79140 }, { "epoch": 0.86, "learning_rate": 1.072870453457383e-06, "loss": 20.9572, "step": 79150 }, { "epoch": 0.86, "learning_rate": 1.0712931989789e-06, "loss": 21.496, "step": 79160 }, { "epoch": 0.86, "learning_rate": 1.06971703911535e-06, "loss": 20.768, "step": 79170 }, { "epoch": 0.86, "learning_rate": 1.068141974059963e-06, "loss": 21.27, "step": 79180 }, { "epoch": 0.86, "learning_rate": 1.0665680040058368e-06, "loss": 20.7966, "step": 79190 }, { "epoch": 0.86, "learning_rate": 1.064995129145925e-06, "loss": 21.1696, "step": 79200 }, { "epoch": 0.86, "learning_rate": 1.0634233496730606e-06, "loss": 21.4383, "step": 79210 }, { "epoch": 0.86, "learning_rate": 1.0618526657799355e-06, "loss": 21.0417, "step": 79220 }, { "epoch": 0.86, "learning_rate": 1.0602830776591045e-06, "loss": 21.9176, "step": 79230 }, { "epoch": 0.86, "learning_rate": 1.0587145855029967e-06, "loss": 21.2413, "step": 79240 }, { "epoch": 0.86, "learning_rate": 1.057147189503893e-06, "loss": 20.8056, "step": 79250 }, { "epoch": 0.86, "learning_rate": 1.0555808898539555e-06, "loss": 21.1381, "step": 79260 }, { "epoch": 0.86, "learning_rate": 1.0540156867452024e-06, "loss": 21.5784, "step": 79270 }, { "epoch": 0.86, "learning_rate": 1.05245158036952e-06, "loss": 20.613, "step": 79280 }, { "epoch": 0.86, "learning_rate": 1.05088857091866e-06, "loss": 20.8668, "step": 79290 }, { "epoch": 0.86, "learning_rate": 1.0493266585842388e-06, "loss": 21.3463, "step": 79300 }, { "epoch": 0.86, "learning_rate": 1.0477658435577399e-06, "loss": 20.6774, "step": 79310 }, { "epoch": 0.86, "learning_rate": 1.0462061260305112e-06, "loss": 20.6724, "step": 79320 }, { "epoch": 0.86, "learning_rate": 1.0446475061937667e-06, "loss": 21.6661, "step": 79330 }, { "epoch": 0.86, "learning_rate": 1.0430899842385845e-06, "loss": 22.195, "step": 79340 }, { "epoch": 0.86, "learning_rate": 1.0415335603559085e-06, "loss": 21.4334, "step": 79350 }, { "epoch": 0.86, "learning_rate": 1.0399782347365507e-06, "loss": 21.2162, "step": 79360 }, { "epoch": 0.86, "learning_rate": 1.0384240075711848e-06, "loss": 21.4058, "step": 79370 }, { "epoch": 0.86, "learning_rate": 1.0368708790503511e-06, "loss": 20.9883, "step": 79380 }, { "epoch": 0.86, "learning_rate": 1.0353188493644562e-06, "loss": 21.5165, "step": 79390 }, { "epoch": 0.86, "learning_rate": 1.033767918703772e-06, "loss": 21.0022, "step": 79400 }, { "epoch": 0.86, "learning_rate": 1.032218087258432e-06, "loss": 20.6348, "step": 79410 }, { "epoch": 0.86, "learning_rate": 1.0306693552184399e-06, "loss": 20.6207, "step": 79420 }, { "epoch": 0.86, "learning_rate": 1.0291217227736628e-06, "loss": 20.9772, "step": 79430 }, { "epoch": 0.86, "learning_rate": 1.027575190113832e-06, "loss": 21.0941, "step": 79440 }, { "epoch": 0.86, "learning_rate": 1.026029757428545e-06, "loss": 21.544, "step": 79450 }, { "epoch": 0.86, "learning_rate": 1.0244854249072633e-06, "loss": 20.3768, "step": 79460 }, { "epoch": 0.86, "learning_rate": 1.0229421927393157e-06, "loss": 21.4694, "step": 79470 }, { "epoch": 0.86, "learning_rate": 1.021400061113893e-06, "loss": 20.5837, "step": 79480 }, { "epoch": 0.86, "learning_rate": 1.0198590302200551e-06, "loss": 20.7592, "step": 79490 }, { "epoch": 0.86, "learning_rate": 1.018319100246723e-06, "loss": 21.469, "step": 79500 }, { "epoch": 0.86, "learning_rate": 1.0167802713826847e-06, "loss": 20.6554, "step": 79510 }, { "epoch": 0.86, "learning_rate": 1.0152425438165936e-06, "loss": 20.7107, "step": 79520 }, { "epoch": 0.86, "learning_rate": 1.0137059177369668e-06, "loss": 21.1553, "step": 79530 }, { "epoch": 0.86, "learning_rate": 1.012170393332187e-06, "loss": 20.5853, "step": 79540 }, { "epoch": 0.86, "learning_rate": 1.0106359707905023e-06, "loss": 21.8398, "step": 79550 }, { "epoch": 0.86, "learning_rate": 1.0091026503000245e-06, "loss": 21.0925, "step": 79560 }, { "epoch": 0.86, "learning_rate": 1.0075704320487323e-06, "loss": 20.8515, "step": 79570 }, { "epoch": 0.86, "learning_rate": 1.0060393162244674e-06, "loss": 20.8422, "step": 79580 }, { "epoch": 0.86, "learning_rate": 1.0045093030149366e-06, "loss": 20.9427, "step": 79590 }, { "epoch": 0.86, "learning_rate": 1.002980392607712e-06, "loss": 21.3709, "step": 79600 }, { "epoch": 0.86, "learning_rate": 1.0014525851902302e-06, "loss": 21.5895, "step": 79610 }, { "epoch": 0.86, "learning_rate": 9.999258809497935e-07, "loss": 20.5114, "step": 79620 }, { "epoch": 0.86, "learning_rate": 9.984002800735682e-07, "loss": 21.083, "step": 79630 }, { "epoch": 0.86, "learning_rate": 9.968757827485842e-07, "loss": 20.4797, "step": 79640 }, { "epoch": 0.86, "learning_rate": 9.953523891617388e-07, "loss": 21.7433, "step": 79650 }, { "epoch": 0.86, "learning_rate": 9.938300994997917e-07, "loss": 21.6447, "step": 79660 }, { "epoch": 0.86, "learning_rate": 9.92308913949368e-07, "loss": 20.915, "step": 79670 }, { "epoch": 0.86, "learning_rate": 9.907888326969572e-07, "loss": 21.2413, "step": 79680 }, { "epoch": 0.86, "learning_rate": 9.892698559289137e-07, "loss": 20.9748, "step": 79690 }, { "epoch": 0.86, "learning_rate": 9.877519838314576e-07, "loss": 21.5183, "step": 79700 }, { "epoch": 0.86, "learning_rate": 9.862352165906708e-07, "loss": 21.0004, "step": 79710 }, { "epoch": 0.86, "learning_rate": 9.847195543925003e-07, "loss": 20.5761, "step": 79720 }, { "epoch": 0.86, "learning_rate": 9.832049974227654e-07, "loss": 22.2307, "step": 79730 }, { "epoch": 0.86, "learning_rate": 9.81691545867135e-07, "loss": 21.2983, "step": 79740 }, { "epoch": 0.86, "learning_rate": 9.801791999111554e-07, "loss": 20.9659, "step": 79750 }, { "epoch": 0.86, "learning_rate": 9.786679597402316e-07, "loss": 20.8306, "step": 79760 }, { "epoch": 0.86, "learning_rate": 9.77157825539632e-07, "loss": 20.3064, "step": 79770 }, { "epoch": 0.86, "learning_rate": 9.75648797494496e-07, "loss": 21.5189, "step": 79780 }, { "epoch": 0.86, "learning_rate": 9.741408757898195e-07, "loss": 21.529, "step": 79790 }, { "epoch": 0.86, "learning_rate": 9.726340606104678e-07, "loss": 20.7084, "step": 79800 }, { "epoch": 0.86, "learning_rate": 9.711283521411674e-07, "loss": 20.8319, "step": 79810 }, { "epoch": 0.86, "learning_rate": 9.696237505665096e-07, "loss": 21.7506, "step": 79820 }, { "epoch": 0.86, "learning_rate": 9.681202560709546e-07, "loss": 20.578, "step": 79830 }, { "epoch": 0.86, "learning_rate": 9.66617868838824e-07, "loss": 21.2704, "step": 79840 }, { "epoch": 0.86, "learning_rate": 9.65116589054298e-07, "loss": 20.7089, "step": 79850 }, { "epoch": 0.86, "learning_rate": 9.636164169014294e-07, "loss": 21.1505, "step": 79860 }, { "epoch": 0.86, "learning_rate": 9.621173525641291e-07, "loss": 21.609, "step": 79870 }, { "epoch": 0.86, "learning_rate": 9.60619396226179e-07, "loss": 20.9502, "step": 79880 }, { "epoch": 0.86, "learning_rate": 9.591225480712208e-07, "loss": 21.541, "step": 79890 }, { "epoch": 0.86, "learning_rate": 9.576268082827555e-07, "loss": 22.0983, "step": 79900 }, { "epoch": 0.86, "learning_rate": 9.56132177044158e-07, "loss": 21.0759, "step": 79910 }, { "epoch": 0.86, "learning_rate": 9.5463865453866e-07, "loss": 21.4666, "step": 79920 }, { "epoch": 0.86, "learning_rate": 9.531462409493619e-07, "loss": 20.9166, "step": 79930 }, { "epoch": 0.86, "learning_rate": 9.516549364592275e-07, "loss": 21.0884, "step": 79940 }, { "epoch": 0.86, "learning_rate": 9.501647412510795e-07, "loss": 21.0266, "step": 79950 }, { "epoch": 0.86, "learning_rate": 9.486756555076104e-07, "loss": 21.6074, "step": 79960 }, { "epoch": 0.86, "learning_rate": 9.471876794113721e-07, "loss": 21.7792, "step": 79970 }, { "epoch": 0.86, "learning_rate": 9.457008131447876e-07, "loss": 21.4449, "step": 79980 }, { "epoch": 0.86, "learning_rate": 9.442150568901365e-07, "loss": 21.2177, "step": 79990 }, { "epoch": 0.86, "learning_rate": 9.427304108295676e-07, "loss": 21.9288, "step": 80000 }, { "epoch": 0.86, "learning_rate": 9.412468751450876e-07, "loss": 21.4607, "step": 80010 }, { "epoch": 0.87, "learning_rate": 9.39764450018571e-07, "loss": 21.462, "step": 80020 }, { "epoch": 0.87, "learning_rate": 9.382831356317578e-07, "loss": 21.5196, "step": 80030 }, { "epoch": 0.87, "learning_rate": 9.368029321662487e-07, "loss": 21.4077, "step": 80040 }, { "epoch": 0.87, "learning_rate": 9.353238398035124e-07, "loss": 21.1901, "step": 80050 }, { "epoch": 0.87, "learning_rate": 9.338458587248722e-07, "loss": 22.0105, "step": 80060 }, { "epoch": 0.87, "learning_rate": 9.323689891115228e-07, "loss": 21.3292, "step": 80070 }, { "epoch": 0.87, "learning_rate": 9.30893231144524e-07, "loss": 20.7594, "step": 80080 }, { "epoch": 0.87, "learning_rate": 9.294185850047954e-07, "loss": 21.5744, "step": 80090 }, { "epoch": 0.87, "learning_rate": 9.279450508731236e-07, "loss": 21.0723, "step": 80100 }, { "epoch": 0.87, "learning_rate": 9.264726289301507e-07, "loss": 21.5253, "step": 80110 }, { "epoch": 0.87, "learning_rate": 9.25001319356389e-07, "loss": 21.3203, "step": 80120 }, { "epoch": 0.87, "learning_rate": 9.235311223322186e-07, "loss": 20.726, "step": 80130 }, { "epoch": 0.87, "learning_rate": 9.220620380378753e-07, "loss": 21.3151, "step": 80140 }, { "epoch": 0.87, "learning_rate": 9.205940666534619e-07, "loss": 21.7421, "step": 80150 }, { "epoch": 0.87, "learning_rate": 9.191272083589464e-07, "loss": 21.0924, "step": 80160 }, { "epoch": 0.87, "learning_rate": 9.17661463334153e-07, "loss": 21.1544, "step": 80170 }, { "epoch": 0.87, "learning_rate": 9.161968317587788e-07, "loss": 21.018, "step": 80180 }, { "epoch": 0.87, "learning_rate": 9.147333138123804e-07, "loss": 21.3002, "step": 80190 }, { "epoch": 0.87, "learning_rate": 9.132709096743775e-07, "loss": 21.1695, "step": 80200 }, { "epoch": 0.87, "learning_rate": 9.118096195240545e-07, "loss": 21.536, "step": 80210 }, { "epoch": 0.87, "learning_rate": 9.103494435405525e-07, "loss": 21.0373, "step": 80220 }, { "epoch": 0.87, "learning_rate": 9.088903819028882e-07, "loss": 20.9135, "step": 80230 }, { "epoch": 0.87, "learning_rate": 9.074324347899333e-07, "loss": 21.3615, "step": 80240 }, { "epoch": 0.87, "learning_rate": 9.059756023804245e-07, "loss": 21.5558, "step": 80250 }, { "epoch": 0.87, "learning_rate": 9.045198848529635e-07, "loss": 21.9894, "step": 80260 }, { "epoch": 0.87, "learning_rate": 9.03065282386012e-07, "loss": 21.5888, "step": 80270 }, { "epoch": 0.87, "learning_rate": 9.016117951578985e-07, "loss": 21.3461, "step": 80280 }, { "epoch": 0.87, "learning_rate": 9.001594233468113e-07, "loss": 20.4727, "step": 80290 }, { "epoch": 0.87, "learning_rate": 8.987081671308074e-07, "loss": 21.4834, "step": 80300 }, { "epoch": 0.87, "learning_rate": 8.972580266877995e-07, "loss": 20.9094, "step": 80310 }, { "epoch": 0.87, "learning_rate": 8.958090021955712e-07, "loss": 21.3306, "step": 80320 }, { "epoch": 0.87, "learning_rate": 8.943610938317638e-07, "loss": 21.4617, "step": 80330 }, { "epoch": 0.87, "learning_rate": 8.92914301773884e-07, "loss": 21.4275, "step": 80340 }, { "epoch": 0.87, "learning_rate": 8.914686261993011e-07, "loss": 20.8976, "step": 80350 }, { "epoch": 0.87, "learning_rate": 8.900240672852478e-07, "loss": 21.2379, "step": 80360 }, { "epoch": 0.87, "learning_rate": 8.885806252088191e-07, "loss": 21.4542, "step": 80370 }, { "epoch": 0.87, "learning_rate": 8.871383001469757e-07, "loss": 21.2889, "step": 80380 }, { "epoch": 0.87, "learning_rate": 8.856970922765385e-07, "loss": 21.4829, "step": 80390 }, { "epoch": 0.87, "learning_rate": 8.842570017741914e-07, "loss": 21.3353, "step": 80400 }, { "epoch": 0.87, "learning_rate": 8.828180288164833e-07, "loss": 21.2036, "step": 80410 }, { "epoch": 0.87, "learning_rate": 8.813801735798255e-07, "loss": 21.6778, "step": 80420 }, { "epoch": 0.87, "learning_rate": 8.799434362404912e-07, "loss": 21.0684, "step": 80430 }, { "epoch": 0.87, "learning_rate": 8.785078169746175e-07, "loss": 20.9005, "step": 80440 }, { "epoch": 0.87, "learning_rate": 8.770733159582035e-07, "loss": 20.7406, "step": 80450 }, { "epoch": 0.87, "learning_rate": 8.756399333671128e-07, "loss": 21.3294, "step": 80460 }, { "epoch": 0.87, "learning_rate": 8.742076693770707e-07, "loss": 21.2155, "step": 80470 }, { "epoch": 0.87, "learning_rate": 8.727765241636654e-07, "loss": 21.784, "step": 80480 }, { "epoch": 0.87, "learning_rate": 8.713464979023478e-07, "loss": 21.0597, "step": 80490 }, { "epoch": 0.87, "learning_rate": 8.699175907684331e-07, "loss": 21.6078, "step": 80500 }, { "epoch": 0.87, "learning_rate": 8.684898029370981e-07, "loss": 21.1277, "step": 80510 }, { "epoch": 0.87, "learning_rate": 8.670631345833814e-07, "loss": 21.2022, "step": 80520 }, { "epoch": 0.87, "learning_rate": 8.65637585882183e-07, "loss": 21.4937, "step": 80530 }, { "epoch": 0.87, "learning_rate": 8.642131570082757e-07, "loss": 21.5309, "step": 80540 }, { "epoch": 0.87, "learning_rate": 8.627898481362817e-07, "loss": 21.7034, "step": 80550 }, { "epoch": 0.87, "learning_rate": 8.613676594406917e-07, "loss": 21.0096, "step": 80560 }, { "epoch": 0.87, "learning_rate": 8.599465910958593e-07, "loss": 21.158, "step": 80570 }, { "epoch": 0.87, "learning_rate": 8.585266432759998e-07, "loss": 21.0966, "step": 80580 }, { "epoch": 0.87, "learning_rate": 8.57107816155196e-07, "loss": 21.7471, "step": 80590 }, { "epoch": 0.87, "learning_rate": 8.556901099073844e-07, "loss": 21.3719, "step": 80600 }, { "epoch": 0.87, "learning_rate": 8.542735247063704e-07, "loss": 21.5969, "step": 80610 }, { "epoch": 0.87, "learning_rate": 8.528580607258197e-07, "loss": 21.3154, "step": 80620 }, { "epoch": 0.87, "learning_rate": 8.514437181392598e-07, "loss": 20.7982, "step": 80630 }, { "epoch": 0.87, "learning_rate": 8.500304971200868e-07, "loss": 20.7476, "step": 80640 }, { "epoch": 0.87, "learning_rate": 8.486183978415496e-07, "loss": 20.809, "step": 80650 }, { "epoch": 0.87, "learning_rate": 8.472074204767678e-07, "loss": 20.2488, "step": 80660 }, { "epoch": 0.87, "learning_rate": 8.457975651987172e-07, "loss": 20.997, "step": 80670 }, { "epoch": 0.87, "learning_rate": 8.443888321802396e-07, "loss": 21.1939, "step": 80680 }, { "epoch": 0.87, "learning_rate": 8.429812215940413e-07, "loss": 21.5649, "step": 80690 }, { "epoch": 0.87, "learning_rate": 8.41574733612689e-07, "loss": 21.0462, "step": 80700 }, { "epoch": 0.87, "learning_rate": 8.401693684086065e-07, "loss": 22.2785, "step": 80710 }, { "epoch": 0.87, "learning_rate": 8.387651261540874e-07, "loss": 20.8733, "step": 80720 }, { "epoch": 0.87, "learning_rate": 8.37362007021284e-07, "loss": 20.9281, "step": 80730 }, { "epoch": 0.87, "learning_rate": 8.359600111822097e-07, "loss": 21.1222, "step": 80740 }, { "epoch": 0.87, "learning_rate": 8.345591388087493e-07, "loss": 20.6063, "step": 80750 }, { "epoch": 0.87, "learning_rate": 8.331593900726354e-07, "loss": 20.788, "step": 80760 }, { "epoch": 0.87, "learning_rate": 8.317607651454718e-07, "loss": 21.5208, "step": 80770 }, { "epoch": 0.87, "learning_rate": 8.303632641987259e-07, "loss": 21.8104, "step": 80780 }, { "epoch": 0.87, "learning_rate": 8.289668874037194e-07, "loss": 21.0895, "step": 80790 }, { "epoch": 0.87, "learning_rate": 8.275716349316476e-07, "loss": 21.2549, "step": 80800 }, { "epoch": 0.87, "learning_rate": 8.26177506953556e-07, "loss": 21.2162, "step": 80810 }, { "epoch": 0.87, "learning_rate": 8.247845036403601e-07, "loss": 21.2553, "step": 80820 }, { "epoch": 0.87, "learning_rate": 8.233926251628355e-07, "loss": 21.2163, "step": 80830 }, { "epoch": 0.87, "learning_rate": 8.220018716916167e-07, "loss": 20.6351, "step": 80840 }, { "epoch": 0.87, "learning_rate": 8.206122433972063e-07, "loss": 21.5866, "step": 80850 }, { "epoch": 0.87, "learning_rate": 8.19223740449967e-07, "loss": 21.3528, "step": 80860 }, { "epoch": 0.87, "learning_rate": 8.178363630201192e-07, "loss": 20.5259, "step": 80870 }, { "epoch": 0.87, "learning_rate": 8.16450111277749e-07, "loss": 21.4614, "step": 80880 }, { "epoch": 0.87, "learning_rate": 8.150649853928017e-07, "loss": 21.6267, "step": 80890 }, { "epoch": 0.87, "learning_rate": 8.136809855350924e-07, "loss": 21.3177, "step": 80900 }, { "epoch": 0.87, "learning_rate": 8.122981118742901e-07, "loss": 20.936, "step": 80910 }, { "epoch": 0.87, "learning_rate": 8.109163645799267e-07, "loss": 21.522, "step": 80920 }, { "epoch": 0.87, "learning_rate": 8.095357438213991e-07, "loss": 21.3721, "step": 80930 }, { "epoch": 0.88, "learning_rate": 8.081562497679618e-07, "loss": 21.6176, "step": 80940 }, { "epoch": 0.88, "learning_rate": 8.067778825887385e-07, "loss": 21.2695, "step": 80950 }, { "epoch": 0.88, "learning_rate": 8.054006424527072e-07, "loss": 21.1574, "step": 80960 }, { "epoch": 0.88, "learning_rate": 8.04024529528713e-07, "loss": 21.5068, "step": 80970 }, { "epoch": 0.88, "learning_rate": 8.026495439854564e-07, "loss": 20.8631, "step": 80980 }, { "epoch": 0.88, "learning_rate": 8.01275685991505e-07, "loss": 20.9781, "step": 80990 }, { "epoch": 0.88, "learning_rate": 7.999029557152893e-07, "loss": 21.28, "step": 81000 }, { "epoch": 0.88, "learning_rate": 7.985313533250982e-07, "loss": 21.1059, "step": 81010 }, { "epoch": 0.88, "learning_rate": 7.97160878989085e-07, "loss": 21.0227, "step": 81020 }, { "epoch": 0.88, "learning_rate": 7.957915328752596e-07, "loss": 20.7694, "step": 81030 }, { "epoch": 0.88, "learning_rate": 7.944233151514957e-07, "loss": 21.0538, "step": 81040 }, { "epoch": 0.88, "learning_rate": 7.930562259855356e-07, "loss": 21.4492, "step": 81050 }, { "epoch": 0.88, "learning_rate": 7.916902655449732e-07, "loss": 21.4668, "step": 81060 }, { "epoch": 0.88, "learning_rate": 7.903254339972732e-07, "loss": 20.8987, "step": 81070 }, { "epoch": 0.88, "learning_rate": 7.88961731509752e-07, "loss": 21.003, "step": 81080 }, { "epoch": 0.88, "learning_rate": 7.875991582495923e-07, "loss": 20.2964, "step": 81090 }, { "epoch": 0.88, "learning_rate": 7.862377143838429e-07, "loss": 21.8811, "step": 81100 }, { "epoch": 0.88, "learning_rate": 7.848774000794079e-07, "loss": 20.7574, "step": 81110 }, { "epoch": 0.88, "learning_rate": 7.835182155030563e-07, "loss": 21.5797, "step": 81120 }, { "epoch": 0.88, "learning_rate": 7.821601608214179e-07, "loss": 20.8267, "step": 81130 }, { "epoch": 0.88, "learning_rate": 7.808032362009788e-07, "loss": 20.4111, "step": 81140 }, { "epoch": 0.88, "learning_rate": 7.794474418080955e-07, "loss": 21.2004, "step": 81150 }, { "epoch": 0.88, "learning_rate": 7.780927778089808e-07, "loss": 20.2449, "step": 81160 }, { "epoch": 0.88, "learning_rate": 7.767392443697097e-07, "loss": 20.7568, "step": 81170 }, { "epoch": 0.88, "learning_rate": 7.753868416562205e-07, "loss": 22.0529, "step": 81180 }, { "epoch": 0.88, "learning_rate": 7.74035569834305e-07, "loss": 21.0309, "step": 81190 }, { "epoch": 0.88, "learning_rate": 7.726854290696273e-07, "loss": 20.5983, "step": 81200 }, { "epoch": 0.88, "learning_rate": 7.713364195277084e-07, "loss": 21.037, "step": 81210 }, { "epoch": 0.88, "learning_rate": 7.699885413739272e-07, "loss": 20.6349, "step": 81220 }, { "epoch": 0.88, "learning_rate": 7.686417947735292e-07, "loss": 21.7706, "step": 81230 }, { "epoch": 0.88, "learning_rate": 7.67296179891619e-07, "loss": 21.2641, "step": 81240 }, { "epoch": 0.88, "learning_rate": 7.65951696893159e-07, "loss": 21.1792, "step": 81250 }, { "epoch": 0.88, "learning_rate": 7.646083459429798e-07, "loss": 21.485, "step": 81260 }, { "epoch": 0.88, "learning_rate": 7.632661272057685e-07, "loss": 20.8148, "step": 81270 }, { "epoch": 0.88, "learning_rate": 7.619250408460732e-07, "loss": 20.705, "step": 81280 }, { "epoch": 0.88, "learning_rate": 7.60585087028305e-07, "loss": 21.634, "step": 81290 }, { "epoch": 0.88, "learning_rate": 7.592462659167365e-07, "loss": 20.3562, "step": 81300 }, { "epoch": 0.88, "learning_rate": 7.579085776754991e-07, "loss": 20.7861, "step": 81310 }, { "epoch": 0.88, "learning_rate": 7.56572022468588e-07, "loss": 22.4431, "step": 81320 }, { "epoch": 0.88, "learning_rate": 7.552366004598566e-07, "loss": 20.6401, "step": 81330 }, { "epoch": 0.88, "learning_rate": 7.539023118130229e-07, "loss": 20.6424, "step": 81340 }, { "epoch": 0.88, "learning_rate": 7.525691566916627e-07, "loss": 21.566, "step": 81350 }, { "epoch": 0.88, "learning_rate": 7.512371352592152e-07, "loss": 20.8311, "step": 81360 }, { "epoch": 0.88, "learning_rate": 7.499062476789776e-07, "loss": 21.0543, "step": 81370 }, { "epoch": 0.88, "learning_rate": 7.485764941141127e-07, "loss": 21.2373, "step": 81380 }, { "epoch": 0.88, "learning_rate": 7.472478747276402e-07, "loss": 21.1481, "step": 81390 }, { "epoch": 0.88, "learning_rate": 7.459203896824418e-07, "loss": 21.0717, "step": 81400 }, { "epoch": 0.88, "learning_rate": 7.44594039141261e-07, "loss": 20.819, "step": 81410 }, { "epoch": 0.88, "learning_rate": 7.432688232667029e-07, "loss": 21.6471, "step": 81420 }, { "epoch": 0.88, "learning_rate": 7.4194474222123e-07, "loss": 21.2803, "step": 81430 }, { "epoch": 0.88, "learning_rate": 7.406217961671702e-07, "loss": 21.1728, "step": 81440 }, { "epoch": 0.88, "learning_rate": 7.392999852667093e-07, "loss": 20.5282, "step": 81450 }, { "epoch": 0.88, "learning_rate": 7.379793096818955e-07, "loss": 22.067, "step": 81460 }, { "epoch": 0.88, "learning_rate": 7.366597695746347e-07, "loss": 21.2556, "step": 81470 }, { "epoch": 0.88, "learning_rate": 7.353413651066987e-07, "loss": 21.0247, "step": 81480 }, { "epoch": 0.88, "learning_rate": 7.34024096439715e-07, "loss": 22.4778, "step": 81490 }, { "epoch": 0.88, "learning_rate": 7.327079637351742e-07, "loss": 20.235, "step": 81500 }, { "epoch": 0.88, "learning_rate": 7.313929671544328e-07, "loss": 20.7838, "step": 81510 }, { "epoch": 0.88, "learning_rate": 7.300791068586954e-07, "loss": 20.6713, "step": 81520 }, { "epoch": 0.88, "learning_rate": 7.287663830090397e-07, "loss": 21.4424, "step": 81530 }, { "epoch": 0.88, "learning_rate": 7.274547957663968e-07, "loss": 20.8727, "step": 81540 }, { "epoch": 0.88, "learning_rate": 7.261443452915595e-07, "loss": 21.0738, "step": 81550 }, { "epoch": 0.88, "learning_rate": 7.24835031745188e-07, "loss": 21.303, "step": 81560 }, { "epoch": 0.88, "learning_rate": 7.235268552877917e-07, "loss": 21.6583, "step": 81570 }, { "epoch": 0.88, "learning_rate": 7.222198160797489e-07, "loss": 21.1339, "step": 81580 }, { "epoch": 0.88, "learning_rate": 7.20913914281296e-07, "loss": 21.4369, "step": 81590 }, { "epoch": 0.88, "learning_rate": 7.196091500525293e-07, "loss": 20.7862, "step": 81600 }, { "epoch": 0.88, "learning_rate": 7.183055235534098e-07, "loss": 21.5691, "step": 81610 }, { "epoch": 0.88, "learning_rate": 7.170030349437506e-07, "loss": 21.8516, "step": 81620 }, { "epoch": 0.88, "learning_rate": 7.157016843832343e-07, "loss": 21.2908, "step": 81630 }, { "epoch": 0.88, "learning_rate": 7.144014720313974e-07, "loss": 21.0561, "step": 81640 }, { "epoch": 0.88, "learning_rate": 7.131023980476381e-07, "loss": 21.1762, "step": 81650 }, { "epoch": 0.88, "learning_rate": 7.118044625912213e-07, "loss": 21.5337, "step": 81660 }, { "epoch": 0.88, "learning_rate": 7.105076658212662e-07, "loss": 20.9941, "step": 81670 }, { "epoch": 0.88, "learning_rate": 7.092120078967501e-07, "loss": 21.1291, "step": 81680 }, { "epoch": 0.88, "learning_rate": 7.079174889765162e-07, "loss": 21.2295, "step": 81690 }, { "epoch": 0.88, "learning_rate": 7.066241092192649e-07, "loss": 20.9369, "step": 81700 }, { "epoch": 0.88, "learning_rate": 7.053318687835619e-07, "loss": 20.8133, "step": 81710 }, { "epoch": 0.88, "learning_rate": 7.040407678278271e-07, "loss": 21.7088, "step": 81720 }, { "epoch": 0.88, "learning_rate": 7.027508065103428e-07, "loss": 22.2011, "step": 81730 }, { "epoch": 0.88, "learning_rate": 7.014619849892501e-07, "loss": 21.387, "step": 81740 }, { "epoch": 0.88, "learning_rate": 7.001743034225539e-07, "loss": 20.9739, "step": 81750 }, { "epoch": 0.88, "learning_rate": 6.988877619681179e-07, "loss": 21.2382, "step": 81760 }, { "epoch": 0.88, "learning_rate": 6.97602360783668e-07, "loss": 21.8172, "step": 81770 }, { "epoch": 0.88, "learning_rate": 6.963181000267827e-07, "loss": 20.7774, "step": 81780 }, { "epoch": 0.88, "learning_rate": 6.950349798549083e-07, "loss": 21.4163, "step": 81790 }, { "epoch": 0.88, "learning_rate": 6.93753000425349e-07, "loss": 20.5764, "step": 81800 }, { "epoch": 0.88, "learning_rate": 6.92472161895269e-07, "loss": 20.7585, "step": 81810 }, { "epoch": 0.88, "learning_rate": 6.91192464421695e-07, "loss": 21.7279, "step": 81820 }, { "epoch": 0.88, "learning_rate": 6.899139081615092e-07, "loss": 20.9813, "step": 81830 }, { "epoch": 0.88, "learning_rate": 6.886364932714563e-07, "loss": 21.19, "step": 81840 }, { "epoch": 0.88, "learning_rate": 6.873602199081386e-07, "loss": 21.2036, "step": 81850 }, { "epoch": 0.88, "learning_rate": 6.860850882280257e-07, "loss": 21.3227, "step": 81860 }, { "epoch": 0.89, "learning_rate": 6.848110983874401e-07, "loss": 20.699, "step": 81870 }, { "epoch": 0.89, "learning_rate": 6.835382505425681e-07, "loss": 21.0541, "step": 81880 }, { "epoch": 0.89, "learning_rate": 6.822665448494514e-07, "loss": 21.4582, "step": 81890 }, { "epoch": 0.89, "learning_rate": 6.809959814639955e-07, "loss": 21.7527, "step": 81900 }, { "epoch": 0.89, "learning_rate": 6.797265605419668e-07, "loss": 21.6859, "step": 81910 }, { "epoch": 0.89, "learning_rate": 6.784582822389896e-07, "loss": 21.3309, "step": 81920 }, { "epoch": 0.89, "learning_rate": 6.771911467105474e-07, "loss": 20.9922, "step": 81930 }, { "epoch": 0.89, "learning_rate": 6.759251541119882e-07, "loss": 20.6174, "step": 81940 }, { "epoch": 0.89, "learning_rate": 6.746603045985101e-07, "loss": 20.8406, "step": 81950 }, { "epoch": 0.89, "learning_rate": 6.733965983251822e-07, "loss": 21.2873, "step": 81960 }, { "epoch": 0.89, "learning_rate": 6.721340354469275e-07, "loss": 21.5988, "step": 81970 }, { "epoch": 0.89, "learning_rate": 6.708726161185286e-07, "loss": 21.1919, "step": 81980 }, { "epoch": 0.89, "learning_rate": 6.69612340494633e-07, "loss": 21.7354, "step": 81990 }, { "epoch": 0.89, "learning_rate": 6.683532087297384e-07, "loss": 20.8779, "step": 82000 }, { "epoch": 0.89, "learning_rate": 6.670952209782123e-07, "loss": 20.9311, "step": 82010 }, { "epoch": 0.89, "learning_rate": 6.658383773942767e-07, "loss": 20.954, "step": 82020 }, { "epoch": 0.89, "learning_rate": 6.645826781320141e-07, "loss": 21.2829, "step": 82030 }, { "epoch": 0.89, "learning_rate": 6.633281233453692e-07, "loss": 21.4627, "step": 82040 }, { "epoch": 0.89, "learning_rate": 6.620747131881377e-07, "loss": 21.2773, "step": 82050 }, { "epoch": 0.89, "learning_rate": 6.608224478139891e-07, "loss": 21.9358, "step": 82060 }, { "epoch": 0.89, "learning_rate": 6.595713273764404e-07, "loss": 21.0175, "step": 82070 }, { "epoch": 0.89, "learning_rate": 6.583213520288745e-07, "loss": 20.6878, "step": 82080 }, { "epoch": 0.89, "learning_rate": 6.57072521924531e-07, "loss": 21.1632, "step": 82090 }, { "epoch": 0.89, "learning_rate": 6.558248372165121e-07, "loss": 21.0082, "step": 82100 }, { "epoch": 0.89, "learning_rate": 6.545782980577742e-07, "loss": 20.9645, "step": 82110 }, { "epoch": 0.89, "learning_rate": 6.533329046011405e-07, "loss": 20.9764, "step": 82120 }, { "epoch": 0.89, "learning_rate": 6.520886569992879e-07, "loss": 21.0214, "step": 82130 }, { "epoch": 0.89, "learning_rate": 6.508455554047566e-07, "loss": 21.4292, "step": 82140 }, { "epoch": 0.89, "learning_rate": 6.496035999699445e-07, "loss": 20.9997, "step": 82150 }, { "epoch": 0.89, "learning_rate": 6.483627908471057e-07, "loss": 21.7617, "step": 82160 }, { "epoch": 0.89, "learning_rate": 6.471231281883605e-07, "loss": 21.4906, "step": 82170 }, { "epoch": 0.89, "learning_rate": 6.458846121456852e-07, "loss": 21.3827, "step": 82180 }, { "epoch": 0.89, "learning_rate": 6.446472428709161e-07, "loss": 21.6929, "step": 82190 }, { "epoch": 0.89, "learning_rate": 6.434110205157462e-07, "loss": 21.3449, "step": 82200 }, { "epoch": 0.89, "learning_rate": 6.421759452317322e-07, "loss": 20.9018, "step": 82210 }, { "epoch": 0.89, "learning_rate": 6.409420171702873e-07, "loss": 20.9121, "step": 82220 }, { "epoch": 0.89, "learning_rate": 6.397092364826851e-07, "loss": 22.1173, "step": 82230 }, { "epoch": 0.89, "learning_rate": 6.38477603320059e-07, "loss": 21.1079, "step": 82240 }, { "epoch": 0.89, "learning_rate": 6.372471178333995e-07, "loss": 21.6408, "step": 82250 }, { "epoch": 0.89, "learning_rate": 6.360177801735601e-07, "loss": 21.7043, "step": 82260 }, { "epoch": 0.89, "learning_rate": 6.347895904912493e-07, "loss": 21.7629, "step": 82270 }, { "epoch": 0.89, "learning_rate": 6.335625489370389e-07, "loss": 21.4363, "step": 82280 }, { "epoch": 0.89, "learning_rate": 6.323366556613574e-07, "loss": 21.2124, "step": 82290 }, { "epoch": 0.89, "learning_rate": 6.311119108144926e-07, "loss": 21.7842, "step": 82300 }, { "epoch": 0.89, "learning_rate": 6.298883145465929e-07, "loss": 21.5651, "step": 82310 }, { "epoch": 0.89, "learning_rate": 6.286658670076651e-07, "loss": 20.7178, "step": 82320 }, { "epoch": 0.89, "learning_rate": 6.274445683475738e-07, "loss": 21.2857, "step": 82330 }, { "epoch": 0.89, "learning_rate": 6.26224418716046e-07, "loss": 21.6423, "step": 82340 }, { "epoch": 0.89, "learning_rate": 6.250054182626652e-07, "loss": 20.797, "step": 82350 }, { "epoch": 0.89, "learning_rate": 6.237875671368742e-07, "loss": 21.7336, "step": 82360 }, { "epoch": 0.89, "learning_rate": 6.225708654879769e-07, "loss": 20.9343, "step": 82370 }, { "epoch": 0.89, "learning_rate": 6.213553134651329e-07, "loss": 20.7355, "step": 82380 }, { "epoch": 0.89, "learning_rate": 6.20140911217364e-07, "loss": 21.3412, "step": 82390 }, { "epoch": 0.89, "learning_rate": 6.1892765889355e-07, "loss": 21.4967, "step": 82400 }, { "epoch": 0.89, "learning_rate": 6.177155566424297e-07, "loss": 21.5304, "step": 82410 }, { "epoch": 0.89, "learning_rate": 6.165046046126e-07, "loss": 21.3255, "step": 82420 }, { "epoch": 0.89, "learning_rate": 6.152948029525186e-07, "loss": 22.0703, "step": 82430 }, { "epoch": 0.89, "learning_rate": 6.140861518105001e-07, "loss": 21.2213, "step": 82440 }, { "epoch": 0.89, "learning_rate": 6.128786513347196e-07, "loss": 20.7983, "step": 82450 }, { "epoch": 0.89, "learning_rate": 6.116723016732107e-07, "loss": 21.2724, "step": 82460 }, { "epoch": 0.89, "learning_rate": 6.104671029738651e-07, "loss": 20.0651, "step": 82470 }, { "epoch": 0.89, "learning_rate": 6.092630553844358e-07, "loss": 21.1661, "step": 82480 }, { "epoch": 0.89, "learning_rate": 6.080601590525314e-07, "loss": 21.1509, "step": 82490 }, { "epoch": 0.89, "learning_rate": 6.068584141256217e-07, "loss": 21.6576, "step": 82500 }, { "epoch": 0.89, "learning_rate": 6.056578207510344e-07, "loss": 21.0049, "step": 82510 }, { "epoch": 0.89, "learning_rate": 6.04458379075955e-07, "loss": 21.0109, "step": 82520 }, { "epoch": 0.89, "learning_rate": 6.032600892474339e-07, "loss": 21.5313, "step": 82530 }, { "epoch": 0.89, "learning_rate": 6.020629514123699e-07, "loss": 21.4822, "step": 82540 }, { "epoch": 0.89, "learning_rate": 6.008669657175292e-07, "loss": 21.9118, "step": 82550 }, { "epoch": 0.89, "learning_rate": 5.996721323095323e-07, "loss": 20.5901, "step": 82560 }, { "epoch": 0.89, "learning_rate": 5.984784513348585e-07, "loss": 20.8358, "step": 82570 }, { "epoch": 0.89, "learning_rate": 5.97285922939852e-07, "loss": 21.9273, "step": 82580 }, { "epoch": 0.89, "learning_rate": 5.960945472707069e-07, "loss": 20.5134, "step": 82590 }, { "epoch": 0.89, "learning_rate": 5.949043244734798e-07, "loss": 20.9091, "step": 82600 }, { "epoch": 0.89, "learning_rate": 5.937152546940872e-07, "loss": 21.161, "step": 82610 }, { "epoch": 0.89, "learning_rate": 5.925273380783014e-07, "loss": 20.7025, "step": 82620 }, { "epoch": 0.89, "learning_rate": 5.913405747717593e-07, "loss": 20.9944, "step": 82630 }, { "epoch": 0.89, "learning_rate": 5.901549649199501e-07, "loss": 21.1073, "step": 82640 }, { "epoch": 0.89, "learning_rate": 5.889705086682207e-07, "loss": 21.6103, "step": 82650 }, { "epoch": 0.89, "learning_rate": 5.877872061617828e-07, "loss": 21.1042, "step": 82660 }, { "epoch": 0.89, "learning_rate": 5.866050575457017e-07, "loss": 20.5958, "step": 82670 }, { "epoch": 0.89, "learning_rate": 5.854240629649044e-07, "loss": 20.7118, "step": 82680 }, { "epoch": 0.89, "learning_rate": 5.842442225641754e-07, "loss": 20.531, "step": 82690 }, { "epoch": 0.89, "learning_rate": 5.830655364881543e-07, "loss": 21.3883, "step": 82700 }, { "epoch": 0.89, "learning_rate": 5.818880048813447e-07, "loss": 21.4513, "step": 82710 }, { "epoch": 0.89, "learning_rate": 5.807116278881042e-07, "loss": 21.4956, "step": 82720 }, { "epoch": 0.89, "learning_rate": 5.795364056526531e-07, "loss": 21.271, "step": 82730 }, { "epoch": 0.89, "learning_rate": 5.783623383190673e-07, "loss": 21.5205, "step": 82740 }, { "epoch": 0.89, "learning_rate": 5.771894260312794e-07, "loss": 20.9097, "step": 82750 }, { "epoch": 0.89, "learning_rate": 5.760176689330855e-07, "loss": 21.2033, "step": 82760 }, { "epoch": 0.89, "learning_rate": 5.748470671681328e-07, "loss": 21.0612, "step": 82770 }, { "epoch": 0.89, "learning_rate": 5.736776208799356e-07, "loss": 20.151, "step": 82780 }, { "epoch": 0.9, "learning_rate": 5.725093302118611e-07, "loss": 21.2285, "step": 82790 }, { "epoch": 0.9, "learning_rate": 5.713421953071374e-07, "loss": 21.4318, "step": 82800 }, { "epoch": 0.9, "learning_rate": 5.701762163088465e-07, "loss": 21.3457, "step": 82810 }, { "epoch": 0.9, "learning_rate": 5.690113933599306e-07, "loss": 21.6928, "step": 82820 }, { "epoch": 0.9, "learning_rate": 5.678477266031945e-07, "loss": 20.8863, "step": 82830 }, { "epoch": 0.9, "learning_rate": 5.666852161812974e-07, "loss": 21.0327, "step": 82840 }, { "epoch": 0.9, "learning_rate": 5.655238622367575e-07, "loss": 20.9734, "step": 82850 }, { "epoch": 0.9, "learning_rate": 5.643636649119489e-07, "loss": 21.3724, "step": 82860 }, { "epoch": 0.9, "learning_rate": 5.632046243491063e-07, "loss": 21.0127, "step": 82870 }, { "epoch": 0.9, "learning_rate": 5.62046740690324e-07, "loss": 21.463, "step": 82880 }, { "epoch": 0.9, "learning_rate": 5.60890014077552e-07, "loss": 20.8924, "step": 82890 }, { "epoch": 0.9, "learning_rate": 5.597344446525998e-07, "loss": 20.7995, "step": 82900 }, { "epoch": 0.9, "learning_rate": 5.585800325571345e-07, "loss": 21.0008, "step": 82910 }, { "epoch": 0.9, "learning_rate": 5.57426777932678e-07, "loss": 21.8507, "step": 82920 }, { "epoch": 0.9, "learning_rate": 5.562746809206177e-07, "loss": 21.3612, "step": 82930 }, { "epoch": 0.9, "learning_rate": 5.551237416621936e-07, "loss": 20.8355, "step": 82940 }, { "epoch": 0.9, "learning_rate": 5.53973960298505e-07, "loss": 21.0969, "step": 82950 }, { "epoch": 0.9, "learning_rate": 5.528253369705106e-07, "loss": 21.5271, "step": 82960 }, { "epoch": 0.9, "learning_rate": 5.516778718190208e-07, "loss": 20.4838, "step": 82970 }, { "epoch": 0.9, "learning_rate": 5.505315649847154e-07, "loss": 20.7384, "step": 82980 }, { "epoch": 0.9, "learning_rate": 5.493864166081231e-07, "loss": 21.1528, "step": 82990 }, { "epoch": 0.9, "learning_rate": 5.482424268296338e-07, "loss": 20.5791, "step": 83000 }, { "epoch": 0.9, "learning_rate": 5.470995957894965e-07, "loss": 21.0027, "step": 83010 }, { "epoch": 0.9, "learning_rate": 5.459579236278112e-07, "loss": 21.2314, "step": 83020 }, { "epoch": 0.9, "learning_rate": 5.448174104845472e-07, "loss": 21.3134, "step": 83030 }, { "epoch": 0.9, "learning_rate": 5.436780564995237e-07, "loss": 21.0744, "step": 83040 }, { "epoch": 0.9, "learning_rate": 5.425398618124189e-07, "loss": 21.6781, "step": 83050 }, { "epoch": 0.9, "learning_rate": 5.414028265627702e-07, "loss": 21.2666, "step": 83060 }, { "epoch": 0.9, "learning_rate": 5.402669508899728e-07, "loss": 20.5447, "step": 83070 }, { "epoch": 0.9, "learning_rate": 5.391322349332806e-07, "loss": 22.3639, "step": 83080 }, { "epoch": 0.9, "learning_rate": 5.379986788318014e-07, "loss": 21.5146, "step": 83090 }, { "epoch": 0.9, "learning_rate": 5.368662827245053e-07, "loss": 21.0865, "step": 83100 }, { "epoch": 0.9, "learning_rate": 5.357350467502187e-07, "loss": 20.3518, "step": 83110 }, { "epoch": 0.9, "learning_rate": 5.346049710476242e-07, "loss": 20.6528, "step": 83120 }, { "epoch": 0.9, "learning_rate": 5.334760557552643e-07, "loss": 21.6426, "step": 83130 }, { "epoch": 0.9, "learning_rate": 5.323483010115382e-07, "loss": 21.4226, "step": 83140 }, { "epoch": 0.9, "learning_rate": 5.312217069547032e-07, "loss": 21.1919, "step": 83150 }, { "epoch": 0.9, "learning_rate": 5.300962737228732e-07, "loss": 21.3557, "step": 83160 }, { "epoch": 0.9, "learning_rate": 5.289720014540223e-07, "loss": 21.5062, "step": 83170 }, { "epoch": 0.9, "learning_rate": 5.27848890285979e-07, "loss": 21.2346, "step": 83180 }, { "epoch": 0.9, "learning_rate": 5.267269403564324e-07, "loss": 22.0704, "step": 83190 }, { "epoch": 0.9, "learning_rate": 5.256061518029276e-07, "loss": 21.3676, "step": 83200 }, { "epoch": 0.9, "learning_rate": 5.244865247628673e-07, "loss": 21.7875, "step": 83210 }, { "epoch": 0.9, "learning_rate": 5.233680593735124e-07, "loss": 21.2785, "step": 83220 }, { "epoch": 0.9, "learning_rate": 5.222507557719813e-07, "loss": 20.8077, "step": 83230 }, { "epoch": 0.9, "learning_rate": 5.2113461409525e-07, "loss": 21.0617, "step": 83240 }, { "epoch": 0.9, "learning_rate": 5.200196344801522e-07, "loss": 20.9776, "step": 83250 }, { "epoch": 0.9, "learning_rate": 5.189058170633776e-07, "loss": 21.512, "step": 83260 }, { "epoch": 0.9, "learning_rate": 5.177931619814758e-07, "loss": 21.4637, "step": 83270 }, { "epoch": 0.9, "learning_rate": 5.16681669370852e-07, "loss": 20.4573, "step": 83280 }, { "epoch": 0.9, "learning_rate": 5.155713393677697e-07, "loss": 20.2957, "step": 83290 }, { "epoch": 0.9, "learning_rate": 5.144621721083509e-07, "loss": 20.5157, "step": 83300 }, { "epoch": 0.9, "learning_rate": 5.133541677285736e-07, "loss": 21.5811, "step": 83310 }, { "epoch": 0.9, "learning_rate": 5.122473263642724e-07, "loss": 21.0872, "step": 83320 }, { "epoch": 0.9, "learning_rate": 5.111416481511411e-07, "loss": 21.5686, "step": 83330 }, { "epoch": 0.9, "learning_rate": 5.100371332247312e-07, "loss": 20.8045, "step": 83340 }, { "epoch": 0.9, "learning_rate": 5.089337817204499e-07, "loss": 20.7589, "step": 83350 }, { "epoch": 0.9, "learning_rate": 5.078315937735634e-07, "loss": 20.8196, "step": 83360 }, { "epoch": 0.9, "learning_rate": 5.067305695191926e-07, "loss": 21.6867, "step": 83370 }, { "epoch": 0.9, "learning_rate": 5.056307090923208e-07, "loss": 20.9963, "step": 83380 }, { "epoch": 0.9, "learning_rate": 5.045320126277819e-07, "loss": 21.1541, "step": 83390 }, { "epoch": 0.9, "learning_rate": 5.03434480260272e-07, "loss": 21.3879, "step": 83400 }, { "epoch": 0.9, "learning_rate": 5.023381121243442e-07, "loss": 21.5415, "step": 83410 }, { "epoch": 0.9, "learning_rate": 5.012429083544068e-07, "loss": 20.9266, "step": 83420 }, { "epoch": 0.9, "learning_rate": 5.001488690847255e-07, "loss": 21.0421, "step": 83430 }, { "epoch": 0.9, "learning_rate": 4.990559944494256e-07, "loss": 22.1288, "step": 83440 }, { "epoch": 0.9, "learning_rate": 4.979642845824873e-07, "loss": 20.9553, "step": 83450 }, { "epoch": 0.9, "learning_rate": 4.968737396177492e-07, "loss": 20.8658, "step": 83460 }, { "epoch": 0.9, "learning_rate": 4.957843596889055e-07, "loss": 20.9049, "step": 83470 }, { "epoch": 0.9, "learning_rate": 4.946961449295096e-07, "loss": 21.549, "step": 83480 }, { "epoch": 0.9, "learning_rate": 4.936090954729699e-07, "loss": 21.3675, "step": 83490 }, { "epoch": 0.9, "learning_rate": 4.92523211452558e-07, "loss": 20.5072, "step": 83500 }, { "epoch": 0.9, "learning_rate": 4.914384930013927e-07, "loss": 21.4733, "step": 83510 }, { "epoch": 0.9, "learning_rate": 4.903549402524566e-07, "loss": 20.7269, "step": 83520 }, { "epoch": 0.9, "learning_rate": 4.892725533385889e-07, "loss": 21.3744, "step": 83530 }, { "epoch": 0.9, "learning_rate": 4.881913323924814e-07, "loss": 20.139, "step": 83540 }, { "epoch": 0.9, "learning_rate": 4.871112775466924e-07, "loss": 20.8699, "step": 83550 }, { "epoch": 0.9, "learning_rate": 4.86032388933626e-07, "loss": 21.3552, "step": 83560 }, { "epoch": 0.9, "learning_rate": 4.849546666855509e-07, "loss": 21.3769, "step": 83570 }, { "epoch": 0.9, "learning_rate": 4.838781109345903e-07, "loss": 21.8103, "step": 83580 }, { "epoch": 0.9, "learning_rate": 4.828027218127218e-07, "loss": 21.1041, "step": 83590 }, { "epoch": 0.9, "learning_rate": 4.817284994517867e-07, "loss": 21.1059, "step": 83600 }, { "epoch": 0.9, "learning_rate": 4.806554439834798e-07, "loss": 21.7584, "step": 83610 }, { "epoch": 0.9, "learning_rate": 4.795835555393491e-07, "loss": 21.2485, "step": 83620 }, { "epoch": 0.9, "learning_rate": 4.785128342508028e-07, "loss": 21.1451, "step": 83630 }, { "epoch": 0.9, "learning_rate": 4.774432802491069e-07, "loss": 21.9894, "step": 83640 }, { "epoch": 0.9, "learning_rate": 4.763748936653845e-07, "loss": 21.5462, "step": 83650 }, { "epoch": 0.9, "learning_rate": 4.753076746306151e-07, "loss": 20.9561, "step": 83660 }, { "epoch": 0.9, "learning_rate": 4.7424162327563193e-07, "loss": 21.5059, "step": 83670 }, { "epoch": 0.9, "learning_rate": 4.731767397311282e-07, "loss": 20.4449, "step": 83680 }, { "epoch": 0.9, "learning_rate": 4.721130241276528e-07, "loss": 20.3429, "step": 83690 }, { "epoch": 0.9, "learning_rate": 4.7105047659561367e-07, "loss": 20.6246, "step": 83700 }, { "epoch": 0.9, "learning_rate": 4.699890972652754e-07, "loss": 20.8458, "step": 83710 }, { "epoch": 0.91, "learning_rate": 4.6892888626675406e-07, "loss": 21.4133, "step": 83720 }, { "epoch": 0.91, "learning_rate": 4.6786984373002665e-07, "loss": 20.8761, "step": 83730 }, { "epoch": 0.91, "learning_rate": 4.6681196978492715e-07, "loss": 20.4007, "step": 83740 }, { "epoch": 0.91, "learning_rate": 4.657552645611463e-07, "loss": 21.1134, "step": 83750 }, { "epoch": 0.91, "learning_rate": 4.646997281882315e-07, "loss": 21.404, "step": 83760 }, { "epoch": 0.91, "learning_rate": 4.6364536079558597e-07, "loss": 22.4068, "step": 83770 }, { "epoch": 0.91, "learning_rate": 4.625921625124685e-07, "loss": 20.9821, "step": 83780 }, { "epoch": 0.91, "learning_rate": 4.6154013346799475e-07, "loss": 21.4091, "step": 83790 }, { "epoch": 0.91, "learning_rate": 4.604892737911415e-07, "loss": 19.8704, "step": 83800 }, { "epoch": 0.91, "learning_rate": 4.594395836107379e-07, "loss": 21.6811, "step": 83810 }, { "epoch": 0.91, "learning_rate": 4.583910630554722e-07, "loss": 21.5195, "step": 83820 }, { "epoch": 0.91, "learning_rate": 4.5734371225388485e-07, "loss": 20.9839, "step": 83830 }, { "epoch": 0.91, "learning_rate": 4.5629753133437427e-07, "loss": 21.0413, "step": 83840 }, { "epoch": 0.91, "learning_rate": 4.5525252042520227e-07, "loss": 20.8658, "step": 83850 }, { "epoch": 0.91, "learning_rate": 4.5420867965447977e-07, "loss": 21.2638, "step": 83860 }, { "epoch": 0.91, "learning_rate": 4.531660091501755e-07, "loss": 21.1856, "step": 83870 }, { "epoch": 0.91, "learning_rate": 4.521245090401172e-07, "loss": 21.4579, "step": 83880 }, { "epoch": 0.91, "learning_rate": 4.510841794519838e-07, "loss": 21.3515, "step": 83890 }, { "epoch": 0.91, "learning_rate": 4.5004502051332e-07, "loss": 20.7875, "step": 83900 }, { "epoch": 0.91, "learning_rate": 4.490070323515183e-07, "loss": 20.8398, "step": 83910 }, { "epoch": 0.91, "learning_rate": 4.4797021509383144e-07, "loss": 21.5543, "step": 83920 }, { "epoch": 0.91, "learning_rate": 4.4693456886736983e-07, "loss": 21.651, "step": 83930 }, { "epoch": 0.91, "learning_rate": 4.4590009379909317e-07, "loss": 21.06, "step": 83940 }, { "epoch": 0.91, "learning_rate": 4.4486679001582876e-07, "loss": 20.8948, "step": 83950 }, { "epoch": 0.91, "learning_rate": 4.43834657644252e-07, "loss": 21.4054, "step": 83960 }, { "epoch": 0.91, "learning_rate": 4.428036968108973e-07, "loss": 21.3364, "step": 83970 }, { "epoch": 0.91, "learning_rate": 4.4177390764215675e-07, "loss": 21.1448, "step": 83980 }, { "epoch": 0.91, "learning_rate": 4.4074529026427395e-07, "loss": 21.5522, "step": 83990 }, { "epoch": 0.91, "learning_rate": 4.397178448033557e-07, "loss": 20.4595, "step": 84000 }, { "epoch": 0.91, "learning_rate": 4.3869157138536013e-07, "loss": 21.4237, "step": 84010 }, { "epoch": 0.91, "learning_rate": 4.376664701361044e-07, "loss": 21.0775, "step": 84020 }, { "epoch": 0.91, "learning_rate": 4.3664254118125915e-07, "loss": 21.6527, "step": 84030 }, { "epoch": 0.91, "learning_rate": 4.356197846463539e-07, "loss": 21.7031, "step": 84040 }, { "epoch": 0.91, "learning_rate": 4.3459820065677285e-07, "loss": 21.1408, "step": 84050 }, { "epoch": 0.91, "learning_rate": 4.3357778933775796e-07, "loss": 20.5975, "step": 84060 }, { "epoch": 0.91, "learning_rate": 4.325585508144059e-07, "loss": 21.2872, "step": 84070 }, { "epoch": 0.91, "learning_rate": 4.315404852116711e-07, "loss": 21.2084, "step": 84080 }, { "epoch": 0.91, "learning_rate": 4.3052359265436273e-07, "loss": 21.2318, "step": 84090 }, { "epoch": 0.91, "learning_rate": 4.295078732671465e-07, "loss": 21.1889, "step": 84100 }, { "epoch": 0.91, "learning_rate": 4.2849332717454505e-07, "loss": 20.9931, "step": 84110 }, { "epoch": 0.91, "learning_rate": 4.274799545009367e-07, "loss": 21.4949, "step": 84120 }, { "epoch": 0.91, "learning_rate": 4.264677553705554e-07, "loss": 20.084, "step": 84130 }, { "epoch": 0.91, "learning_rate": 4.254567299074919e-07, "loss": 20.9215, "step": 84140 }, { "epoch": 0.91, "learning_rate": 4.2444687823569255e-07, "loss": 21.6813, "step": 84150 }, { "epoch": 0.91, "learning_rate": 4.234382004789617e-07, "loss": 22.1443, "step": 84160 }, { "epoch": 0.91, "learning_rate": 4.224306967609559e-07, "loss": 21.5218, "step": 84170 }, { "epoch": 0.91, "learning_rate": 4.2142436720519096e-07, "loss": 20.9367, "step": 84180 }, { "epoch": 0.91, "learning_rate": 4.204192119350392e-07, "loss": 20.5426, "step": 84190 }, { "epoch": 0.91, "learning_rate": 4.194152310737265e-07, "loss": 21.7369, "step": 84200 }, { "epoch": 0.91, "learning_rate": 4.184124247443355e-07, "loss": 20.8902, "step": 84210 }, { "epoch": 0.91, "learning_rate": 4.174107930698057e-07, "loss": 20.4436, "step": 84220 }, { "epoch": 0.91, "learning_rate": 4.1641033617293216e-07, "loss": 20.7664, "step": 84230 }, { "epoch": 0.91, "learning_rate": 4.1541105417636565e-07, "loss": 20.769, "step": 84240 }, { "epoch": 0.91, "learning_rate": 4.1441294720261373e-07, "loss": 20.8261, "step": 84250 }, { "epoch": 0.91, "learning_rate": 4.1341601537403964e-07, "loss": 21.888, "step": 84260 }, { "epoch": 0.91, "learning_rate": 4.1242025881286117e-07, "loss": 21.6201, "step": 84270 }, { "epoch": 0.91, "learning_rate": 4.1142567764115403e-07, "loss": 21.4662, "step": 84280 }, { "epoch": 0.91, "learning_rate": 4.1043227198084735e-07, "loss": 20.9667, "step": 84290 }, { "epoch": 0.91, "learning_rate": 4.094400419537292e-07, "loss": 21.434, "step": 84300 }, { "epoch": 0.91, "learning_rate": 4.0844898768144236e-07, "loss": 21.2133, "step": 84310 }, { "epoch": 0.91, "learning_rate": 4.0745910928548406e-07, "loss": 21.4195, "step": 84320 }, { "epoch": 0.91, "learning_rate": 4.064704068872094e-07, "loss": 20.2755, "step": 84330 }, { "epoch": 0.91, "learning_rate": 4.0548288060782705e-07, "loss": 21.764, "step": 84340 }, { "epoch": 0.91, "learning_rate": 4.0449653056840343e-07, "loss": 21.5518, "step": 84350 }, { "epoch": 0.91, "learning_rate": 4.0351135688986077e-07, "loss": 20.3282, "step": 84360 }, { "epoch": 0.91, "learning_rate": 4.0252735969297575e-07, "loss": 21.5418, "step": 84370 }, { "epoch": 0.91, "learning_rate": 4.0154453909838185e-07, "loss": 21.6698, "step": 84380 }, { "epoch": 0.91, "learning_rate": 4.0056289522656834e-07, "loss": 21.3155, "step": 84390 }, { "epoch": 0.91, "learning_rate": 3.9958242819787886e-07, "loss": 20.5675, "step": 84400 }, { "epoch": 0.91, "learning_rate": 3.9860313813251395e-07, "loss": 21.2871, "step": 84410 }, { "epoch": 0.91, "learning_rate": 3.9762502515053094e-07, "loss": 20.9562, "step": 84420 }, { "epoch": 0.91, "learning_rate": 3.966480893718394e-07, "loss": 21.5289, "step": 84430 }, { "epoch": 0.91, "learning_rate": 3.9567233091620915e-07, "loss": 20.7275, "step": 84440 }, { "epoch": 0.91, "learning_rate": 3.9469774990326227e-07, "loss": 21.012, "step": 84450 }, { "epoch": 0.91, "learning_rate": 3.9372434645247536e-07, "loss": 21.7538, "step": 84460 }, { "epoch": 0.91, "learning_rate": 3.927521206831886e-07, "loss": 20.8048, "step": 84470 }, { "epoch": 0.91, "learning_rate": 3.9178107271458654e-07, "loss": 21.0696, "step": 84480 }, { "epoch": 0.91, "learning_rate": 3.9081120266571624e-07, "loss": 21.2883, "step": 84490 }, { "epoch": 0.91, "learning_rate": 3.898425106554804e-07, "loss": 22.1904, "step": 84500 }, { "epoch": 0.91, "learning_rate": 3.8887499680263284e-07, "loss": 21.0185, "step": 84510 }, { "epoch": 0.91, "learning_rate": 3.87908661225791e-07, "loss": 20.8367, "step": 84520 }, { "epoch": 0.91, "learning_rate": 3.8694350404341775e-07, "loss": 21.415, "step": 84530 }, { "epoch": 0.91, "learning_rate": 3.859795253738385e-07, "loss": 21.0301, "step": 84540 }, { "epoch": 0.91, "learning_rate": 3.8501672533523327e-07, "loss": 21.6296, "step": 84550 }, { "epoch": 0.91, "learning_rate": 3.8405510404563304e-07, "loss": 21.2358, "step": 84560 }, { "epoch": 0.91, "learning_rate": 3.8309466162293253e-07, "loss": 20.3475, "step": 84570 }, { "epoch": 0.91, "learning_rate": 3.821353981848752e-07, "loss": 21.1792, "step": 84580 }, { "epoch": 0.91, "learning_rate": 3.8117731384906045e-07, "loss": 20.8973, "step": 84590 }, { "epoch": 0.91, "learning_rate": 3.802204087329464e-07, "loss": 20.7337, "step": 84600 }, { "epoch": 0.91, "learning_rate": 3.7926468295384265e-07, "loss": 21.4314, "step": 84610 }, { "epoch": 0.91, "learning_rate": 3.783101366289199e-07, "loss": 20.9052, "step": 84620 }, { "epoch": 0.91, "learning_rate": 3.773567698752001e-07, "loss": 21.4573, "step": 84630 }, { "epoch": 0.92, "learning_rate": 3.7640458280955863e-07, "loss": 20.7154, "step": 84640 }, { "epoch": 0.92, "learning_rate": 3.7545357554872985e-07, "loss": 20.0743, "step": 84650 }, { "epoch": 0.92, "learning_rate": 3.745037482093028e-07, "loss": 20.9285, "step": 84660 }, { "epoch": 0.92, "learning_rate": 3.7355510090772204e-07, "loss": 21.1116, "step": 84670 }, { "epoch": 0.92, "learning_rate": 3.72607633760288e-07, "loss": 21.3081, "step": 84680 }, { "epoch": 0.92, "learning_rate": 3.716613468831531e-07, "loss": 21.5522, "step": 84690 }, { "epoch": 0.92, "learning_rate": 3.7071624039232924e-07, "loss": 21.2257, "step": 84700 }, { "epoch": 0.92, "learning_rate": 3.697723144036791e-07, "loss": 20.9073, "step": 84710 }, { "epoch": 0.92, "learning_rate": 3.688295690329269e-07, "loss": 21.205, "step": 84720 }, { "epoch": 0.92, "learning_rate": 3.6788800439564677e-07, "loss": 20.5513, "step": 84730 }, { "epoch": 0.92, "learning_rate": 3.6694762060727083e-07, "loss": 21.316, "step": 84740 }, { "epoch": 0.92, "learning_rate": 3.660084177830825e-07, "loss": 21.257, "step": 84750 }, { "epoch": 0.92, "learning_rate": 3.6507039603822515e-07, "loss": 21.7202, "step": 84760 }, { "epoch": 0.92, "learning_rate": 3.641335554876968e-07, "loss": 21.0098, "step": 84770 }, { "epoch": 0.92, "learning_rate": 3.6319789624634785e-07, "loss": 21.4665, "step": 84780 }, { "epoch": 0.92, "learning_rate": 3.622634184288876e-07, "loss": 21.8559, "step": 84790 }, { "epoch": 0.92, "learning_rate": 3.6133012214987664e-07, "loss": 21.3024, "step": 84800 }, { "epoch": 0.92, "learning_rate": 3.603980075237301e-07, "loss": 21.9414, "step": 84810 }, { "epoch": 0.92, "learning_rate": 3.594670746647244e-07, "loss": 20.6575, "step": 84820 }, { "epoch": 0.92, "learning_rate": 3.5853732368698603e-07, "loss": 21.5462, "step": 84830 }, { "epoch": 0.92, "learning_rate": 3.576087547044982e-07, "loss": 21.9685, "step": 84840 }, { "epoch": 0.92, "learning_rate": 3.5668136783109875e-07, "loss": 21.0481, "step": 84850 }, { "epoch": 0.92, "learning_rate": 3.55755163180479e-07, "loss": 22.1788, "step": 84860 }, { "epoch": 0.92, "learning_rate": 3.5483014086618805e-07, "loss": 21.1947, "step": 84870 }, { "epoch": 0.92, "learning_rate": 3.539063010016308e-07, "loss": 21.1588, "step": 84880 }, { "epoch": 0.92, "learning_rate": 3.529836437000633e-07, "loss": 21.807, "step": 84890 }, { "epoch": 0.92, "learning_rate": 3.5206216907460065e-07, "loss": 21.1173, "step": 84900 }, { "epoch": 0.92, "learning_rate": 3.5114187723820693e-07, "loss": 20.7482, "step": 84910 }, { "epoch": 0.92, "learning_rate": 3.502227683037096e-07, "loss": 22.0113, "step": 84920 }, { "epoch": 0.92, "learning_rate": 3.4930484238378525e-07, "loss": 20.5861, "step": 84930 }, { "epoch": 0.92, "learning_rate": 3.483880995909672e-07, "loss": 21.2353, "step": 84940 }, { "epoch": 0.92, "learning_rate": 3.474725400376444e-07, "loss": 21.3657, "step": 84950 }, { "epoch": 0.92, "learning_rate": 3.465581638360571e-07, "loss": 21.6333, "step": 84960 }, { "epoch": 0.92, "learning_rate": 3.4564497109830675e-07, "loss": 20.9282, "step": 84970 }, { "epoch": 0.92, "learning_rate": 3.4473296193634377e-07, "loss": 21.4661, "step": 84980 }, { "epoch": 0.92, "learning_rate": 3.438221364619776e-07, "loss": 21.2225, "step": 84990 }, { "epoch": 0.92, "learning_rate": 3.429124947868689e-07, "loss": 21.8621, "step": 85000 }, { "epoch": 0.92, "learning_rate": 3.420040370225375e-07, "loss": 21.4009, "step": 85010 }, { "epoch": 0.92, "learning_rate": 3.410967632803541e-07, "loss": 21.186, "step": 85020 }, { "epoch": 0.92, "learning_rate": 3.4019067367154655e-07, "loss": 20.9928, "step": 85030 }, { "epoch": 0.92, "learning_rate": 3.3928576830719706e-07, "loss": 21.8735, "step": 85040 }, { "epoch": 0.92, "learning_rate": 3.383820472982424e-07, "loss": 21.6398, "step": 85050 }, { "epoch": 0.92, "learning_rate": 3.3747951075547403e-07, "loss": 20.8741, "step": 85060 }, { "epoch": 0.92, "learning_rate": 3.3657815878953784e-07, "loss": 21.7031, "step": 85070 }, { "epoch": 0.92, "learning_rate": 3.356779915109365e-07, "loss": 21.2312, "step": 85080 }, { "epoch": 0.92, "learning_rate": 3.3477900903002625e-07, "loss": 21.3932, "step": 85090 }, { "epoch": 0.92, "learning_rate": 3.338812114570156e-07, "loss": 20.8982, "step": 85100 }, { "epoch": 0.92, "learning_rate": 3.32984598901972e-07, "loss": 21.0077, "step": 85110 }, { "epoch": 0.92, "learning_rate": 3.3208917147481534e-07, "loss": 21.3033, "step": 85120 }, { "epoch": 0.92, "learning_rate": 3.3119492928532006e-07, "loss": 22.2693, "step": 85130 }, { "epoch": 0.92, "learning_rate": 3.303018724431162e-07, "loss": 21.5865, "step": 85140 }, { "epoch": 0.92, "learning_rate": 3.294100010576884e-07, "loss": 21.0285, "step": 85150 }, { "epoch": 0.92, "learning_rate": 3.2851931523837475e-07, "loss": 22.2465, "step": 85160 }, { "epoch": 0.92, "learning_rate": 3.276298150943691e-07, "loss": 20.8085, "step": 85170 }, { "epoch": 0.92, "learning_rate": 3.267415007347197e-07, "loss": 21.7513, "step": 85180 }, { "epoch": 0.92, "learning_rate": 3.258543722683305e-07, "loss": 21.3127, "step": 85190 }, { "epoch": 0.92, "learning_rate": 3.2496842980395793e-07, "loss": 21.4946, "step": 85200 }, { "epoch": 0.92, "learning_rate": 3.2408367345021507e-07, "loss": 22.0829, "step": 85210 }, { "epoch": 0.92, "learning_rate": 3.232001033155674e-07, "loss": 21.4212, "step": 85220 }, { "epoch": 0.92, "learning_rate": 3.22317719508336e-07, "loss": 20.5227, "step": 85230 }, { "epoch": 0.92, "learning_rate": 3.2143652213669887e-07, "loss": 21.7506, "step": 85240 }, { "epoch": 0.92, "learning_rate": 3.205565113086839e-07, "loss": 20.9625, "step": 85250 }, { "epoch": 0.92, "learning_rate": 3.1967768713217826e-07, "loss": 21.2835, "step": 85260 }, { "epoch": 0.92, "learning_rate": 3.188000497149191e-07, "loss": 20.9822, "step": 85270 }, { "epoch": 0.92, "learning_rate": 3.1792359916450355e-07, "loss": 21.0766, "step": 85280 }, { "epoch": 0.92, "learning_rate": 3.1704833558837687e-07, "loss": 21.7063, "step": 85290 }, { "epoch": 0.92, "learning_rate": 3.1617425909384436e-07, "loss": 20.9406, "step": 85300 }, { "epoch": 0.92, "learning_rate": 3.1530136978806136e-07, "loss": 20.6376, "step": 85310 }, { "epoch": 0.92, "learning_rate": 3.1442966777804005e-07, "loss": 22.1442, "step": 85320 }, { "epoch": 0.92, "learning_rate": 3.1355915317064946e-07, "loss": 20.8773, "step": 85330 }, { "epoch": 0.92, "learning_rate": 3.1268982607260854e-07, "loss": 21.2686, "step": 85340 }, { "epoch": 0.92, "learning_rate": 3.1182168659049104e-07, "loss": 21.4069, "step": 85350 }, { "epoch": 0.92, "learning_rate": 3.1095473483072733e-07, "loss": 21.6717, "step": 85360 }, { "epoch": 0.92, "learning_rate": 3.100889708996024e-07, "loss": 21.4274, "step": 85370 }, { "epoch": 0.92, "learning_rate": 3.092243949032547e-07, "loss": 20.9694, "step": 85380 }, { "epoch": 0.92, "learning_rate": 3.083610069476761e-07, "loss": 21.5008, "step": 85390 }, { "epoch": 0.92, "learning_rate": 3.0749880713871306e-07, "loss": 20.7585, "step": 85400 }, { "epoch": 0.92, "learning_rate": 3.0663779558206764e-07, "loss": 21.0721, "step": 85410 }, { "epoch": 0.92, "learning_rate": 3.057779723832954e-07, "loss": 20.6463, "step": 85420 }, { "epoch": 0.92, "learning_rate": 3.0491933764780766e-07, "loss": 21.3296, "step": 85430 }, { "epoch": 0.92, "learning_rate": 3.04061891480868e-07, "loss": 20.9117, "step": 85440 }, { "epoch": 0.92, "learning_rate": 3.0320563398759437e-07, "loss": 21.1276, "step": 85450 }, { "epoch": 0.92, "learning_rate": 3.023505652729597e-07, "loss": 21.4729, "step": 85460 }, { "epoch": 0.92, "learning_rate": 3.014966854417911e-07, "loss": 21.4083, "step": 85470 }, { "epoch": 0.92, "learning_rate": 3.0064399459877157e-07, "loss": 21.6182, "step": 85480 }, { "epoch": 0.92, "learning_rate": 2.9979249284843526e-07, "loss": 21.374, "step": 85490 }, { "epoch": 0.92, "learning_rate": 2.9894218029517306e-07, "loss": 21.2122, "step": 85500 }, { "epoch": 0.92, "learning_rate": 2.9809305704322723e-07, "loss": 21.1782, "step": 85510 }, { "epoch": 0.92, "learning_rate": 2.9724512319669665e-07, "loss": 20.7008, "step": 85520 }, { "epoch": 0.92, "learning_rate": 2.963983788595348e-07, "loss": 21.9668, "step": 85530 }, { "epoch": 0.92, "learning_rate": 2.9555282413554766e-07, "loss": 20.8316, "step": 85540 }, { "epoch": 0.92, "learning_rate": 2.9470845912839775e-07, "loss": 20.8628, "step": 85550 }, { "epoch": 0.92, "learning_rate": 2.9386528394159784e-07, "loss": 20.954, "step": 85560 }, { "epoch": 0.93, "learning_rate": 2.9302329867851644e-07, "loss": 21.2072, "step": 85570 }, { "epoch": 0.93, "learning_rate": 2.9218250344237756e-07, "loss": 21.0962, "step": 85580 }, { "epoch": 0.93, "learning_rate": 2.9134289833625984e-07, "loss": 21.2224, "step": 85590 }, { "epoch": 0.93, "learning_rate": 2.9050448346309544e-07, "loss": 21.5393, "step": 85600 }, { "epoch": 0.93, "learning_rate": 2.896672589256655e-07, "loss": 21.3461, "step": 85610 }, { "epoch": 0.93, "learning_rate": 2.888312248266134e-07, "loss": 21.0689, "step": 85620 }, { "epoch": 0.93, "learning_rate": 2.8799638126843055e-07, "loss": 20.5519, "step": 85630 }, { "epoch": 0.93, "learning_rate": 2.8716272835346614e-07, "loss": 21.4763, "step": 85640 }, { "epoch": 0.93, "learning_rate": 2.863302661839218e-07, "loss": 20.8407, "step": 85650 }, { "epoch": 0.93, "learning_rate": 2.854989948618525e-07, "loss": 21.2117, "step": 85660 }, { "epoch": 0.93, "learning_rate": 2.846689144891679e-07, "loss": 21.9781, "step": 85670 }, { "epoch": 0.93, "learning_rate": 2.8384002516763096e-07, "loss": 20.556, "step": 85680 }, { "epoch": 0.93, "learning_rate": 2.830123269988616e-07, "loss": 21.0059, "step": 85690 }, { "epoch": 0.93, "learning_rate": 2.821858200843308e-07, "loss": 21.6609, "step": 85700 }, { "epoch": 0.93, "learning_rate": 2.8136050452536425e-07, "loss": 20.871, "step": 85710 }, { "epoch": 0.93, "learning_rate": 2.805363804231398e-07, "loss": 20.4891, "step": 85720 }, { "epoch": 0.93, "learning_rate": 2.7971344787869114e-07, "loss": 21.2351, "step": 85730 }, { "epoch": 0.93, "learning_rate": 2.7889170699290867e-07, "loss": 21.4914, "step": 85740 }, { "epoch": 0.93, "learning_rate": 2.780711578665307e-07, "loss": 20.981, "step": 85750 }, { "epoch": 0.93, "learning_rate": 2.7725180060015454e-07, "loss": 21.1067, "step": 85760 }, { "epoch": 0.93, "learning_rate": 2.7643363529422764e-07, "loss": 20.6196, "step": 85770 }, { "epoch": 0.93, "learning_rate": 2.7561666204905193e-07, "loss": 20.7808, "step": 85780 }, { "epoch": 0.93, "learning_rate": 2.748008809647884e-07, "loss": 20.2453, "step": 85790 }, { "epoch": 0.93, "learning_rate": 2.739862921414438e-07, "loss": 22.0264, "step": 85800 }, { "epoch": 0.93, "learning_rate": 2.731728956788848e-07, "loss": 20.983, "step": 85810 }, { "epoch": 0.93, "learning_rate": 2.723606916768307e-07, "loss": 21.2589, "step": 85820 }, { "epoch": 0.93, "learning_rate": 2.715496802348494e-07, "loss": 20.8845, "step": 85830 }, { "epoch": 0.93, "learning_rate": 2.707398614523704e-07, "loss": 21.8503, "step": 85840 }, { "epoch": 0.93, "learning_rate": 2.6993123542867206e-07, "loss": 21.3039, "step": 85850 }, { "epoch": 0.93, "learning_rate": 2.691238022628895e-07, "loss": 21.287, "step": 85860 }, { "epoch": 0.93, "learning_rate": 2.6831756205400905e-07, "loss": 21.001, "step": 85870 }, { "epoch": 0.93, "learning_rate": 2.675125149008706e-07, "loss": 21.0267, "step": 85880 }, { "epoch": 0.93, "learning_rate": 2.6670866090216965e-07, "loss": 20.8813, "step": 85890 }, { "epoch": 0.93, "learning_rate": 2.6590600015645617e-07, "loss": 21.5949, "step": 85900 }, { "epoch": 0.93, "learning_rate": 2.6510453276213043e-07, "loss": 21.5402, "step": 85910 }, { "epoch": 0.93, "learning_rate": 2.6430425881745047e-07, "loss": 20.6335, "step": 85920 }, { "epoch": 0.93, "learning_rate": 2.6350517842052225e-07, "loss": 20.8586, "step": 85930 }, { "epoch": 0.93, "learning_rate": 2.6270729166931185e-07, "loss": 21.1901, "step": 85940 }, { "epoch": 0.93, "learning_rate": 2.619105986616366e-07, "loss": 20.9627, "step": 85950 }, { "epoch": 0.93, "learning_rate": 2.61115099495165e-07, "loss": 22.429, "step": 85960 }, { "epoch": 0.93, "learning_rate": 2.603207942674235e-07, "loss": 21.0109, "step": 85970 }, { "epoch": 0.93, "learning_rate": 2.595276830757876e-07, "loss": 21.5992, "step": 85980 }, { "epoch": 0.93, "learning_rate": 2.587357660174905e-07, "loss": 21.4589, "step": 85990 }, { "epoch": 0.93, "learning_rate": 2.57945043189618e-07, "loss": 21.2868, "step": 86000 }, { "epoch": 0.93, "learning_rate": 2.571555146891058e-07, "loss": 21.2071, "step": 86010 }, { "epoch": 0.93, "learning_rate": 2.5636718061274877e-07, "loss": 21.2088, "step": 86020 }, { "epoch": 0.93, "learning_rate": 2.5558004105719183e-07, "loss": 20.7053, "step": 86030 }, { "epoch": 0.93, "learning_rate": 2.5479409611893545e-07, "loss": 21.3281, "step": 86040 }, { "epoch": 0.93, "learning_rate": 2.5400934589433046e-07, "loss": 20.7006, "step": 86050 }, { "epoch": 0.93, "learning_rate": 2.532257904795843e-07, "loss": 21.681, "step": 86060 }, { "epoch": 0.93, "learning_rate": 2.524434299707579e-07, "loss": 20.6189, "step": 86070 }, { "epoch": 0.93, "learning_rate": 2.5166226446376343e-07, "loss": 21.3212, "step": 86080 }, { "epoch": 0.93, "learning_rate": 2.508822940543676e-07, "loss": 21.4377, "step": 86090 }, { "epoch": 0.93, "learning_rate": 2.5010351883819283e-07, "loss": 21.2402, "step": 86100 }, { "epoch": 0.93, "learning_rate": 2.4932593891071167e-07, "loss": 20.6633, "step": 86110 }, { "epoch": 0.93, "learning_rate": 2.4854955436725115e-07, "loss": 21.9367, "step": 86120 }, { "epoch": 0.93, "learning_rate": 2.47774365302994e-07, "loss": 21.6076, "step": 86130 }, { "epoch": 0.93, "learning_rate": 2.470003718129721e-07, "loss": 20.7839, "step": 86140 }, { "epoch": 0.93, "learning_rate": 2.46227573992075e-07, "loss": 21.1701, "step": 86150 }, { "epoch": 0.93, "learning_rate": 2.4545597193504356e-07, "loss": 21.711, "step": 86160 }, { "epoch": 0.93, "learning_rate": 2.446855657364722e-07, "loss": 21.3493, "step": 86170 }, { "epoch": 0.93, "learning_rate": 2.439163554908086e-07, "loss": 21.7405, "step": 86180 }, { "epoch": 0.93, "learning_rate": 2.431483412923541e-07, "loss": 21.7333, "step": 86190 }, { "epoch": 0.93, "learning_rate": 2.423815232352633e-07, "loss": 20.5986, "step": 86200 }, { "epoch": 0.93, "learning_rate": 2.4161590141354443e-07, "loss": 20.3738, "step": 86210 }, { "epoch": 0.93, "learning_rate": 2.4085147592105896e-07, "loss": 21.4939, "step": 86220 }, { "epoch": 0.93, "learning_rate": 2.400882468515231e-07, "loss": 20.7196, "step": 86230 }, { "epoch": 0.93, "learning_rate": 2.393262142985009e-07, "loss": 21.5242, "step": 86240 }, { "epoch": 0.93, "learning_rate": 2.385653783554187e-07, "loss": 21.2892, "step": 86250 }, { "epoch": 0.93, "learning_rate": 2.378057391155486e-07, "loss": 21.3501, "step": 86260 }, { "epoch": 0.93, "learning_rate": 2.3704729667201832e-07, "loss": 20.8698, "step": 86270 }, { "epoch": 0.93, "learning_rate": 2.36290051117809e-07, "loss": 20.805, "step": 86280 }, { "epoch": 0.93, "learning_rate": 2.3553400254575643e-07, "loss": 20.8416, "step": 86290 }, { "epoch": 0.93, "learning_rate": 2.3477915104854865e-07, "loss": 20.9021, "step": 86300 }, { "epoch": 0.93, "learning_rate": 2.3402549671872498e-07, "loss": 20.584, "step": 86310 }, { "epoch": 0.93, "learning_rate": 2.3327303964868042e-07, "loss": 21.5184, "step": 86320 }, { "epoch": 0.93, "learning_rate": 2.3252177993066338e-07, "loss": 20.7599, "step": 86330 }, { "epoch": 0.93, "learning_rate": 2.3177171765677132e-07, "loss": 21.6344, "step": 86340 }, { "epoch": 0.93, "learning_rate": 2.3102285291896397e-07, "loss": 21.4322, "step": 86350 }, { "epoch": 0.93, "learning_rate": 2.3027518580904352e-07, "loss": 21.7512, "step": 86360 }, { "epoch": 0.93, "learning_rate": 2.2952871641867101e-07, "loss": 22.0264, "step": 86370 }, { "epoch": 0.93, "learning_rate": 2.287834448393611e-07, "loss": 21.6364, "step": 86380 }, { "epoch": 0.93, "learning_rate": 2.2803937116247954e-07, "loss": 21.1984, "step": 86390 }, { "epoch": 0.93, "learning_rate": 2.272964954792467e-07, "loss": 21.1287, "step": 86400 }, { "epoch": 0.93, "learning_rate": 2.265548178807353e-07, "loss": 20.7205, "step": 86410 }, { "epoch": 0.93, "learning_rate": 2.258143384578715e-07, "loss": 21.369, "step": 86420 }, { "epoch": 0.93, "learning_rate": 2.2507505730143265e-07, "loss": 21.5724, "step": 86430 }, { "epoch": 0.93, "learning_rate": 2.2433697450205182e-07, "loss": 22.0197, "step": 86440 }, { "epoch": 0.93, "learning_rate": 2.2360009015021666e-07, "loss": 20.5744, "step": 86450 }, { "epoch": 0.93, "learning_rate": 2.2286440433626267e-07, "loss": 21.3283, "step": 86460 }, { "epoch": 0.93, "learning_rate": 2.2212991715038324e-07, "loss": 21.1129, "step": 86470 }, { "epoch": 0.93, "learning_rate": 2.213966286826208e-07, "loss": 21.2363, "step": 86480 }, { "epoch": 0.94, "learning_rate": 2.2066453902287232e-07, "loss": 21.0029, "step": 86490 }, { "epoch": 0.94, "learning_rate": 2.1993364826089158e-07, "loss": 21.6412, "step": 86500 }, { "epoch": 0.94, "learning_rate": 2.1920395648628025e-07, "loss": 21.1758, "step": 86510 }, { "epoch": 0.94, "learning_rate": 2.184754637884956e-07, "loss": 21.2733, "step": 86520 }, { "epoch": 0.94, "learning_rate": 2.1774817025684626e-07, "loss": 21.4582, "step": 86530 }, { "epoch": 0.94, "learning_rate": 2.170220759804942e-07, "loss": 20.3188, "step": 86540 }, { "epoch": 0.94, "learning_rate": 2.162971810484571e-07, "loss": 21.657, "step": 86550 }, { "epoch": 0.94, "learning_rate": 2.1557348554960168e-07, "loss": 20.5867, "step": 86560 }, { "epoch": 0.94, "learning_rate": 2.1485098957265138e-07, "loss": 21.4932, "step": 86570 }, { "epoch": 0.94, "learning_rate": 2.141296932061776e-07, "loss": 21.7091, "step": 86580 }, { "epoch": 0.94, "learning_rate": 2.134095965386096e-07, "loss": 21.4963, "step": 86590 }, { "epoch": 0.94, "learning_rate": 2.1269069965822785e-07, "loss": 20.268, "step": 86600 }, { "epoch": 0.94, "learning_rate": 2.1197300265316523e-07, "loss": 21.1266, "step": 86610 }, { "epoch": 0.94, "learning_rate": 2.1125650561140797e-07, "loss": 21.4123, "step": 86620 }, { "epoch": 0.94, "learning_rate": 2.1054120862079364e-07, "loss": 21.3034, "step": 86630 }, { "epoch": 0.94, "learning_rate": 2.0982711176901539e-07, "loss": 21.3228, "step": 86640 }, { "epoch": 0.94, "learning_rate": 2.0911421514361763e-07, "loss": 20.7608, "step": 86650 }, { "epoch": 0.94, "learning_rate": 2.0840251883199823e-07, "loss": 21.1606, "step": 86660 }, { "epoch": 0.94, "learning_rate": 2.0769202292140745e-07, "loss": 21.3113, "step": 86670 }, { "epoch": 0.94, "learning_rate": 2.0698272749894998e-07, "loss": 21.4061, "step": 86680 }, { "epoch": 0.94, "learning_rate": 2.0627463265157742e-07, "loss": 21.4585, "step": 86690 }, { "epoch": 0.94, "learning_rate": 2.0556773846610368e-07, "loss": 20.9238, "step": 86700 }, { "epoch": 0.94, "learning_rate": 2.0486204502918828e-07, "loss": 21.3645, "step": 86710 }, { "epoch": 0.94, "learning_rate": 2.0415755242734536e-07, "loss": 21.5199, "step": 86720 }, { "epoch": 0.94, "learning_rate": 2.0345426074694362e-07, "loss": 20.9747, "step": 86730 }, { "epoch": 0.94, "learning_rate": 2.0275217007420077e-07, "loss": 21.2947, "step": 86740 }, { "epoch": 0.94, "learning_rate": 2.020512804951913e-07, "loss": 20.7721, "step": 86750 }, { "epoch": 0.94, "learning_rate": 2.0135159209584087e-07, "loss": 21.3601, "step": 86760 }, { "epoch": 0.94, "learning_rate": 2.006531049619276e-07, "loss": 20.3702, "step": 86770 }, { "epoch": 0.94, "learning_rate": 1.999558191790829e-07, "loss": 21.2594, "step": 86780 }, { "epoch": 0.94, "learning_rate": 1.992597348327885e-07, "loss": 21.3131, "step": 86790 }, { "epoch": 0.94, "learning_rate": 1.9856485200838382e-07, "loss": 21.3365, "step": 86800 }, { "epoch": 0.94, "learning_rate": 1.9787117079105523e-07, "loss": 20.5876, "step": 86810 }, { "epoch": 0.94, "learning_rate": 1.971786912658469e-07, "loss": 20.9693, "step": 86820 }, { "epoch": 0.94, "learning_rate": 1.9648741351765312e-07, "loss": 21.2147, "step": 86830 }, { "epoch": 0.94, "learning_rate": 1.9579733763121943e-07, "loss": 21.9531, "step": 86840 }, { "epoch": 0.94, "learning_rate": 1.95108463691146e-07, "loss": 21.1174, "step": 86850 }, { "epoch": 0.94, "learning_rate": 1.9442079178188743e-07, "loss": 21.1838, "step": 86860 }, { "epoch": 0.94, "learning_rate": 1.9373432198774633e-07, "loss": 21.055, "step": 86870 }, { "epoch": 0.94, "learning_rate": 1.9304905439288203e-07, "loss": 21.0945, "step": 86880 }, { "epoch": 0.94, "learning_rate": 1.9236498908130397e-07, "loss": 21.2018, "step": 86890 }, { "epoch": 0.94, "learning_rate": 1.916821261368762e-07, "loss": 21.3347, "step": 86900 }, { "epoch": 0.94, "learning_rate": 1.9100046564331398e-07, "loss": 20.8327, "step": 86910 }, { "epoch": 0.94, "learning_rate": 1.903200076841849e-07, "loss": 21.1513, "step": 86920 }, { "epoch": 0.94, "learning_rate": 1.8964075234291e-07, "loss": 20.5499, "step": 86930 }, { "epoch": 0.94, "learning_rate": 1.889626997027627e-07, "loss": 21.3296, "step": 86940 }, { "epoch": 0.94, "learning_rate": 1.882858498468687e-07, "loss": 21.1212, "step": 86950 }, { "epoch": 0.94, "learning_rate": 1.8761020285820718e-07, "loss": 20.9647, "step": 86960 }, { "epoch": 0.94, "learning_rate": 1.8693575881960856e-07, "loss": 20.5349, "step": 86970 }, { "epoch": 0.94, "learning_rate": 1.862625178137556e-07, "loss": 21.1969, "step": 86980 }, { "epoch": 0.94, "learning_rate": 1.8559047992318447e-07, "loss": 20.7633, "step": 86990 }, { "epoch": 0.94, "learning_rate": 1.8491964523028483e-07, "loss": 21.0483, "step": 87000 }, { "epoch": 0.94, "learning_rate": 1.8425001381729645e-07, "loss": 20.9143, "step": 87010 }, { "epoch": 0.94, "learning_rate": 1.8358158576631368e-07, "loss": 21.1545, "step": 87020 }, { "epoch": 0.94, "learning_rate": 1.8291436115928206e-07, "loss": 21.4443, "step": 87030 }, { "epoch": 0.94, "learning_rate": 1.8224834007800064e-07, "loss": 21.7499, "step": 87040 }, { "epoch": 0.94, "learning_rate": 1.815835226041185e-07, "loss": 20.6175, "step": 87050 }, { "epoch": 0.94, "learning_rate": 1.8091990881914157e-07, "loss": 22.1804, "step": 87060 }, { "epoch": 0.94, "learning_rate": 1.8025749880442256e-07, "loss": 21.1205, "step": 87070 }, { "epoch": 0.94, "learning_rate": 1.7959629264117206e-07, "loss": 20.7115, "step": 87080 }, { "epoch": 0.94, "learning_rate": 1.789362904104497e-07, "loss": 21.2944, "step": 87090 }, { "epoch": 0.94, "learning_rate": 1.7827749219316847e-07, "loss": 20.7225, "step": 87100 }, { "epoch": 0.94, "learning_rate": 1.7761989807009383e-07, "loss": 21.0374, "step": 87110 }, { "epoch": 0.94, "learning_rate": 1.7696350812184348e-07, "loss": 20.9245, "step": 87120 }, { "epoch": 0.94, "learning_rate": 1.7630832242888862e-07, "loss": 21.4781, "step": 87130 }, { "epoch": 0.94, "learning_rate": 1.7565434107154944e-07, "loss": 20.9996, "step": 87140 }, { "epoch": 0.94, "learning_rate": 1.750015641300029e-07, "loss": 21.6261, "step": 87150 }, { "epoch": 0.94, "learning_rate": 1.7434999168427503e-07, "loss": 20.8224, "step": 87160 }, { "epoch": 0.94, "learning_rate": 1.7369962381424632e-07, "loss": 21.9218, "step": 87170 }, { "epoch": 0.94, "learning_rate": 1.7305046059964748e-07, "loss": 21.0135, "step": 87180 }, { "epoch": 0.94, "learning_rate": 1.724025021200626e-07, "loss": 21.0583, "step": 87190 }, { "epoch": 0.94, "learning_rate": 1.7175574845493036e-07, "loss": 21.0095, "step": 87200 }, { "epoch": 0.94, "learning_rate": 1.7111019968353625e-07, "loss": 21.5425, "step": 87210 }, { "epoch": 0.94, "learning_rate": 1.7046585588502475e-07, "loss": 21.1149, "step": 87220 }, { "epoch": 0.94, "learning_rate": 1.6982271713838706e-07, "loss": 19.8893, "step": 87230 }, { "epoch": 0.94, "learning_rate": 1.691807835224679e-07, "loss": 20.8557, "step": 87240 }, { "epoch": 0.94, "learning_rate": 1.6854005511596772e-07, "loss": 21.3507, "step": 87250 }, { "epoch": 0.94, "learning_rate": 1.6790053199743472e-07, "loss": 21.7444, "step": 87260 }, { "epoch": 0.94, "learning_rate": 1.6726221424527288e-07, "loss": 20.6918, "step": 87270 }, { "epoch": 0.94, "learning_rate": 1.666251019377352e-07, "loss": 21.9685, "step": 87280 }, { "epoch": 0.94, "learning_rate": 1.659891951529291e-07, "loss": 21.5994, "step": 87290 }, { "epoch": 0.94, "learning_rate": 1.6535449396881453e-07, "loss": 20.4872, "step": 87300 }, { "epoch": 0.94, "learning_rate": 1.6472099846319923e-07, "loss": 22.0424, "step": 87310 }, { "epoch": 0.94, "learning_rate": 1.6408870871375216e-07, "loss": 21.6999, "step": 87320 }, { "epoch": 0.94, "learning_rate": 1.6345762479798354e-07, "loss": 20.5047, "step": 87330 }, { "epoch": 0.94, "learning_rate": 1.6282774679326484e-07, "loss": 21.1979, "step": 87340 }, { "epoch": 0.94, "learning_rate": 1.621990747768132e-07, "loss": 21.337, "step": 87350 }, { "epoch": 0.94, "learning_rate": 1.6157160882570134e-07, "loss": 20.9546, "step": 87360 }, { "epoch": 0.94, "learning_rate": 1.6094534901685554e-07, "loss": 21.2068, "step": 87370 }, { "epoch": 0.94, "learning_rate": 1.6032029542705107e-07, "loss": 20.0232, "step": 87380 }, { "epoch": 0.94, "learning_rate": 1.5969644813291552e-07, "loss": 21.4828, "step": 87390 }, { "epoch": 0.94, "learning_rate": 1.5907380721092992e-07, "loss": 22.0387, "step": 87400 }, { "epoch": 0.94, "learning_rate": 1.5845237273742653e-07, "loss": 20.3809, "step": 87410 }, { "epoch": 0.95, "learning_rate": 1.5783214478859e-07, "loss": 20.721, "step": 87420 }, { "epoch": 0.95, "learning_rate": 1.5721312344045948e-07, "loss": 21.7644, "step": 87430 }, { "epoch": 0.95, "learning_rate": 1.5659530876892093e-07, "loss": 21.1201, "step": 87440 }, { "epoch": 0.95, "learning_rate": 1.559787008497171e-07, "loss": 21.8174, "step": 87450 }, { "epoch": 0.95, "learning_rate": 1.5536329975843977e-07, "loss": 21.7021, "step": 87460 }, { "epoch": 0.95, "learning_rate": 1.5474910557053523e-07, "loss": 21.8922, "step": 87470 }, { "epoch": 0.95, "learning_rate": 1.5413611836129995e-07, "loss": 21.4203, "step": 87480 }, { "epoch": 0.95, "learning_rate": 1.5352433820588375e-07, "loss": 20.4081, "step": 87490 }, { "epoch": 0.95, "learning_rate": 1.529137651792878e-07, "loss": 21.1646, "step": 87500 }, { "epoch": 0.95, "learning_rate": 1.523043993563633e-07, "loss": 21.4678, "step": 87510 }, { "epoch": 0.95, "learning_rate": 1.5169624081181833e-07, "loss": 20.5324, "step": 87520 }, { "epoch": 0.95, "learning_rate": 1.5108928962020875e-07, "loss": 21.4634, "step": 87530 }, { "epoch": 0.95, "learning_rate": 1.5048354585594392e-07, "loss": 21.105, "step": 87540 }, { "epoch": 0.95, "learning_rate": 1.4987900959328561e-07, "loss": 21.5459, "step": 87550 }, { "epoch": 0.95, "learning_rate": 1.4927568090634447e-07, "loss": 21.6108, "step": 87560 }, { "epoch": 0.95, "learning_rate": 1.4867355986908806e-07, "loss": 20.9192, "step": 87570 }, { "epoch": 0.95, "learning_rate": 1.4807264655533282e-07, "loss": 21.0906, "step": 87580 }, { "epoch": 0.95, "learning_rate": 1.4747294103874875e-07, "loss": 21.6981, "step": 87590 }, { "epoch": 0.95, "learning_rate": 1.4687444339285485e-07, "loss": 21.4555, "step": 87600 }, { "epoch": 0.95, "learning_rate": 1.4627715369102346e-07, "loss": 20.9163, "step": 87610 }, { "epoch": 0.95, "learning_rate": 1.4568107200648273e-07, "loss": 21.8991, "step": 87620 }, { "epoch": 0.95, "learning_rate": 1.4508619841230531e-07, "loss": 21.2499, "step": 87630 }, { "epoch": 0.95, "learning_rate": 1.4449253298142284e-07, "loss": 21.0544, "step": 87640 }, { "epoch": 0.95, "learning_rate": 1.439000757866149e-07, "loss": 21.8316, "step": 87650 }, { "epoch": 0.95, "learning_rate": 1.4330882690051229e-07, "loss": 20.8914, "step": 87660 }, { "epoch": 0.95, "learning_rate": 1.4271878639560032e-07, "loss": 21.2992, "step": 87670 }, { "epoch": 0.95, "learning_rate": 1.4212995434421562e-07, "loss": 20.9603, "step": 87680 }, { "epoch": 0.95, "learning_rate": 1.4154233081854595e-07, "loss": 20.2864, "step": 87690 }, { "epoch": 0.95, "learning_rate": 1.409559158906304e-07, "loss": 21.2015, "step": 87700 }, { "epoch": 0.95, "learning_rate": 1.403707096323592e-07, "loss": 21.5722, "step": 87710 }, { "epoch": 0.95, "learning_rate": 1.3978671211547724e-07, "loss": 20.838, "step": 87720 }, { "epoch": 0.95, "learning_rate": 1.392039234115805e-07, "loss": 20.6552, "step": 87730 }, { "epoch": 0.95, "learning_rate": 1.3862234359211524e-07, "loss": 21.6626, "step": 87740 }, { "epoch": 0.95, "learning_rate": 1.3804197272837993e-07, "loss": 21.2396, "step": 87750 }, { "epoch": 0.95, "learning_rate": 1.3746281089152435e-07, "loss": 21.0542, "step": 87760 }, { "epoch": 0.95, "learning_rate": 1.3688485815255282e-07, "loss": 21.6274, "step": 87770 }, { "epoch": 0.95, "learning_rate": 1.3630811458231863e-07, "loss": 20.8512, "step": 87780 }, { "epoch": 0.95, "learning_rate": 1.3573258025152635e-07, "loss": 20.9696, "step": 87790 }, { "epoch": 0.95, "learning_rate": 1.351582552307351e-07, "loss": 20.2893, "step": 87800 }, { "epoch": 0.95, "learning_rate": 1.3458513959035524e-07, "loss": 20.7202, "step": 87810 }, { "epoch": 0.95, "learning_rate": 1.34013233400645e-07, "loss": 20.7742, "step": 87820 }, { "epoch": 0.95, "learning_rate": 1.3344253673171936e-07, "loss": 21.6563, "step": 87830 }, { "epoch": 0.95, "learning_rate": 1.3287304965354243e-07, "loss": 21.168, "step": 87840 }, { "epoch": 0.95, "learning_rate": 1.3230477223592942e-07, "loss": 20.3615, "step": 87850 }, { "epoch": 0.95, "learning_rate": 1.3173770454855018e-07, "loss": 22.2782, "step": 87860 }, { "epoch": 0.95, "learning_rate": 1.3117184666092353e-07, "loss": 21.335, "step": 87870 }, { "epoch": 0.95, "learning_rate": 1.3060719864242065e-07, "loss": 21.4049, "step": 87880 }, { "epoch": 0.95, "learning_rate": 1.3004376056226396e-07, "loss": 20.849, "step": 87890 }, { "epoch": 0.95, "learning_rate": 1.2948153248952932e-07, "loss": 20.9421, "step": 87900 }, { "epoch": 0.95, "learning_rate": 1.289205144931427e-07, "loss": 21.3433, "step": 87910 }, { "epoch": 0.95, "learning_rate": 1.2836070664188237e-07, "loss": 21.204, "step": 87920 }, { "epoch": 0.95, "learning_rate": 1.2780210900437796e-07, "loss": 20.9591, "step": 87930 }, { "epoch": 0.95, "learning_rate": 1.2724472164910905e-07, "loss": 20.9554, "step": 87940 }, { "epoch": 0.95, "learning_rate": 1.2668854464441104e-07, "loss": 21.2527, "step": 87950 }, { "epoch": 0.95, "learning_rate": 1.2613357805846715e-07, "loss": 20.6282, "step": 87960 }, { "epoch": 0.95, "learning_rate": 1.2557982195931408e-07, "loss": 20.295, "step": 87970 }, { "epoch": 0.95, "learning_rate": 1.250272764148386e-07, "loss": 21.1053, "step": 87980 }, { "epoch": 0.95, "learning_rate": 1.2447594149278098e-07, "loss": 21.7966, "step": 87990 }, { "epoch": 0.95, "learning_rate": 1.239258172607316e-07, "loss": 21.4596, "step": 88000 }, { "epoch": 0.95, "learning_rate": 1.233769037861332e-07, "loss": 20.5629, "step": 88010 }, { "epoch": 0.95, "learning_rate": 1.2282920113627972e-07, "loss": 22.0813, "step": 88020 }, { "epoch": 0.95, "learning_rate": 1.2228270937831743e-07, "loss": 21.9202, "step": 88030 }, { "epoch": 0.95, "learning_rate": 1.2173742857924276e-07, "loss": 21.4037, "step": 88040 }, { "epoch": 0.95, "learning_rate": 1.2119335880590444e-07, "loss": 21.2251, "step": 88050 }, { "epoch": 0.95, "learning_rate": 1.2065050012500245e-07, "loss": 21.4048, "step": 88060 }, { "epoch": 0.95, "learning_rate": 1.2010885260308913e-07, "loss": 21.3514, "step": 88070 }, { "epoch": 0.95, "learning_rate": 1.1956841630656801e-07, "loss": 20.5267, "step": 88080 }, { "epoch": 0.95, "learning_rate": 1.1902919130169277e-07, "loss": 21.1687, "step": 88090 }, { "epoch": 0.95, "learning_rate": 1.1849117765457164e-07, "loss": 21.6148, "step": 88100 }, { "epoch": 0.95, "learning_rate": 1.1795437543115962e-07, "loss": 21.0572, "step": 88110 }, { "epoch": 0.95, "learning_rate": 1.1741878469726853e-07, "loss": 21.2137, "step": 88120 }, { "epoch": 0.95, "learning_rate": 1.1688440551855806e-07, "loss": 21.3975, "step": 88130 }, { "epoch": 0.95, "learning_rate": 1.1635123796054027e-07, "loss": 21.1332, "step": 88140 }, { "epoch": 0.95, "learning_rate": 1.158192820885795e-07, "loss": 21.5266, "step": 88150 }, { "epoch": 0.95, "learning_rate": 1.1528853796788919e-07, "loss": 21.423, "step": 88160 }, { "epoch": 0.95, "learning_rate": 1.1475900566353837e-07, "loss": 21.3778, "step": 88170 }, { "epoch": 0.95, "learning_rate": 1.142306852404429e-07, "loss": 20.7117, "step": 88180 }, { "epoch": 0.95, "learning_rate": 1.1370357676337429e-07, "loss": 20.6477, "step": 88190 }, { "epoch": 0.95, "learning_rate": 1.1317768029695198e-07, "loss": 20.3835, "step": 88200 }, { "epoch": 0.95, "learning_rate": 1.1265299590564882e-07, "loss": 21.2, "step": 88210 }, { "epoch": 0.95, "learning_rate": 1.1212952365378782e-07, "loss": 21.2773, "step": 88220 }, { "epoch": 0.95, "learning_rate": 1.116072636055443e-07, "loss": 21.415, "step": 88230 }, { "epoch": 0.95, "learning_rate": 1.1108621582494706e-07, "loss": 20.7983, "step": 88240 }, { "epoch": 0.95, "learning_rate": 1.1056638037586942e-07, "loss": 21.7788, "step": 88250 }, { "epoch": 0.95, "learning_rate": 1.1004775732204486e-07, "loss": 21.053, "step": 88260 }, { "epoch": 0.95, "learning_rate": 1.0953034672705032e-07, "loss": 21.3366, "step": 88270 }, { "epoch": 0.95, "learning_rate": 1.0901414865432058e-07, "loss": 21.2722, "step": 88280 }, { "epoch": 0.95, "learning_rate": 1.0849916316713837e-07, "loss": 21.7206, "step": 88290 }, { "epoch": 0.95, "learning_rate": 1.0798539032863764e-07, "loss": 21.3505, "step": 88300 }, { "epoch": 0.95, "learning_rate": 1.0747283020180465e-07, "loss": 21.2538, "step": 88310 }, { "epoch": 0.95, "learning_rate": 1.0696148284947694e-07, "loss": 21.0849, "step": 88320 }, { "epoch": 0.95, "learning_rate": 1.0645134833434213e-07, "loss": 21.4362, "step": 88330 }, { "epoch": 0.96, "learning_rate": 1.059424267189424e-07, "loss": 20.6586, "step": 88340 }, { "epoch": 0.96, "learning_rate": 1.0543471806566786e-07, "loss": 20.9046, "step": 88350 }, { "epoch": 0.96, "learning_rate": 1.0492822243675982e-07, "loss": 21.3019, "step": 88360 }, { "epoch": 0.96, "learning_rate": 1.0442293989431307e-07, "loss": 21.0677, "step": 88370 }, { "epoch": 0.96, "learning_rate": 1.0391887050027249e-07, "loss": 21.5183, "step": 88380 }, { "epoch": 0.96, "learning_rate": 1.0341601431643533e-07, "loss": 21.0448, "step": 88390 }, { "epoch": 0.96, "learning_rate": 1.0291437140444893e-07, "loss": 21.0272, "step": 88400 }, { "epoch": 0.96, "learning_rate": 1.0241394182581188e-07, "loss": 21.7892, "step": 88410 }, { "epoch": 0.96, "learning_rate": 1.0191472564187399e-07, "loss": 21.2478, "step": 88420 }, { "epoch": 0.96, "learning_rate": 1.0141672291383741e-07, "loss": 21.8736, "step": 88430 }, { "epoch": 0.96, "learning_rate": 1.0091993370275444e-07, "loss": 21.7277, "step": 88440 }, { "epoch": 0.96, "learning_rate": 1.0042435806952965e-07, "loss": 21.1419, "step": 88450 }, { "epoch": 0.96, "learning_rate": 9.992999607491671e-08, "loss": 22.0854, "step": 88460 }, { "epoch": 0.96, "learning_rate": 9.943684777952267e-08, "loss": 20.9617, "step": 88470 }, { "epoch": 0.96, "learning_rate": 9.894491324380473e-08, "loss": 21.6653, "step": 88480 }, { "epoch": 0.96, "learning_rate": 9.845419252807242e-08, "loss": 21.7774, "step": 88490 }, { "epoch": 0.96, "learning_rate": 9.796468569248652e-08, "loss": 21.5439, "step": 88500 }, { "epoch": 0.96, "learning_rate": 9.747639279705567e-08, "loss": 21.7149, "step": 88510 }, { "epoch": 0.96, "learning_rate": 9.698931390164424e-08, "loss": 21.1219, "step": 88520 }, { "epoch": 0.96, "learning_rate": 9.650344906596331e-08, "loss": 21.5063, "step": 88530 }, { "epoch": 0.96, "learning_rate": 9.601879834957972e-08, "loss": 21.2809, "step": 88540 }, { "epoch": 0.96, "learning_rate": 9.553536181190815e-08, "loss": 22.0319, "step": 88550 }, { "epoch": 0.96, "learning_rate": 9.505313951221673e-08, "loss": 21.5958, "step": 88560 }, { "epoch": 0.96, "learning_rate": 9.457213150962152e-08, "loss": 21.0735, "step": 88570 }, { "epoch": 0.96, "learning_rate": 9.409233786309313e-08, "loss": 21.6096, "step": 88580 }, { "epoch": 0.96, "learning_rate": 9.361375863145117e-08, "loss": 21.561, "step": 88590 }, { "epoch": 0.96, "learning_rate": 9.313639387336759e-08, "loss": 21.207, "step": 88600 }, { "epoch": 0.96, "learning_rate": 9.266024364736448e-08, "loss": 21.6348, "step": 88610 }, { "epoch": 0.96, "learning_rate": 9.218530801181735e-08, "loss": 21.0467, "step": 88620 }, { "epoch": 0.96, "learning_rate": 9.171158702494743e-08, "loss": 20.4556, "step": 88630 }, { "epoch": 0.96, "learning_rate": 9.123908074483268e-08, "loss": 20.9169, "step": 88640 }, { "epoch": 0.96, "learning_rate": 9.07677892294001e-08, "loss": 21.4569, "step": 88650 }, { "epoch": 0.96, "learning_rate": 9.029771253642794e-08, "loss": 21.2743, "step": 88660 }, { "epoch": 0.96, "learning_rate": 8.982885072354452e-08, "loss": 21.1778, "step": 88670 }, { "epoch": 0.96, "learning_rate": 8.936120384822944e-08, "loss": 20.7709, "step": 88680 }, { "epoch": 0.96, "learning_rate": 8.889477196781571e-08, "loss": 21.2668, "step": 88690 }, { "epoch": 0.96, "learning_rate": 8.842955513948314e-08, "loss": 20.5709, "step": 88700 }, { "epoch": 0.96, "learning_rate": 8.796555342026724e-08, "loss": 21.9177, "step": 88710 }, { "epoch": 0.96, "learning_rate": 8.750276686705139e-08, "loss": 21.6995, "step": 88720 }, { "epoch": 0.96, "learning_rate": 8.70411955365702e-08, "loss": 20.5516, "step": 88730 }, { "epoch": 0.96, "learning_rate": 8.658083948541062e-08, "loss": 21.312, "step": 88740 }, { "epoch": 0.96, "learning_rate": 8.612169877000975e-08, "loss": 21.5339, "step": 88750 }, { "epoch": 0.96, "learning_rate": 8.566377344665699e-08, "loss": 21.2137, "step": 88760 }, { "epoch": 0.96, "learning_rate": 8.520706357149078e-08, "loss": 21.2192, "step": 88770 }, { "epoch": 0.96, "learning_rate": 8.475156920050187e-08, "loss": 20.982, "step": 88780 }, { "epoch": 0.96, "learning_rate": 8.429729038953117e-08, "loss": 21.7079, "step": 88790 }, { "epoch": 0.96, "learning_rate": 8.384422719427076e-08, "loss": 21.1872, "step": 88800 }, { "epoch": 0.96, "learning_rate": 8.339237967026515e-08, "loss": 20.6513, "step": 88810 }, { "epoch": 0.96, "learning_rate": 8.294174787290776e-08, "loss": 20.9916, "step": 88820 }, { "epoch": 0.96, "learning_rate": 8.249233185744332e-08, "loss": 20.9099, "step": 88830 }, { "epoch": 0.96, "learning_rate": 8.204413167896885e-08, "loss": 21.3645, "step": 88840 }, { "epoch": 0.96, "learning_rate": 8.159714739243152e-08, "loss": 21.3337, "step": 88850 }, { "epoch": 0.96, "learning_rate": 8.11513790526286e-08, "loss": 20.0144, "step": 88860 }, { "epoch": 0.96, "learning_rate": 8.07068267142086e-08, "loss": 21.2615, "step": 88870 }, { "epoch": 0.96, "learning_rate": 8.026349043167348e-08, "loss": 21.2919, "step": 88880 }, { "epoch": 0.96, "learning_rate": 7.982137025937308e-08, "loss": 21.6642, "step": 88890 }, { "epoch": 0.96, "learning_rate": 7.938046625150852e-08, "loss": 21.5793, "step": 88900 }, { "epoch": 0.96, "learning_rate": 7.89407784621321e-08, "loss": 21.2477, "step": 88910 }, { "epoch": 0.96, "learning_rate": 7.850230694514849e-08, "loss": 21.6659, "step": 88920 }, { "epoch": 0.96, "learning_rate": 7.806505175431245e-08, "loss": 20.6999, "step": 88930 }, { "epoch": 0.96, "learning_rate": 7.762901294322778e-08, "loss": 21.311, "step": 88940 }, { "epoch": 0.96, "learning_rate": 7.719419056535171e-08, "loss": 21.2922, "step": 88950 }, { "epoch": 0.96, "learning_rate": 7.67605846739905e-08, "loss": 21.4794, "step": 88960 }, { "epoch": 0.96, "learning_rate": 7.632819532230273e-08, "loss": 21.5209, "step": 88970 }, { "epoch": 0.96, "learning_rate": 7.589702256329823e-08, "loss": 21.195, "step": 88980 }, { "epoch": 0.96, "learning_rate": 7.546706644983359e-08, "loss": 21.4793, "step": 88990 }, { "epoch": 0.96, "learning_rate": 7.503832703462222e-08, "loss": 20.5847, "step": 89000 }, { "epoch": 0.96, "learning_rate": 7.461080437022428e-08, "loss": 21.3741, "step": 89010 }, { "epoch": 0.96, "learning_rate": 7.41844985090523e-08, "loss": 21.7854, "step": 89020 }, { "epoch": 0.96, "learning_rate": 7.37594095033678e-08, "loss": 21.3655, "step": 89030 }, { "epoch": 0.96, "learning_rate": 7.333553740528687e-08, "loss": 22.1865, "step": 89040 }, { "epoch": 0.96, "learning_rate": 7.29128822667724e-08, "loss": 21.5413, "step": 89050 }, { "epoch": 0.96, "learning_rate": 7.24914441396396e-08, "loss": 20.9658, "step": 89060 }, { "epoch": 0.96, "learning_rate": 7.207122307555603e-08, "loss": 21.2045, "step": 89070 }, { "epoch": 0.96, "learning_rate": 7.165221912603826e-08, "loss": 21.2598, "step": 89080 }, { "epoch": 0.96, "learning_rate": 7.123443234245409e-08, "loss": 21.1991, "step": 89090 }, { "epoch": 0.96, "learning_rate": 7.081786277602254e-08, "loss": 22.7726, "step": 89100 }, { "epoch": 0.96, "learning_rate": 7.040251047781055e-08, "loss": 20.8359, "step": 89110 }, { "epoch": 0.96, "learning_rate": 6.998837549874183e-08, "loss": 21.3018, "step": 89120 }, { "epoch": 0.96, "learning_rate": 6.957545788958464e-08, "loss": 21.8317, "step": 89130 }, { "epoch": 0.96, "learning_rate": 6.916375770096073e-08, "loss": 21.4156, "step": 89140 }, { "epoch": 0.96, "learning_rate": 6.875327498334417e-08, "loss": 21.3224, "step": 89150 }, { "epoch": 0.96, "learning_rate": 6.834400978705691e-08, "loss": 21.3067, "step": 89160 }, { "epoch": 0.96, "learning_rate": 6.793596216227328e-08, "loss": 20.6213, "step": 89170 }, { "epoch": 0.96, "learning_rate": 6.752913215901769e-08, "loss": 21.434, "step": 89180 }, { "epoch": 0.96, "learning_rate": 6.712351982716469e-08, "loss": 20.822, "step": 89190 }, { "epoch": 0.96, "learning_rate": 6.67191252164412e-08, "loss": 21.6648, "step": 89200 }, { "epoch": 0.96, "learning_rate": 6.63159483764253e-08, "loss": 21.4644, "step": 89210 }, { "epoch": 0.96, "learning_rate": 6.591398935654191e-08, "loss": 21.172, "step": 89220 }, { "epoch": 0.96, "learning_rate": 6.551324820607053e-08, "loss": 21.3619, "step": 89230 }, { "epoch": 0.96, "learning_rate": 6.511372497413959e-08, "loss": 21.5373, "step": 89240 }, { "epoch": 0.96, "learning_rate": 6.471541970972772e-08, "loss": 21.9869, "step": 89250 }, { "epoch": 0.96, "learning_rate": 6.431833246166808e-08, "loss": 20.957, "step": 89260 }, { "epoch": 0.97, "learning_rate": 6.392246327863949e-08, "loss": 21.7994, "step": 89270 }, { "epoch": 0.97, "learning_rate": 6.352781220917315e-08, "loss": 21.399, "step": 89280 }, { "epoch": 0.97, "learning_rate": 6.313437930165256e-08, "loss": 21.4367, "step": 89290 }, { "epoch": 0.97, "learning_rate": 6.274216460431026e-08, "loss": 20.8677, "step": 89300 }, { "epoch": 0.97, "learning_rate": 6.23511681652289e-08, "loss": 22.0899, "step": 89310 }, { "epoch": 0.97, "learning_rate": 6.196139003234458e-08, "loss": 20.7333, "step": 89320 }, { "epoch": 0.97, "learning_rate": 6.157283025344018e-08, "loss": 20.9633, "step": 89330 }, { "epoch": 0.97, "learning_rate": 6.118548887615206e-08, "loss": 20.6545, "step": 89340 }, { "epoch": 0.97, "learning_rate": 6.079936594796665e-08, "loss": 21.2938, "step": 89350 }, { "epoch": 0.97, "learning_rate": 6.041446151621943e-08, "loss": 20.9542, "step": 89360 }, { "epoch": 0.97, "learning_rate": 6.003077562810044e-08, "loss": 21.4018, "step": 89370 }, { "epoch": 0.97, "learning_rate": 5.964830833064427e-08, "loss": 21.412, "step": 89380 }, { "epoch": 0.97, "learning_rate": 5.926705967074231e-08, "loss": 20.7592, "step": 89390 }, { "epoch": 0.97, "learning_rate": 5.8887029695131606e-08, "loss": 21.1009, "step": 89400 }, { "epoch": 0.97, "learning_rate": 5.850821845040266e-08, "loss": 20.1012, "step": 89410 }, { "epoch": 0.97, "learning_rate": 5.8130625982997236e-08, "loss": 21.2607, "step": 89420 }, { "epoch": 0.97, "learning_rate": 5.7754252339204955e-08, "loss": 20.9261, "step": 89430 }, { "epoch": 0.97, "learning_rate": 5.737909756516669e-08, "loss": 21.5701, "step": 89440 }, { "epoch": 0.97, "learning_rate": 5.7005161706875645e-08, "loss": 20.9425, "step": 89450 }, { "epoch": 0.97, "learning_rate": 5.663244481017516e-08, "loss": 20.9483, "step": 89460 }, { "epoch": 0.97, "learning_rate": 5.626094692075645e-08, "loss": 21.2241, "step": 89470 }, { "epoch": 0.97, "learning_rate": 5.5890668084165324e-08, "loss": 20.4476, "step": 89480 }, { "epoch": 0.97, "learning_rate": 5.552160834579545e-08, "loss": 20.9536, "step": 89490 }, { "epoch": 0.97, "learning_rate": 5.515376775088954e-08, "loss": 21.6445, "step": 89500 }, { "epoch": 0.97, "learning_rate": 5.4787146344545964e-08, "loss": 21.6612, "step": 89510 }, { "epoch": 0.97, "learning_rate": 5.4421744171709864e-08, "loss": 21.2474, "step": 89520 }, { "epoch": 0.97, "learning_rate": 5.405756127717876e-08, "loss": 20.837, "step": 89530 }, { "epoch": 0.97, "learning_rate": 5.369459770559693e-08, "loss": 21.2389, "step": 89540 }, { "epoch": 0.97, "learning_rate": 5.333285350146322e-08, "loss": 21.4515, "step": 89550 }, { "epoch": 0.97, "learning_rate": 5.29723287091255e-08, "loss": 22.0402, "step": 89560 }, { "epoch": 0.97, "learning_rate": 5.261302337278396e-08, "loss": 21.184, "step": 89570 }, { "epoch": 0.97, "learning_rate": 5.2254937536485586e-08, "loss": 21.5119, "step": 89580 }, { "epoch": 0.97, "learning_rate": 5.189807124413082e-08, "loss": 20.5652, "step": 89590 }, { "epoch": 0.97, "learning_rate": 5.154242453946912e-08, "loss": 21.2493, "step": 89600 }, { "epoch": 0.97, "learning_rate": 5.1187997466101145e-08, "loss": 21.1134, "step": 89610 }, { "epoch": 0.97, "learning_rate": 5.0834790067478824e-08, "loss": 21.8756, "step": 89620 }, { "epoch": 0.97, "learning_rate": 5.0482802386903063e-08, "loss": 20.6164, "step": 89630 }, { "epoch": 0.97, "learning_rate": 5.0132034467526015e-08, "loss": 21.0605, "step": 89640 }, { "epoch": 0.97, "learning_rate": 4.9782486352348836e-08, "loss": 21.8902, "step": 89650 }, { "epoch": 0.97, "learning_rate": 4.943415808422503e-08, "loss": 21.845, "step": 89660 }, { "epoch": 0.97, "learning_rate": 4.9087049705859316e-08, "loss": 21.9524, "step": 89670 }, { "epoch": 0.97, "learning_rate": 4.874116125980322e-08, "loss": 21.9102, "step": 89680 }, { "epoch": 0.97, "learning_rate": 4.839649278846281e-08, "loss": 20.6821, "step": 89690 }, { "epoch": 0.97, "learning_rate": 4.805304433409097e-08, "loss": 21.3436, "step": 89700 }, { "epoch": 0.97, "learning_rate": 4.771081593879512e-08, "loss": 20.8761, "step": 89710 }, { "epoch": 0.97, "learning_rate": 4.736980764452837e-08, "loss": 21.153, "step": 89720 }, { "epoch": 0.97, "learning_rate": 4.7030019493097267e-08, "loss": 21.4995, "step": 89730 }, { "epoch": 0.97, "learning_rate": 4.6691451526159614e-08, "loss": 20.6166, "step": 89740 }, { "epoch": 0.97, "learning_rate": 4.6354103785219986e-08, "loss": 20.9893, "step": 89750 }, { "epoch": 0.97, "learning_rate": 4.601797631163751e-08, "loss": 21.4254, "step": 89760 }, { "epoch": 0.97, "learning_rate": 4.568306914661813e-08, "loss": 20.4774, "step": 89770 }, { "epoch": 0.97, "learning_rate": 4.5349382331221217e-08, "loss": 21.3822, "step": 89780 }, { "epoch": 0.97, "learning_rate": 4.501691590635293e-08, "loss": 21.1215, "step": 89790 }, { "epoch": 0.97, "learning_rate": 4.468566991277512e-08, "loss": 20.7359, "step": 89800 }, { "epoch": 0.97, "learning_rate": 4.4355644391094186e-08, "loss": 21.7157, "step": 89810 }, { "epoch": 0.97, "learning_rate": 4.40268393817711e-08, "loss": 21.2, "step": 89820 }, { "epoch": 0.97, "learning_rate": 4.369925492511473e-08, "loss": 21.9515, "step": 89830 }, { "epoch": 0.97, "learning_rate": 4.3372891061286284e-08, "loss": 21.0684, "step": 89840 }, { "epoch": 0.97, "learning_rate": 4.304774783029597e-08, "loss": 20.8546, "step": 89850 }, { "epoch": 0.97, "learning_rate": 4.2723825272004137e-08, "loss": 20.7968, "step": 89860 }, { "epoch": 0.97, "learning_rate": 4.2401123426123456e-08, "loss": 20.5941, "step": 89870 }, { "epoch": 0.97, "learning_rate": 4.207964233221451e-08, "loss": 20.9878, "step": 89880 }, { "epoch": 0.97, "learning_rate": 4.17593820296891e-08, "loss": 20.6711, "step": 89890 }, { "epoch": 0.97, "learning_rate": 4.1440342557809156e-08, "loss": 21.1715, "step": 89900 }, { "epoch": 0.97, "learning_rate": 4.1122523955688945e-08, "loss": 21.2202, "step": 89910 }, { "epoch": 0.97, "learning_rate": 4.080592626229063e-08, "loss": 21.5764, "step": 89920 }, { "epoch": 0.97, "learning_rate": 4.049054951642761e-08, "loss": 21.5368, "step": 89930 }, { "epoch": 0.97, "learning_rate": 4.01763937567623e-08, "loss": 21.5919, "step": 89940 }, { "epoch": 0.97, "learning_rate": 3.9863459021810544e-08, "loss": 20.5741, "step": 89950 }, { "epoch": 0.97, "learning_rate": 3.9551745349935e-08, "loss": 21.156, "step": 89960 }, { "epoch": 0.97, "learning_rate": 3.924125277935176e-08, "loss": 21.4874, "step": 89970 }, { "epoch": 0.97, "learning_rate": 3.8931981348124815e-08, "loss": 21.0636, "step": 89980 }, { "epoch": 0.97, "learning_rate": 3.862393109416829e-08, "loss": 21.7438, "step": 89990 }, { "epoch": 0.97, "learning_rate": 3.8317102055249747e-08, "loss": 21.2246, "step": 90000 }, { "epoch": 0.97, "learning_rate": 3.801149426898243e-08, "loss": 21.3271, "step": 90010 }, { "epoch": 0.97, "learning_rate": 3.770710777283526e-08, "loss": 20.9284, "step": 90020 }, { "epoch": 0.97, "learning_rate": 3.740394260412172e-08, "loss": 20.4747, "step": 90030 }, { "epoch": 0.97, "learning_rate": 3.7101998800010975e-08, "loss": 21.5409, "step": 90040 }, { "epoch": 0.97, "learning_rate": 3.680127639751674e-08, "loss": 20.5038, "step": 90050 }, { "epoch": 0.97, "learning_rate": 3.6501775433508414e-08, "loss": 21.3941, "step": 90060 }, { "epoch": 0.97, "learning_rate": 3.6203495944703296e-08, "loss": 21.8024, "step": 90070 }, { "epoch": 0.97, "learning_rate": 3.5906437967667685e-08, "loss": 21.1704, "step": 90080 }, { "epoch": 0.97, "learning_rate": 3.561060153882023e-08, "loss": 21.3565, "step": 90090 }, { "epoch": 0.97, "learning_rate": 3.531598669442859e-08, "loss": 21.4879, "step": 90100 }, { "epoch": 0.97, "learning_rate": 3.502259347061055e-08, "loss": 21.0175, "step": 90110 }, { "epoch": 0.97, "learning_rate": 3.47304219033362e-08, "loss": 20.6346, "step": 90120 }, { "epoch": 0.97, "learning_rate": 3.4439472028423573e-08, "loss": 21.0322, "step": 90130 }, { "epoch": 0.97, "learning_rate": 3.414974388154191e-08, "loss": 21.8358, "step": 90140 }, { "epoch": 0.97, "learning_rate": 3.386123749820947e-08, "loss": 21.7163, "step": 90150 }, { "epoch": 0.97, "learning_rate": 3.3573952913796837e-08, "loss": 20.57, "step": 90160 }, { "epoch": 0.97, "learning_rate": 3.3287890163523626e-08, "loss": 20.9223, "step": 90170 }, { "epoch": 0.97, "learning_rate": 3.3003049282458456e-08, "loss": 21.7835, "step": 90180 }, { "epoch": 0.98, "learning_rate": 3.271943030552227e-08, "loss": 20.8806, "step": 90190 }, { "epoch": 0.98, "learning_rate": 3.243703326748615e-08, "loss": 21.0042, "step": 90200 }, { "epoch": 0.98, "learning_rate": 3.2155858202969073e-08, "loss": 21.7277, "step": 90210 }, { "epoch": 0.98, "learning_rate": 3.187590514644234e-08, "loss": 21.5421, "step": 90220 }, { "epoch": 0.98, "learning_rate": 3.1597174132226294e-08, "loss": 21.2468, "step": 90230 }, { "epoch": 0.98, "learning_rate": 3.131966519449359e-08, "loss": 20.6827, "step": 90240 }, { "epoch": 0.98, "learning_rate": 3.1043378367263676e-08, "loss": 21.5983, "step": 90250 }, { "epoch": 0.98, "learning_rate": 3.076831368440836e-08, "loss": 20.9805, "step": 90260 }, { "epoch": 0.98, "learning_rate": 3.0494471179649543e-08, "loss": 21.5772, "step": 90270 }, { "epoch": 0.98, "learning_rate": 3.0221850886559266e-08, "loss": 20.7771, "step": 90280 }, { "epoch": 0.98, "learning_rate": 2.995045283855857e-08, "loss": 21.8376, "step": 90290 }, { "epoch": 0.98, "learning_rate": 2.9680277068920848e-08, "loss": 20.8941, "step": 90300 }, { "epoch": 0.98, "learning_rate": 2.9411323610766264e-08, "loss": 20.8326, "step": 90310 }, { "epoch": 0.98, "learning_rate": 2.914359249706844e-08, "loss": 21.5435, "step": 90320 }, { "epoch": 0.98, "learning_rate": 2.8877083760650014e-08, "loss": 21.6054, "step": 90330 }, { "epoch": 0.98, "learning_rate": 2.8611797434183742e-08, "loss": 20.4939, "step": 90340 }, { "epoch": 0.98, "learning_rate": 2.834773355019138e-08, "loss": 21.8223, "step": 90350 }, { "epoch": 0.98, "learning_rate": 2.8084892141045926e-08, "loss": 21.4039, "step": 90360 }, { "epoch": 0.98, "learning_rate": 2.7823273238971604e-08, "loss": 21.1868, "step": 90370 }, { "epoch": 0.98, "learning_rate": 2.7562876876040534e-08, "loss": 21.4172, "step": 90380 }, { "epoch": 0.98, "learning_rate": 2.730370308417718e-08, "loss": 21.0302, "step": 90390 }, { "epoch": 0.98, "learning_rate": 2.7045751895153904e-08, "loss": 21.5443, "step": 90400 }, { "epoch": 0.98, "learning_rate": 2.67890233405943e-08, "loss": 21.0815, "step": 90410 }, { "epoch": 0.98, "learning_rate": 2.653351745197208e-08, "loss": 21.3905, "step": 90420 }, { "epoch": 0.98, "learning_rate": 2.6279234260612184e-08, "loss": 21.1998, "step": 90430 }, { "epoch": 0.98, "learning_rate": 2.602617379768635e-08, "loss": 20.9159, "step": 90440 }, { "epoch": 0.98, "learning_rate": 2.5774336094219754e-08, "loss": 21.4151, "step": 90450 }, { "epoch": 0.98, "learning_rate": 2.5523721181086593e-08, "loss": 21.2847, "step": 90460 }, { "epoch": 0.98, "learning_rate": 2.5274329089010064e-08, "loss": 21.4841, "step": 90470 }, { "epoch": 0.98, "learning_rate": 2.5026159848565713e-08, "loss": 20.8519, "step": 90480 }, { "epoch": 0.98, "learning_rate": 2.477921349017698e-08, "loss": 21.1796, "step": 90490 }, { "epoch": 0.98, "learning_rate": 2.4533490044119646e-08, "loss": 20.9031, "step": 90500 }, { "epoch": 0.98, "learning_rate": 2.4288989540515172e-08, "loss": 21.5539, "step": 90510 }, { "epoch": 0.98, "learning_rate": 2.4045712009340692e-08, "loss": 20.5038, "step": 90520 }, { "epoch": 0.98, "learning_rate": 2.380365748042013e-08, "loss": 21.5997, "step": 90530 }, { "epoch": 0.98, "learning_rate": 2.3562825983427517e-08, "loss": 21.0566, "step": 90540 }, { "epoch": 0.98, "learning_rate": 2.3323217547888134e-08, "loss": 21.2671, "step": 90550 }, { "epoch": 0.98, "learning_rate": 2.3084832203177367e-08, "loss": 20.8173, "step": 90560 }, { "epoch": 0.98, "learning_rate": 2.2847669978519616e-08, "loss": 20.685, "step": 90570 }, { "epoch": 0.98, "learning_rate": 2.2611730902989404e-08, "loss": 21.4031, "step": 90580 }, { "epoch": 0.98, "learning_rate": 2.2377015005511373e-08, "loss": 21.7565, "step": 90590 }, { "epoch": 0.98, "learning_rate": 2.2143522314862498e-08, "loss": 20.6476, "step": 90600 }, { "epoch": 0.98, "learning_rate": 2.1911252859665445e-08, "loss": 21.7401, "step": 90610 }, { "epoch": 0.98, "learning_rate": 2.1680206668396318e-08, "loss": 21.1823, "step": 90620 }, { "epoch": 0.98, "learning_rate": 2.1450383769380245e-08, "loss": 20.6052, "step": 90630 }, { "epoch": 0.98, "learning_rate": 2.122178419079246e-08, "loss": 21.0279, "step": 90640 }, { "epoch": 0.98, "learning_rate": 2.0994407960657216e-08, "loss": 21.0718, "step": 90650 }, { "epoch": 0.98, "learning_rate": 2.0768255106851098e-08, "loss": 21.1282, "step": 90660 }, { "epoch": 0.98, "learning_rate": 2.0543325657098602e-08, "loss": 21.2416, "step": 90670 }, { "epoch": 0.98, "learning_rate": 2.031961963897544e-08, "loss": 21.6403, "step": 90680 }, { "epoch": 0.98, "learning_rate": 2.0097137079906347e-08, "loss": 20.8361, "step": 90690 }, { "epoch": 0.98, "learning_rate": 1.9875878007166173e-08, "loss": 21.18, "step": 90700 }, { "epoch": 0.98, "learning_rate": 1.965584244788099e-08, "loss": 21.6891, "step": 90710 }, { "epoch": 0.98, "learning_rate": 1.9437030429025894e-08, "loss": 21.0091, "step": 90720 }, { "epoch": 0.98, "learning_rate": 1.921944197742609e-08, "loss": 21.2162, "step": 90730 }, { "epoch": 0.98, "learning_rate": 1.9003077119755797e-08, "loss": 21.025, "step": 90740 }, { "epoch": 0.98, "learning_rate": 1.8787935882541576e-08, "loss": 21.2945, "step": 90750 }, { "epoch": 0.98, "learning_rate": 1.8574018292158992e-08, "loss": 21.0808, "step": 90760 }, { "epoch": 0.98, "learning_rate": 1.8361324374832622e-08, "loss": 20.3843, "step": 90770 }, { "epoch": 0.98, "learning_rate": 1.814985415663717e-08, "loss": 21.4936, "step": 90780 }, { "epoch": 0.98, "learning_rate": 1.793960766349856e-08, "loss": 21.6923, "step": 90790 }, { "epoch": 0.98, "learning_rate": 1.773058492119173e-08, "loss": 21.9543, "step": 90800 }, { "epoch": 0.98, "learning_rate": 1.752278595534174e-08, "loss": 21.2598, "step": 90810 }, { "epoch": 0.98, "learning_rate": 1.731621079142376e-08, "loss": 20.9548, "step": 90820 }, { "epoch": 0.98, "learning_rate": 1.7110859454763097e-08, "loss": 21.4707, "step": 90830 }, { "epoch": 0.98, "learning_rate": 1.690673197053405e-08, "loss": 21.4865, "step": 90840 }, { "epoch": 0.98, "learning_rate": 1.6703828363762164e-08, "loss": 20.9691, "step": 90850 }, { "epoch": 0.98, "learning_rate": 1.6502148659323093e-08, "loss": 20.983, "step": 90860 }, { "epoch": 0.98, "learning_rate": 1.63016928819415e-08, "loss": 20.6611, "step": 90870 }, { "epoch": 0.98, "learning_rate": 1.6102461056191066e-08, "loss": 21.1312, "step": 90880 }, { "epoch": 0.98, "learning_rate": 1.5904453206497805e-08, "loss": 20.9705, "step": 90890 }, { "epoch": 0.98, "learning_rate": 1.5707669357135634e-08, "loss": 21.1589, "step": 90900 }, { "epoch": 0.98, "learning_rate": 1.5512109532229703e-08, "loss": 20.6164, "step": 90910 }, { "epoch": 0.98, "learning_rate": 1.5317773755755273e-08, "loss": 21.158, "step": 90920 }, { "epoch": 0.98, "learning_rate": 1.512466205153551e-08, "loss": 21.0124, "step": 90930 }, { "epoch": 0.98, "learning_rate": 1.4932774443247034e-08, "loss": 21.1809, "step": 90940 }, { "epoch": 0.98, "learning_rate": 1.4742110954412137e-08, "loss": 21.0446, "step": 90950 }, { "epoch": 0.98, "learning_rate": 1.4552671608406566e-08, "loss": 21.0293, "step": 90960 }, { "epoch": 0.98, "learning_rate": 1.4364456428453966e-08, "loss": 21.1766, "step": 90970 }, { "epoch": 0.98, "learning_rate": 1.4177465437629212e-08, "loss": 21.1561, "step": 90980 }, { "epoch": 0.98, "learning_rate": 1.399169865885619e-08, "loss": 21.5791, "step": 90990 }, { "epoch": 0.98, "learning_rate": 1.3807156114908904e-08, "loss": 21.6129, "step": 91000 }, { "epoch": 0.98, "learning_rate": 1.3623837828410368e-08, "loss": 20.8573, "step": 91010 }, { "epoch": 0.98, "learning_rate": 1.344174382183705e-08, "loss": 21.7112, "step": 91020 }, { "epoch": 0.98, "learning_rate": 1.3260874117509981e-08, "loss": 21.013, "step": 91030 }, { "epoch": 0.98, "learning_rate": 1.3081228737604757e-08, "loss": 21.0525, "step": 91040 }, { "epoch": 0.98, "learning_rate": 1.2902807704143761e-08, "loss": 20.9797, "step": 91050 }, { "epoch": 0.98, "learning_rate": 1.2725611039001717e-08, "loss": 21.9265, "step": 91060 }, { "epoch": 0.98, "learning_rate": 1.2549638763901251e-08, "loss": 21.2789, "step": 91070 }, { "epoch": 0.98, "learning_rate": 1.2374890900415104e-08, "loss": 20.9271, "step": 91080 }, { "epoch": 0.98, "learning_rate": 1.2201367469968362e-08, "loss": 20.9768, "step": 91090 }, { "epoch": 0.98, "learning_rate": 1.2029068493832895e-08, "loss": 20.8593, "step": 91100 }, { "epoch": 0.98, "learning_rate": 1.1857993993130701e-08, "loss": 21.161, "step": 91110 }, { "epoch": 0.99, "learning_rate": 1.1688143988837219e-08, "loss": 21.3001, "step": 91120 }, { "epoch": 0.99, "learning_rate": 1.1519518501772465e-08, "loss": 21.5703, "step": 91130 }, { "epoch": 0.99, "learning_rate": 1.1352117552611009e-08, "loss": 22.2776, "step": 91140 }, { "epoch": 0.99, "learning_rate": 1.1185941161875324e-08, "loss": 21.6399, "step": 91150 }, { "epoch": 0.99, "learning_rate": 1.1020989349936895e-08, "loss": 20.8152, "step": 91160 }, { "epoch": 0.99, "learning_rate": 1.0857262137018432e-08, "loss": 21.0397, "step": 91170 }, { "epoch": 0.99, "learning_rate": 1.0694759543191658e-08, "loss": 21.1081, "step": 91180 }, { "epoch": 0.99, "learning_rate": 1.0533481588379524e-08, "loss": 21.3314, "step": 91190 }, { "epoch": 0.99, "learning_rate": 1.0373428292352883e-08, "loss": 20.6078, "step": 91200 }, { "epoch": 0.99, "learning_rate": 1.0214599674733817e-08, "loss": 20.6476, "step": 91210 }, { "epoch": 0.99, "learning_rate": 1.0056995754993415e-08, "loss": 20.528, "step": 91220 }, { "epoch": 0.99, "learning_rate": 9.900616552454001e-09, "loss": 20.4594, "step": 91230 }, { "epoch": 0.99, "learning_rate": 9.745462086286906e-09, "loss": 20.6532, "step": 91240 }, { "epoch": 0.99, "learning_rate": 9.591532375513578e-09, "loss": 21.2046, "step": 91250 }, { "epoch": 0.99, "learning_rate": 9.438827439003373e-09, "loss": 21.2408, "step": 91260 }, { "epoch": 0.99, "learning_rate": 9.287347295479088e-09, "loss": 21.2896, "step": 91270 }, { "epoch": 0.99, "learning_rate": 9.137091963510314e-09, "loss": 21.1999, "step": 91280 }, { "epoch": 0.99, "learning_rate": 8.988061461516761e-09, "loss": 21.3401, "step": 91290 }, { "epoch": 0.99, "learning_rate": 8.840255807771592e-09, "loss": 21.1995, "step": 91300 }, { "epoch": 0.99, "learning_rate": 8.693675020392534e-09, "loss": 21.2125, "step": 91310 }, { "epoch": 0.99, "learning_rate": 8.548319117350767e-09, "loss": 21.3604, "step": 91320 }, { "epoch": 0.99, "learning_rate": 8.404188116465373e-09, "loss": 20.5624, "step": 91330 }, { "epoch": 0.99, "learning_rate": 8.26128203540666e-09, "loss": 21.528, "step": 91340 }, { "epoch": 0.99, "learning_rate": 8.119600891695056e-09, "loss": 20.7647, "step": 91350 }, { "epoch": 0.99, "learning_rate": 7.979144702698893e-09, "loss": 20.9463, "step": 91360 }, { "epoch": 0.99, "learning_rate": 7.839913485636619e-09, "loss": 21.6425, "step": 91370 }, { "epoch": 0.99, "learning_rate": 7.701907257579022e-09, "loss": 20.9778, "step": 91380 }, { "epoch": 0.99, "learning_rate": 7.565126035443682e-09, "loss": 21.5178, "step": 91390 }, { "epoch": 0.99, "learning_rate": 7.429569836000516e-09, "loss": 21.4277, "step": 91400 }, { "epoch": 0.99, "learning_rate": 7.295238675867344e-09, "loss": 21.6129, "step": 91410 }, { "epoch": 0.99, "learning_rate": 7.162132571512104e-09, "loss": 20.999, "step": 91420 }, { "epoch": 0.99, "learning_rate": 7.0302515392539625e-09, "loss": 21.4207, "step": 91430 }, { "epoch": 0.99, "learning_rate": 6.8995955952588785e-09, "loss": 20.7065, "step": 91440 }, { "epoch": 0.99, "learning_rate": 6.77016475554737e-09, "loss": 21.5798, "step": 91450 }, { "epoch": 0.99, "learning_rate": 6.641959035985634e-09, "loss": 21.5303, "step": 91460 }, { "epoch": 0.99, "learning_rate": 6.514978452289988e-09, "loss": 21.4796, "step": 91470 }, { "epoch": 0.99, "learning_rate": 6.389223020029089e-09, "loss": 20.8392, "step": 91480 }, { "epoch": 0.99, "learning_rate": 6.264692754620605e-09, "loss": 21.5079, "step": 91490 }, { "epoch": 0.99, "learning_rate": 6.141387671328991e-09, "loss": 22.5478, "step": 91500 }, { "epoch": 0.99, "learning_rate": 6.019307785272155e-09, "loss": 20.8981, "step": 91510 }, { "epoch": 0.99, "learning_rate": 5.898453111417013e-09, "loss": 21.1564, "step": 91520 }, { "epoch": 0.99, "learning_rate": 5.778823664579492e-09, "loss": 21.614, "step": 91530 }, { "epoch": 0.99, "learning_rate": 5.6604194594245266e-09, "loss": 20.77, "step": 91540 }, { "epoch": 0.99, "learning_rate": 5.543240510468284e-09, "loss": 21.1776, "step": 91550 }, { "epoch": 0.99, "learning_rate": 5.42728683207705e-09, "loss": 20.8924, "step": 91560 }, { "epoch": 0.99, "learning_rate": 5.31255843846612e-09, "loss": 20.6831, "step": 91570 }, { "epoch": 0.99, "learning_rate": 5.199055343699799e-09, "loss": 21.8896, "step": 91580 }, { "epoch": 0.99, "learning_rate": 5.086777561693623e-09, "loss": 21.7757, "step": 91590 }, { "epoch": 0.99, "learning_rate": 4.975725106212137e-09, "loss": 21.1937, "step": 91600 }, { "epoch": 0.99, "learning_rate": 4.865897990868896e-09, "loss": 21.2964, "step": 91610 }, { "epoch": 0.99, "learning_rate": 4.757296229129793e-09, "loss": 20.9381, "step": 91620 }, { "epoch": 0.99, "learning_rate": 4.649919834308625e-09, "loss": 21.4004, "step": 91630 }, { "epoch": 0.99, "learning_rate": 4.543768819568195e-09, "loss": 20.8306, "step": 91640 }, { "epoch": 0.99, "learning_rate": 4.438843197922538e-09, "loss": 20.6485, "step": 91650 }, { "epoch": 0.99, "learning_rate": 4.335142982234697e-09, "loss": 20.8557, "step": 91660 }, { "epoch": 0.99, "learning_rate": 4.2326681852189465e-09, "loss": 20.743, "step": 91670 }, { "epoch": 0.99, "learning_rate": 4.131418819437461e-09, "loss": 21.3261, "step": 91680 }, { "epoch": 0.99, "learning_rate": 4.031394897302532e-09, "loss": 19.7406, "step": 91690 }, { "epoch": 0.99, "learning_rate": 3.932596431076574e-09, "loss": 21.278, "step": 91700 }, { "epoch": 0.99, "learning_rate": 3.8350234328721204e-09, "loss": 20.881, "step": 91710 }, { "epoch": 0.99, "learning_rate": 3.738675914651823e-09, "loss": 20.2238, "step": 91720 }, { "epoch": 0.99, "learning_rate": 3.6435538882262366e-09, "loss": 20.3248, "step": 91730 }, { "epoch": 0.99, "learning_rate": 3.549657365257142e-09, "loss": 21.7862, "step": 91740 }, { "epoch": 0.99, "learning_rate": 3.456986357256442e-09, "loss": 20.8212, "step": 91750 }, { "epoch": 0.99, "learning_rate": 3.3655408755839393e-09, "loss": 21.4185, "step": 91760 }, { "epoch": 0.99, "learning_rate": 3.275320931451775e-09, "loss": 21.6465, "step": 91770 }, { "epoch": 0.99, "learning_rate": 3.1863265359199924e-09, "loss": 21.0906, "step": 91780 }, { "epoch": 0.99, "learning_rate": 3.098557699898752e-09, "loss": 21.2672, "step": 91790 }, { "epoch": 0.99, "learning_rate": 3.012014434147226e-09, "loss": 21.8096, "step": 91800 }, { "epoch": 0.99, "learning_rate": 2.926696749276925e-09, "loss": 21.7123, "step": 91810 }, { "epoch": 0.99, "learning_rate": 2.8426046557450406e-09, "loss": 20.6542, "step": 91820 }, { "epoch": 0.99, "learning_rate": 2.7597381638633238e-09, "loss": 21.3507, "step": 91830 }, { "epoch": 0.99, "learning_rate": 2.678097283789205e-09, "loss": 20.8493, "step": 91840 }, { "epoch": 0.99, "learning_rate": 2.5976820255324552e-09, "loss": 21.0071, "step": 91850 }, { "epoch": 0.99, "learning_rate": 2.518492398950745e-09, "loss": 21.0327, "step": 91860 }, { "epoch": 0.99, "learning_rate": 2.440528413752974e-09, "loss": 20.6682, "step": 91870 }, { "epoch": 0.99, "learning_rate": 2.3637900794970524e-09, "loss": 21.2112, "step": 91880 }, { "epoch": 0.99, "learning_rate": 2.2882774055899003e-09, "loss": 20.962, "step": 91890 }, { "epoch": 0.99, "learning_rate": 2.2139904012896675e-09, "loss": 20.9873, "step": 91900 }, { "epoch": 0.99, "learning_rate": 2.1409290757035126e-09, "loss": 21.2735, "step": 91910 }, { "epoch": 0.99, "learning_rate": 2.069093437787606e-09, "loss": 20.7706, "step": 91920 }, { "epoch": 0.99, "learning_rate": 1.998483496350456e-09, "loss": 21.6875, "step": 91930 }, { "epoch": 0.99, "learning_rate": 1.929099260047362e-09, "loss": 21.3854, "step": 91940 }, { "epoch": 0.99, "learning_rate": 1.8609407373837429e-09, "loss": 20.7963, "step": 91950 }, { "epoch": 0.99, "learning_rate": 1.7940079367162466e-09, "loss": 21.437, "step": 91960 }, { "epoch": 0.99, "learning_rate": 1.728300866251642e-09, "loss": 21.9034, "step": 91970 }, { "epoch": 0.99, "learning_rate": 1.663819534043487e-09, "loss": 21.4594, "step": 91980 }, { "epoch": 0.99, "learning_rate": 1.6005639479976798e-09, "loss": 21.352, "step": 91990 }, { "epoch": 0.99, "learning_rate": 1.538534115869128e-09, "loss": 20.561, "step": 92000 } ], "logging_steps": 10, "max_steps": 92501, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 4000, "total_flos": 0.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }