|
{"current_steps": 10, "total_steps": 3573, "loss": 1.7981, "lr": 1.3966480446927373e-06, "epoch": 0.008396305625524769, "percentage": 0.28, "elapsed_time": "0:00:30", "remaining_time": "2:59:09"} |
|
{"current_steps": 20, "total_steps": 3573, "loss": 1.7816, "lr": 2.7932960893854746e-06, "epoch": 0.016792611251049538, "percentage": 0.56, "elapsed_time": "0:00:42", "remaining_time": "2:05:34"} |
|
{"current_steps": 30, "total_steps": 3573, "loss": 1.6797, "lr": 4.189944134078212e-06, "epoch": 0.02518891687657431, "percentage": 0.84, "elapsed_time": "0:00:54", "remaining_time": "1:47:34"} |
|
{"current_steps": 40, "total_steps": 3573, "loss": 1.5657, "lr": 5.586592178770949e-06, "epoch": 0.033585222502099076, "percentage": 1.12, "elapsed_time": "0:01:06", "remaining_time": "1:38:30"} |
|
{"current_steps": 50, "total_steps": 3573, "loss": 1.4759, "lr": 6.983240223463687e-06, "epoch": 0.041981528127623846, "percentage": 1.4, "elapsed_time": "0:01:19", "remaining_time": "1:32:58"} |
|
{"current_steps": 60, "total_steps": 3573, "loss": 1.4312, "lr": 8.379888268156424e-06, "epoch": 0.05037783375314862, "percentage": 1.68, "elapsed_time": "0:01:31", "remaining_time": "1:29:12"} |
|
{"current_steps": 70, "total_steps": 3573, "loss": 1.4082, "lr": 9.776536312849161e-06, "epoch": 0.05877413937867338, "percentage": 1.96, "elapsed_time": "0:01:43", "remaining_time": "1:26:26"} |
|
{"current_steps": 80, "total_steps": 3573, "loss": 1.4263, "lr": 1.1173184357541899e-05, "epoch": 0.06717044500419815, "percentage": 2.24, "elapsed_time": "0:01:55", "remaining_time": "1:24:19"} |
|
{"current_steps": 90, "total_steps": 3573, "loss": 1.4216, "lr": 1.2569832402234637e-05, "epoch": 0.07556675062972293, "percentage": 2.52, "elapsed_time": "0:02:08", "remaining_time": "1:22:42"} |
|
{"current_steps": 100, "total_steps": 3573, "loss": 1.4207, "lr": 1.3966480446927374e-05, "epoch": 0.08396305625524769, "percentage": 2.8, "elapsed_time": "0:02:20", "remaining_time": "1:21:18"} |
|
{"current_steps": 110, "total_steps": 3573, "loss": 1.399, "lr": 1.5363128491620113e-05, "epoch": 0.09235936188077246, "percentage": 3.08, "elapsed_time": "0:02:32", "remaining_time": "1:20:06"} |
|
{"current_steps": 120, "total_steps": 3573, "loss": 1.404, "lr": 1.675977653631285e-05, "epoch": 0.10075566750629723, "percentage": 3.36, "elapsed_time": "0:02:44", "remaining_time": "1:19:05"} |
|
{"current_steps": 130, "total_steps": 3573, "loss": 1.4057, "lr": 1.8156424581005588e-05, "epoch": 0.109151973131822, "percentage": 3.64, "elapsed_time": "0:02:57", "remaining_time": "1:18:10"} |
|
{"current_steps": 140, "total_steps": 3573, "loss": 1.3956, "lr": 1.9553072625698323e-05, "epoch": 0.11754827875734676, "percentage": 3.92, "elapsed_time": "0:03:09", "remaining_time": "1:17:22"} |
|
{"current_steps": 150, "total_steps": 3573, "loss": 1.4179, "lr": 2.0949720670391062e-05, "epoch": 0.12594458438287154, "percentage": 4.2, "elapsed_time": "0:03:21", "remaining_time": "1:16:39"} |
|
{"current_steps": 160, "total_steps": 3573, "loss": 1.412, "lr": 2.2346368715083797e-05, "epoch": 0.1343408900083963, "percentage": 4.48, "elapsed_time": "0:03:33", "remaining_time": "1:16:00"} |
|
{"current_steps": 170, "total_steps": 3573, "loss": 1.39, "lr": 2.3743016759776536e-05, "epoch": 0.14273719563392107, "percentage": 4.76, "elapsed_time": "0:03:46", "remaining_time": "1:15:24"} |
|
{"current_steps": 180, "total_steps": 3573, "loss": 1.4004, "lr": 2.5139664804469275e-05, "epoch": 0.15113350125944586, "percentage": 5.04, "elapsed_time": "0:03:58", "remaining_time": "1:14:50"} |
|
{"current_steps": 190, "total_steps": 3573, "loss": 1.386, "lr": 2.6536312849162014e-05, "epoch": 0.15952980688497062, "percentage": 5.32, "elapsed_time": "0:04:10", "remaining_time": "1:14:18"} |
|
{"current_steps": 200, "total_steps": 3573, "loss": 1.4012, "lr": 2.793296089385475e-05, "epoch": 0.16792611251049538, "percentage": 5.6, "elapsed_time": "0:04:22", "remaining_time": "1:13:50"} |
|
{"current_steps": 210, "total_steps": 3573, "loss": 1.3707, "lr": 2.9329608938547488e-05, "epoch": 0.17632241813602015, "percentage": 5.88, "elapsed_time": "0:04:34", "remaining_time": "1:13:23"} |
|
{"current_steps": 220, "total_steps": 3573, "loss": 1.4125, "lr": 3.0726256983240227e-05, "epoch": 0.1847187237615449, "percentage": 6.16, "elapsed_time": "0:04:47", "remaining_time": "1:12:57"} |
|
{"current_steps": 230, "total_steps": 3573, "loss": 1.3699, "lr": 3.212290502793296e-05, "epoch": 0.19311502938706968, "percentage": 6.44, "elapsed_time": "0:04:59", "remaining_time": "1:12:31"} |
|
{"current_steps": 240, "total_steps": 3573, "loss": 1.374, "lr": 3.35195530726257e-05, "epoch": 0.20151133501259447, "percentage": 6.72, "elapsed_time": "0:05:11", "remaining_time": "1:12:06"} |
|
{"current_steps": 250, "total_steps": 3573, "loss": 1.3788, "lr": 3.491620111731844e-05, "epoch": 0.20990764063811923, "percentage": 7.0, "elapsed_time": "0:05:23", "remaining_time": "1:11:42"} |
|
{"current_steps": 260, "total_steps": 3573, "loss": 1.3565, "lr": 3.6312849162011175e-05, "epoch": 0.218303946263644, "percentage": 7.28, "elapsed_time": "0:05:35", "remaining_time": "1:11:20"} |
|
{"current_steps": 270, "total_steps": 3573, "loss": 1.3521, "lr": 3.770949720670392e-05, "epoch": 0.22670025188916876, "percentage": 7.56, "elapsed_time": "0:05:48", "remaining_time": "1:10:58"} |
|
{"current_steps": 280, "total_steps": 3573, "loss": 1.3613, "lr": 3.9106145251396646e-05, "epoch": 0.23509655751469352, "percentage": 7.84, "elapsed_time": "0:06:00", "remaining_time": "1:10:37"} |
|
{"current_steps": 290, "total_steps": 3573, "loss": 1.36, "lr": 4.050279329608939e-05, "epoch": 0.2434928631402183, "percentage": 8.12, "elapsed_time": "0:06:12", "remaining_time": "1:10:17"} |
|
{"current_steps": 300, "total_steps": 3573, "loss": 1.3799, "lr": 4.1899441340782123e-05, "epoch": 0.2518891687657431, "percentage": 8.4, "elapsed_time": "0:06:24", "remaining_time": "1:09:58"} |
|
{"current_steps": 310, "total_steps": 3573, "loss": 1.3797, "lr": 4.3296089385474866e-05, "epoch": 0.26028547439126787, "percentage": 8.68, "elapsed_time": "0:06:37", "remaining_time": "1:09:39"} |
|
{"current_steps": 320, "total_steps": 3573, "loss": 1.3675, "lr": 4.4692737430167594e-05, "epoch": 0.2686817800167926, "percentage": 8.96, "elapsed_time": "0:06:49", "remaining_time": "1:09:21"} |
|
{"current_steps": 330, "total_steps": 3573, "loss": 1.3888, "lr": 4.6089385474860336e-05, "epoch": 0.2770780856423174, "percentage": 9.24, "elapsed_time": "0:07:01", "remaining_time": "1:09:02"} |
|
{"current_steps": 340, "total_steps": 3573, "loss": 1.3626, "lr": 4.748603351955307e-05, "epoch": 0.28547439126784213, "percentage": 9.52, "elapsed_time": "0:07:13", "remaining_time": "1:08:45"} |
|
{"current_steps": 350, "total_steps": 3573, "loss": 1.3598, "lr": 4.8882681564245814e-05, "epoch": 0.2938706968933669, "percentage": 9.8, "elapsed_time": "0:07:26", "remaining_time": "1:08:27"} |
|
{"current_steps": 360, "total_steps": 3573, "loss": 1.3933, "lr": 4.9999952257225154e-05, "epoch": 0.3022670025188917, "percentage": 10.08, "elapsed_time": "0:07:38", "remaining_time": "1:08:10"} |
|
{"current_steps": 370, "total_steps": 3573, "loss": 1.3723, "lr": 4.9998281279252004e-05, "epoch": 0.31066330814441645, "percentage": 10.36, "elapsed_time": "0:07:50", "remaining_time": "1:07:53"} |
|
{"current_steps": 380, "total_steps": 3573, "loss": 1.3889, "lr": 4.9994223344882976e-05, "epoch": 0.31905961376994124, "percentage": 10.64, "elapsed_time": "0:08:02", "remaining_time": "1:07:36"} |
|
{"current_steps": 390, "total_steps": 3573, "loss": 1.3757, "lr": 4.9987778841589184e-05, "epoch": 0.327455919395466, "percentage": 10.92, "elapsed_time": "0:08:15", "remaining_time": "1:07:20"} |
|
{"current_steps": 400, "total_steps": 3573, "loss": 1.3602, "lr": 4.997894838472288e-05, "epoch": 0.33585222502099077, "percentage": 11.2, "elapsed_time": "0:08:27", "remaining_time": "1:07:04"} |
|
{"current_steps": 410, "total_steps": 3573, "loss": 1.3483, "lr": 4.996773281745864e-05, "epoch": 0.34424853064651556, "percentage": 11.47, "elapsed_time": "0:08:39", "remaining_time": "1:06:48"} |
|
{"current_steps": 420, "total_steps": 3573, "loss": 1.3773, "lr": 4.9954133210712904e-05, "epoch": 0.3526448362720403, "percentage": 11.75, "elapsed_time": "0:08:51", "remaining_time": "1:06:32"} |
|
{"current_steps": 430, "total_steps": 3573, "loss": 1.3817, "lr": 4.9938150863041666e-05, "epoch": 0.3610411418975651, "percentage": 12.03, "elapsed_time": "0:09:03", "remaining_time": "1:06:15"} |
|
{"current_steps": 440, "total_steps": 3573, "loss": 1.3436, "lr": 4.991978730051653e-05, "epoch": 0.3694374475230898, "percentage": 12.31, "elapsed_time": "0:09:16", "remaining_time": "1:05:59"} |
|
{"current_steps": 450, "total_steps": 3573, "loss": 1.376, "lr": 4.9899044276578956e-05, "epoch": 0.3778337531486146, "percentage": 12.59, "elapsed_time": "0:09:28", "remaining_time": "1:05:42"} |
|
{"current_steps": 460, "total_steps": 3573, "loss": 1.3699, "lr": 4.987592377187286e-05, "epoch": 0.38623005877413935, "percentage": 12.87, "elapsed_time": "0:09:40", "remaining_time": "1:05:27"} |
|
{"current_steps": 470, "total_steps": 3573, "loss": 1.3831, "lr": 4.985042799405547e-05, "epoch": 0.39462636439966414, "percentage": 13.15, "elapsed_time": "0:09:52", "remaining_time": "1:05:11"} |
|
{"current_steps": 480, "total_steps": 3573, "loss": 1.3579, "lr": 4.982255937758657e-05, "epoch": 0.40302267002518893, "percentage": 13.43, "elapsed_time": "0:10:04", "remaining_time": "1:04:56"} |
|
{"current_steps": 490, "total_steps": 3573, "loss": 1.348, "lr": 4.9792320583495975e-05, "epoch": 0.41141897565071367, "percentage": 13.71, "elapsed_time": "0:10:16", "remaining_time": "1:04:41"} |
|
{"current_steps": 500, "total_steps": 3573, "loss": 1.3474, "lr": 4.975971449912952e-05, "epoch": 0.41981528127623846, "percentage": 13.99, "elapsed_time": "0:10:29", "remaining_time": "1:04:26"} |
|
{"current_steps": 510, "total_steps": 3573, "loss": 1.3609, "lr": 4.972474423787331e-05, "epoch": 0.4282115869017632, "percentage": 14.27, "elapsed_time": "0:11:08", "remaining_time": "1:06:56"} |
|
{"current_steps": 520, "total_steps": 3573, "loss": 1.3829, "lr": 4.9687413138856446e-05, "epoch": 0.436607892527288, "percentage": 14.55, "elapsed_time": "0:11:20", "remaining_time": "1:06:38"} |
|
{"current_steps": 530, "total_steps": 3573, "loss": 1.3554, "lr": 4.964772476663222e-05, "epoch": 0.4450041981528128, "percentage": 14.83, "elapsed_time": "0:11:33", "remaining_time": "1:06:20"} |
|
{"current_steps": 540, "total_steps": 3573, "loss": 1.3515, "lr": 4.960568291083772e-05, "epoch": 0.4534005037783375, "percentage": 15.11, "elapsed_time": "0:11:45", "remaining_time": "1:06:02"} |
|
{"current_steps": 550, "total_steps": 3573, "loss": 1.3547, "lr": 4.956129158583199e-05, "epoch": 0.4617968094038623, "percentage": 15.39, "elapsed_time": "0:11:57", "remaining_time": "1:05:44"} |
|
{"current_steps": 560, "total_steps": 3573, "loss": 1.329, "lr": 4.951455503031271e-05, "epoch": 0.47019311502938704, "percentage": 15.67, "elapsed_time": "0:12:09", "remaining_time": "1:05:27"} |
|
{"current_steps": 570, "total_steps": 3573, "loss": 1.3547, "lr": 4.946547770691152e-05, "epoch": 0.47858942065491183, "percentage": 15.95, "elapsed_time": "0:12:22", "remaining_time": "1:05:09"} |
|
{"current_steps": 580, "total_steps": 3573, "loss": 1.3421, "lr": 4.9414064301767786e-05, "epoch": 0.4869857262804366, "percentage": 16.23, "elapsed_time": "0:12:34", "remaining_time": "1:04:52"} |
|
{"current_steps": 590, "total_steps": 3573, "loss": 1.3576, "lr": 4.9360319724081285e-05, "epoch": 0.49538203190596136, "percentage": 16.51, "elapsed_time": "0:12:46", "remaining_time": "1:04:35"} |
|
{"current_steps": 600, "total_steps": 3573, "loss": 1.3667, "lr": 4.930424910564334e-05, "epoch": 0.5037783375314862, "percentage": 16.79, "elapsed_time": "0:12:58", "remaining_time": "1:04:19"} |
|
{"current_steps": 600, "total_steps": 3573, "eval_loss": 1.3807679414749146, "epoch": 0.5037783375314862, "percentage": 16.79, "elapsed_time": "0:13:36", "remaining_time": "1:07:24"} |
|
{"current_steps": 610, "total_steps": 3573, "loss": 1.3504, "lr": 4.92458578003469e-05, "epoch": 0.5121746431570109, "percentage": 17.07, "elapsed_time": "0:13:48", "remaining_time": "1:07:04"} |
|
{"current_steps": 620, "total_steps": 3573, "loss": 1.339, "lr": 4.9185151383675246e-05, "epoch": 0.5205709487825357, "percentage": 17.35, "elapsed_time": "0:14:00", "remaining_time": "1:06:44"} |
|
{"current_steps": 630, "total_steps": 3573, "loss": 1.3358, "lr": 4.912213565216966e-05, "epoch": 0.5289672544080605, "percentage": 17.63, "elapsed_time": "0:14:12", "remaining_time": "1:06:24"} |
|
{"current_steps": 640, "total_steps": 3573, "loss": 1.3708, "lr": 4.905681662287595e-05, "epoch": 0.5373635600335852, "percentage": 17.91, "elapsed_time": "0:14:25", "remaining_time": "1:06:05"} |
|
{"current_steps": 650, "total_steps": 3573, "loss": 1.363, "lr": 4.898920053276989e-05, "epoch": 0.5457598656591099, "percentage": 18.19, "elapsed_time": "0:14:37", "remaining_time": "1:05:46"} |
|
{"current_steps": 660, "total_steps": 3573, "loss": 1.3993, "lr": 4.891929383816169e-05, "epoch": 0.5541561712846348, "percentage": 18.47, "elapsed_time": "0:14:49", "remaining_time": "1:05:26"} |
|
{"current_steps": 670, "total_steps": 3573, "loss": 1.351, "lr": 4.8847103214079524e-05, "epoch": 0.5625524769101595, "percentage": 18.75, "elapsed_time": "0:15:01", "remaining_time": "1:05:07"} |
|
{"current_steps": 680, "total_steps": 3573, "loss": 1.3494, "lr": 4.877263555363216e-05, "epoch": 0.5709487825356843, "percentage": 19.03, "elapsed_time": "0:15:14", "remaining_time": "1:04:48"} |
|
{"current_steps": 690, "total_steps": 3573, "loss": 1.3699, "lr": 4.869589796735078e-05, "epoch": 0.5793450881612091, "percentage": 19.31, "elapsed_time": "0:15:26", "remaining_time": "1:04:30"} |
|
{"current_steps": 700, "total_steps": 3573, "loss": 1.3358, "lr": 4.8616897782510006e-05, "epoch": 0.5877413937867338, "percentage": 19.59, "elapsed_time": "0:15:38", "remaining_time": "1:04:12"} |
|
{"current_steps": 710, "total_steps": 3573, "loss": 1.3417, "lr": 4.853564254242831e-05, "epoch": 0.5961376994122586, "percentage": 19.87, "elapsed_time": "0:15:50", "remaining_time": "1:03:54"} |
|
{"current_steps": 720, "total_steps": 3573, "loss": 1.3633, "lr": 4.845214000574768e-05, "epoch": 0.6045340050377834, "percentage": 20.15, "elapsed_time": "0:16:03", "remaining_time": "1:03:36"} |
|
{"current_steps": 730, "total_steps": 3573, "loss": 1.3582, "lr": 4.8366398145692824e-05, "epoch": 0.6129303106633082, "percentage": 20.43, "elapsed_time": "0:16:15", "remaining_time": "1:03:18"} |
|
{"current_steps": 740, "total_steps": 3573, "loss": 1.3702, "lr": 4.827842514930985e-05, "epoch": 0.6213266162888329, "percentage": 20.71, "elapsed_time": "0:16:27", "remaining_time": "1:03:00"} |
|
{"current_steps": 750, "total_steps": 3573, "loss": 1.3807, "lr": 4.81882294166845e-05, "epoch": 0.6297229219143576, "percentage": 20.99, "elapsed_time": "0:16:39", "remaining_time": "1:02:43"} |
|
{"current_steps": 760, "total_steps": 3573, "loss": 1.3593, "lr": 4.8095819560140096e-05, "epoch": 0.6381192275398825, "percentage": 21.27, "elapsed_time": "0:16:51", "remaining_time": "1:02:25"} |
|
{"current_steps": 770, "total_steps": 3573, "loss": 1.3583, "lr": 4.8001204403415204e-05, "epoch": 0.6465155331654072, "percentage": 21.55, "elapsed_time": "0:17:04", "remaining_time": "1:02:08"} |
|
{"current_steps": 780, "total_steps": 3573, "loss": 1.3478, "lr": 4.7904392980821035e-05, "epoch": 0.654911838790932, "percentage": 21.83, "elapsed_time": "0:17:16", "remaining_time": "1:01:50"} |
|
{"current_steps": 790, "total_steps": 3573, "loss": 1.361, "lr": 4.78053945363789e-05, "epoch": 0.6633081444164568, "percentage": 22.11, "elapsed_time": "0:17:28", "remaining_time": "1:01:33"} |
|
{"current_steps": 800, "total_steps": 3573, "loss": 1.3445, "lr": 4.770421852293746e-05, "epoch": 0.6717044500419815, "percentage": 22.39, "elapsed_time": "0:17:40", "remaining_time": "1:01:17"} |
|
{"current_steps": 810, "total_steps": 3573, "loss": 1.3328, "lr": 4.760087460127019e-05, "epoch": 0.6801007556675063, "percentage": 22.67, "elapsed_time": "0:17:53", "remaining_time": "1:01:00"} |
|
{"current_steps": 820, "total_steps": 3573, "loss": 1.327, "lr": 4.749537263915288e-05, "epoch": 0.6884970612930311, "percentage": 22.95, "elapsed_time": "0:18:05", "remaining_time": "1:00:43"} |
|
{"current_steps": 830, "total_steps": 3573, "loss": 1.3508, "lr": 4.7387722710421414e-05, "epoch": 0.6968933669185559, "percentage": 23.23, "elapsed_time": "0:18:17", "remaining_time": "1:00:26"} |
|
{"current_steps": 840, "total_steps": 3573, "loss": 1.331, "lr": 4.7277935094009896e-05, "epoch": 0.7052896725440806, "percentage": 23.51, "elapsed_time": "0:18:29", "remaining_time": "1:00:09"} |
|
{"current_steps": 850, "total_steps": 3573, "loss": 1.3398, "lr": 4.716602027296916e-05, "epoch": 0.7136859781696053, "percentage": 23.79, "elapsed_time": "0:18:41", "remaining_time": "0:59:53"} |
|
{"current_steps": 860, "total_steps": 3573, "loss": 1.3557, "lr": 4.705198893346578e-05, "epoch": 0.7220822837951302, "percentage": 24.07, "elapsed_time": "0:18:53", "remaining_time": "0:59:36"} |
|
{"current_steps": 870, "total_steps": 3573, "loss": 1.3422, "lr": 4.693585196376171e-05, "epoch": 0.7304785894206549, "percentage": 24.35, "elapsed_time": "0:19:05", "remaining_time": "0:59:20"} |
|
{"current_steps": 880, "total_steps": 3573, "loss": 1.3767, "lr": 4.681762045317464e-05, "epoch": 0.7388748950461796, "percentage": 24.63, "elapsed_time": "0:19:18", "remaining_time": "0:59:03"} |
|
{"current_steps": 890, "total_steps": 3573, "loss": 1.3459, "lr": 4.6697305691019105e-05, "epoch": 0.7472712006717045, "percentage": 24.91, "elapsed_time": "0:19:30", "remaining_time": "0:58:47"} |
|
{"current_steps": 900, "total_steps": 3573, "loss": 1.3253, "lr": 4.6574919165528567e-05, "epoch": 0.7556675062972292, "percentage": 25.19, "elapsed_time": "0:19:42", "remaining_time": "0:58:31"} |
|
{"current_steps": 910, "total_steps": 3573, "loss": 1.3419, "lr": 4.645047256275839e-05, "epoch": 0.764063811922754, "percentage": 25.47, "elapsed_time": "0:19:54", "remaining_time": "0:58:15"} |
|
{"current_steps": 920, "total_steps": 3573, "loss": 1.3478, "lr": 4.632397776547011e-05, "epoch": 0.7724601175482787, "percentage": 25.75, "elapsed_time": "0:20:06", "remaining_time": "0:57:59"} |
|
{"current_steps": 930, "total_steps": 3573, "loss": 1.3391, "lr": 4.619544685199669e-05, "epoch": 0.7808564231738035, "percentage": 26.03, "elapsed_time": "0:20:18", "remaining_time": "0:57:43"} |
|
{"current_steps": 940, "total_steps": 3573, "loss": 1.3445, "lr": 4.6064892095089326e-05, "epoch": 0.7892527287993283, "percentage": 26.31, "elapsed_time": "0:20:30", "remaining_time": "0:57:27"} |
|
{"current_steps": 950, "total_steps": 3573, "loss": 1.3167, "lr": 4.59323259607455e-05, "epoch": 0.797649034424853, "percentage": 26.59, "elapsed_time": "0:20:42", "remaining_time": "0:57:11"} |
|
{"current_steps": 960, "total_steps": 3573, "loss": 1.3383, "lr": 4.5797761107018754e-05, "epoch": 0.8060453400503779, "percentage": 26.87, "elapsed_time": "0:20:54", "remaining_time": "0:56:55"} |
|
{"current_steps": 970, "total_steps": 3573, "loss": 1.3404, "lr": 4.566121038280995e-05, "epoch": 0.8144416456759026, "percentage": 27.15, "elapsed_time": "0:21:07", "remaining_time": "0:56:40"} |
|
{"current_steps": 980, "total_steps": 3573, "loss": 1.3333, "lr": 4.552268682664045e-05, "epoch": 0.8228379513014273, "percentage": 27.43, "elapsed_time": "0:21:19", "remaining_time": "0:56:24"} |
|
{"current_steps": 990, "total_steps": 3573, "loss": 1.3182, "lr": 4.538220366540713e-05, "epoch": 0.8312342569269522, "percentage": 27.71, "elapsed_time": "0:21:31", "remaining_time": "0:56:09"} |
|
{"current_steps": 1000, "total_steps": 3573, "loss": 1.3494, "lr": 4.52397743131194e-05, "epoch": 0.8396305625524769, "percentage": 27.99, "elapsed_time": "0:21:43", "remaining_time": "0:55:53"} |
|
{"current_steps": 1010, "total_steps": 3573, "loss": 1.3372, "lr": 4.509541236961835e-05, "epoch": 0.8480268681780017, "percentage": 28.27, "elapsed_time": "0:22:17", "remaining_time": "0:56:35"} |
|
{"current_steps": 1020, "total_steps": 3573, "loss": 1.3459, "lr": 4.4949131619278233e-05, "epoch": 0.8564231738035264, "percentage": 28.55, "elapsed_time": "0:22:30", "remaining_time": "0:56:19"} |
|
{"current_steps": 1030, "total_steps": 3573, "loss": 1.3288, "lr": 4.4800946029690205e-05, "epoch": 0.8648194794290512, "percentage": 28.83, "elapsed_time": "0:22:42", "remaining_time": "0:56:03"} |
|
{"current_steps": 1040, "total_steps": 3573, "loss": 1.3524, "lr": 4.465086975032866e-05, "epoch": 0.873215785054576, "percentage": 29.11, "elapsed_time": "0:22:54", "remaining_time": "0:55:47"} |
|
{"current_steps": 1050, "total_steps": 3573, "loss": 1.3233, "lr": 4.4498917111200154e-05, "epoch": 0.8816120906801007, "percentage": 29.39, "elapsed_time": "0:23:06", "remaining_time": "0:55:31"} |
|
{"current_steps": 1060, "total_steps": 3573, "loss": 1.3486, "lr": 4.434510262147514e-05, "epoch": 0.8900083963056256, "percentage": 29.67, "elapsed_time": "0:23:18", "remaining_time": "0:55:15"} |
|
{"current_steps": 1070, "total_steps": 3573, "loss": 1.3375, "lr": 4.418944096810253e-05, "epoch": 0.8984047019311503, "percentage": 29.95, "elapsed_time": "0:23:30", "remaining_time": "0:55:00"} |
|
{"current_steps": 1080, "total_steps": 3573, "loss": 1.3428, "lr": 4.403194701440733e-05, "epoch": 0.906801007556675, "percentage": 30.23, "elapsed_time": "0:23:42", "remaining_time": "0:54:44"} |
|
{"current_steps": 1090, "total_steps": 3573, "loss": 1.3312, "lr": 4.3872635798671384e-05, "epoch": 0.9151973131821999, "percentage": 30.51, "elapsed_time": "0:23:55", "remaining_time": "0:54:29"} |
|
{"current_steps": 1100, "total_steps": 3573, "loss": 1.3268, "lr": 4.3711522532697526e-05, "epoch": 0.9235936188077246, "percentage": 30.79, "elapsed_time": "0:24:07", "remaining_time": "0:54:14"} |
|
{"current_steps": 1110, "total_steps": 3573, "loss": 1.2904, "lr": 4.354862260035699e-05, "epoch": 0.9319899244332494, "percentage": 31.07, "elapsed_time": "0:24:19", "remaining_time": "0:53:58"} |
|
{"current_steps": 1120, "total_steps": 3573, "loss": 1.3352, "lr": 4.338395155612055e-05, "epoch": 0.9403862300587741, "percentage": 31.35, "elapsed_time": "0:24:31", "remaining_time": "0:53:43"} |
|
{"current_steps": 1130, "total_steps": 3573, "loss": 1.3327, "lr": 4.321752512357328e-05, "epoch": 0.9487825356842989, "percentage": 31.63, "elapsed_time": "0:24:43", "remaining_time": "0:53:27"} |
|
{"current_steps": 1140, "total_steps": 3573, "loss": 1.3293, "lr": 4.304935919391317e-05, "epoch": 0.9571788413098237, "percentage": 31.91, "elapsed_time": "0:24:55", "remaining_time": "0:53:12"} |
|
{"current_steps": 1150, "total_steps": 3573, "loss": 1.3171, "lr": 4.2879469824433814e-05, "epoch": 0.9655751469353484, "percentage": 32.19, "elapsed_time": "0:25:08", "remaining_time": "0:52:57"} |
|
{"current_steps": 1160, "total_steps": 3573, "loss": 1.3291, "lr": 4.2707873236991116e-05, "epoch": 0.9739714525608733, "percentage": 32.47, "elapsed_time": "0:25:20", "remaining_time": "0:52:42"} |
|
{"current_steps": 1170, "total_steps": 3573, "loss": 1.2906, "lr": 4.2534585816454384e-05, "epoch": 0.982367758186398, "percentage": 32.75, "elapsed_time": "0:25:32", "remaining_time": "0:52:27"} |
|
{"current_steps": 1180, "total_steps": 3573, "loss": 1.3516, "lr": 4.235962410914185e-05, "epoch": 0.9907640638119227, "percentage": 33.03, "elapsed_time": "0:25:44", "remaining_time": "0:52:12"} |
|
{"current_steps": 1190, "total_steps": 3573, "loss": 1.3249, "lr": 4.218300482124069e-05, "epoch": 0.9991603694374476, "percentage": 33.31, "elapsed_time": "0:25:56", "remaining_time": "0:51:57"} |
|
{"current_steps": 1200, "total_steps": 3573, "loss": 1.2766, "lr": 4.2004744817211866e-05, "epoch": 1.0075566750629723, "percentage": 33.59, "elapsed_time": "0:26:08", "remaining_time": "0:51:42"} |
|
{"current_steps": 1200, "total_steps": 3573, "eval_loss": 1.3506666421890259, "epoch": 1.0075566750629723, "percentage": 33.59, "elapsed_time": "0:26:46", "remaining_time": "0:52:56"} |
|
{"current_steps": 1210, "total_steps": 3573, "loss": 1.2816, "lr": 4.182486111817983e-05, "epoch": 1.015952980688497, "percentage": 33.87, "elapsed_time": "0:26:58", "remaining_time": "0:52:40"} |
|
{"current_steps": 1220, "total_steps": 3573, "loss": 1.2815, "lr": 4.164337090030727e-05, "epoch": 1.0243492863140218, "percentage": 34.14, "elapsed_time": "0:27:10", "remaining_time": "0:52:24"} |
|
{"current_steps": 1230, "total_steps": 3573, "loss": 1.2692, "lr": 4.146029149315502e-05, "epoch": 1.0327455919395465, "percentage": 34.42, "elapsed_time": "0:27:22", "remaining_time": "0:52:08"} |
|
{"current_steps": 1240, "total_steps": 3573, "loss": 1.2572, "lr": 4.1275640378027367e-05, "epoch": 1.0411418975650715, "percentage": 34.7, "elapsed_time": "0:27:34", "remaining_time": "0:51:53"} |
|
{"current_steps": 1250, "total_steps": 3573, "loss": 1.2636, "lr": 4.108943518630287e-05, "epoch": 1.0495382031905962, "percentage": 34.98, "elapsed_time": "0:27:47", "remaining_time": "0:51:37"} |
|
{"current_steps": 1260, "total_steps": 3573, "loss": 1.246, "lr": 4.09016936977508e-05, "epoch": 1.057934508816121, "percentage": 35.26, "elapsed_time": "0:27:59", "remaining_time": "0:51:22"} |
|
{"current_steps": 1270, "total_steps": 3573, "loss": 1.2416, "lr": 4.071243383883344e-05, "epoch": 1.0663308144416457, "percentage": 35.54, "elapsed_time": "0:28:11", "remaining_time": "0:51:07"} |
|
{"current_steps": 1280, "total_steps": 3573, "loss": 1.2684, "lr": 4.052167368099443e-05, "epoch": 1.0747271200671704, "percentage": 35.82, "elapsed_time": "0:28:23", "remaining_time": "0:50:51"} |
|
{"current_steps": 1290, "total_steps": 3573, "loss": 1.2679, "lr": 4.032943143893315e-05, "epoch": 1.0831234256926952, "percentage": 36.1, "elapsed_time": "0:28:35", "remaining_time": "0:50:36"} |
|
{"current_steps": 1300, "total_steps": 3573, "loss": 1.2801, "lr": 4.0135725468865545e-05, "epoch": 1.0915197313182199, "percentage": 36.38, "elapsed_time": "0:28:47", "remaining_time": "0:50:21"} |
|
{"current_steps": 1310, "total_steps": 3573, "loss": 1.2552, "lr": 3.994057426677135e-05, "epoch": 1.0999160369437448, "percentage": 36.66, "elapsed_time": "0:29:00", "remaining_time": "0:50:05"} |
|
{"current_steps": 1320, "total_steps": 3573, "loss": 1.2467, "lr": 3.974399646662804e-05, "epoch": 1.1083123425692696, "percentage": 36.94, "elapsed_time": "0:29:12", "remaining_time": "0:49:50"} |
|
{"current_steps": 1330, "total_steps": 3573, "loss": 1.2393, "lr": 3.9546010838631523e-05, "epoch": 1.1167086481947943, "percentage": 37.22, "elapsed_time": "0:29:24", "remaining_time": "0:49:35"} |
|
{"current_steps": 1340, "total_steps": 3573, "loss": 1.2413, "lr": 3.9346636287403936e-05, "epoch": 1.125104953820319, "percentage": 37.5, "elapsed_time": "0:29:36", "remaining_time": "0:49:20"} |
|
{"current_steps": 1350, "total_steps": 3573, "loss": 1.2344, "lr": 3.9145891850188446e-05, "epoch": 1.1335012594458438, "percentage": 37.78, "elapsed_time": "0:29:48", "remaining_time": "0:49:05"} |
|
{"current_steps": 1360, "total_steps": 3573, "loss": 1.2723, "lr": 3.894379669503159e-05, "epoch": 1.1418975650713685, "percentage": 38.06, "elapsed_time": "0:30:00", "remaining_time": "0:48:50"} |
|
{"current_steps": 1370, "total_steps": 3573, "loss": 1.2441, "lr": 3.874037011895294e-05, "epoch": 1.1502938706968933, "percentage": 38.34, "elapsed_time": "0:30:12", "remaining_time": "0:48:35"} |
|
{"current_steps": 1380, "total_steps": 3573, "loss": 1.2599, "lr": 3.853563154610255e-05, "epoch": 1.1586901763224182, "percentage": 38.62, "elapsed_time": "0:30:25", "remaining_time": "0:48:20"} |
|
{"current_steps": 1390, "total_steps": 3573, "loss": 1.2596, "lr": 3.832960052590626e-05, "epoch": 1.167086481947943, "percentage": 38.9, "elapsed_time": "0:30:37", "remaining_time": "0:48:05"} |
|
{"current_steps": 1400, "total_steps": 3573, "loss": 1.2679, "lr": 3.812229673119902e-05, "epoch": 1.1754827875734677, "percentage": 39.18, "elapsed_time": "0:30:49", "remaining_time": "0:47:50"} |
|
{"current_steps": 1410, "total_steps": 3573, "loss": 1.2893, "lr": 3.791373995634641e-05, "epoch": 1.1838790931989924, "percentage": 39.46, "elapsed_time": "0:31:01", "remaining_time": "0:47:35"} |
|
{"current_steps": 1420, "total_steps": 3573, "loss": 1.2858, "lr": 3.770395011535459e-05, "epoch": 1.1922753988245172, "percentage": 39.74, "elapsed_time": "0:31:13", "remaining_time": "0:47:21"} |
|
{"current_steps": 1430, "total_steps": 3573, "loss": 1.2544, "lr": 3.749294723996884e-05, "epoch": 1.200671704450042, "percentage": 40.02, "elapsed_time": "0:31:26", "remaining_time": "0:47:06"} |
|
{"current_steps": 1440, "total_steps": 3573, "loss": 1.2406, "lr": 3.72807514777608e-05, "epoch": 1.2090680100755669, "percentage": 40.3, "elapsed_time": "0:31:38", "remaining_time": "0:46:51"} |
|
{"current_steps": 1450, "total_steps": 3573, "loss": 1.2687, "lr": 3.7067383090204696e-05, "epoch": 1.2174643157010916, "percentage": 40.58, "elapsed_time": "0:31:50", "remaining_time": "0:46:37"} |
|
{"current_steps": 1460, "total_steps": 3573, "loss": 1.2529, "lr": 3.6852862450742664e-05, "epoch": 1.2258606213266163, "percentage": 40.86, "elapsed_time": "0:32:02", "remaining_time": "0:46:22"} |
|
{"current_steps": 1470, "total_steps": 3573, "loss": 1.2607, "lr": 3.663721004283942e-05, "epoch": 1.234256926952141, "percentage": 41.14, "elapsed_time": "0:32:14", "remaining_time": "0:46:07"} |
|
{"current_steps": 1480, "total_steps": 3573, "loss": 1.2633, "lr": 3.642044645802638e-05, "epoch": 1.2426532325776658, "percentage": 41.42, "elapsed_time": "0:32:26", "remaining_time": "0:45:53"} |
|
{"current_steps": 1490, "total_steps": 3573, "loss": 1.2631, "lr": 3.620259239393549e-05, "epoch": 1.2510495382031905, "percentage": 41.7, "elapsed_time": "0:32:39", "remaining_time": "0:45:38"} |
|
{"current_steps": 1500, "total_steps": 3573, "loss": 1.2323, "lr": 3.5983668652322914e-05, "epoch": 1.2594458438287153, "percentage": 41.98, "elapsed_time": "0:32:51", "remaining_time": "0:45:24"} |
|
{"current_steps": 1510, "total_steps": 3573, "loss": 1.2499, "lr": 3.576369613708278e-05, "epoch": 1.26784214945424, "percentage": 42.26, "elapsed_time": "0:33:25", "remaining_time": "0:45:40"} |
|
{"current_steps": 1520, "total_steps": 3573, "loss": 1.2623, "lr": 3.554269585225117e-05, "epoch": 1.276238455079765, "percentage": 42.54, "elapsed_time": "0:33:37", "remaining_time": "0:45:25"} |
|
{"current_steps": 1530, "total_steps": 3573, "loss": 1.25, "lr": 3.532068890000059e-05, "epoch": 1.2846347607052897, "percentage": 42.82, "elapsed_time": "0:33:49", "remaining_time": "0:45:10"} |
|
{"current_steps": 1540, "total_steps": 3573, "loss": 1.2615, "lr": 3.5097696478624956e-05, "epoch": 1.2930310663308144, "percentage": 43.1, "elapsed_time": "0:34:02", "remaining_time": "0:44:55"} |
|
{"current_steps": 1550, "total_steps": 3573, "loss": 1.2577, "lr": 3.487373988051556e-05, "epoch": 1.3014273719563392, "percentage": 43.38, "elapsed_time": "0:34:14", "remaining_time": "0:44:41"} |
|
{"current_steps": 1560, "total_steps": 3573, "loss": 1.2252, "lr": 3.464884049012794e-05, "epoch": 1.309823677581864, "percentage": 43.66, "elapsed_time": "0:34:26", "remaining_time": "0:44:26"} |
|
{"current_steps": 1570, "total_steps": 3573, "loss": 1.2333, "lr": 3.442301978193996e-05, "epoch": 1.3182199832073889, "percentage": 43.94, "elapsed_time": "0:34:38", "remaining_time": "0:44:12"} |
|
{"current_steps": 1580, "total_steps": 3573, "loss": 1.2309, "lr": 3.419629931840137e-05, "epoch": 1.3266162888329136, "percentage": 44.22, "elapsed_time": "0:34:50", "remaining_time": "0:43:57"} |
|
{"current_steps": 1590, "total_steps": 3573, "loss": 1.2347, "lr": 3.396870074787489e-05, "epoch": 1.3350125944584383, "percentage": 44.5, "elapsed_time": "0:35:03", "remaining_time": "0:43:42"} |
|
{"current_steps": 1600, "total_steps": 3573, "loss": 1.2278, "lr": 3.374024580256913e-05, "epoch": 1.343408900083963, "percentage": 44.78, "elapsed_time": "0:35:15", "remaining_time": "0:43:28"} |
|
{"current_steps": 1610, "total_steps": 3573, "loss": 1.2459, "lr": 3.351095629646348e-05, "epoch": 1.3518052057094878, "percentage": 45.06, "elapsed_time": "0:35:27", "remaining_time": "0:43:13"} |
|
{"current_steps": 1620, "total_steps": 3573, "loss": 1.2567, "lr": 3.3280854123225245e-05, "epoch": 1.3602015113350125, "percentage": 45.34, "elapsed_time": "0:35:39", "remaining_time": "0:42:59"} |
|
{"current_steps": 1630, "total_steps": 3573, "loss": 1.2427, "lr": 3.3049961254119077e-05, "epoch": 1.3685978169605373, "percentage": 45.62, "elapsed_time": "0:35:51", "remaining_time": "0:42:44"} |
|
{"current_steps": 1640, "total_steps": 3573, "loss": 1.2292, "lr": 3.281829973590909e-05, "epoch": 1.376994122586062, "percentage": 45.9, "elapsed_time": "0:36:03", "remaining_time": "0:42:30"} |
|
{"current_steps": 1650, "total_steps": 3573, "loss": 1.2231, "lr": 3.258589168875373e-05, "epoch": 1.385390428211587, "percentage": 46.18, "elapsed_time": "0:36:16", "remaining_time": "0:42:16"} |
|
{"current_steps": 1660, "total_steps": 3573, "loss": 1.2399, "lr": 3.2352759304093624e-05, "epoch": 1.3937867338371117, "percentage": 46.46, "elapsed_time": "0:36:28", "remaining_time": "0:42:01"} |
|
{"current_steps": 1670, "total_steps": 3573, "loss": 1.2786, "lr": 3.211892484253261e-05, "epoch": 1.4021830394626364, "percentage": 46.74, "elapsed_time": "0:36:40", "remaining_time": "0:41:47"} |
|
{"current_steps": 1680, "total_steps": 3573, "loss": 1.2423, "lr": 3.1884410631712235e-05, "epoch": 1.4105793450881612, "percentage": 47.02, "elapsed_time": "0:36:52", "remaining_time": "0:41:32"} |
|
{"current_steps": 1690, "total_steps": 3573, "loss": 1.2399, "lr": 3.164923906417979e-05, "epoch": 1.418975650713686, "percentage": 47.3, "elapsed_time": "0:37:04", "remaining_time": "0:41:18"} |
|
{"current_steps": 1700, "total_steps": 3573, "loss": 1.2575, "lr": 3.1413432595250134e-05, "epoch": 1.4273719563392109, "percentage": 47.58, "elapsed_time": "0:37:16", "remaining_time": "0:41:04"} |
|
{"current_steps": 1710, "total_steps": 3573, "loss": 1.2155, "lr": 3.117701374086158e-05, "epoch": 1.4357682619647356, "percentage": 47.86, "elapsed_time": "0:37:28", "remaining_time": "0:40:50"} |
|
{"current_steps": 1720, "total_steps": 3573, "loss": 1.2561, "lr": 3.094000507542595e-05, "epoch": 1.4441645675902604, "percentage": 48.14, "elapsed_time": "0:37:40", "remaining_time": "0:40:35"} |
|
{"current_steps": 1730, "total_steps": 3573, "loss": 1.2389, "lr": 3.07024292296731e-05, "epoch": 1.452560873215785, "percentage": 48.42, "elapsed_time": "0:37:53", "remaining_time": "0:40:21"} |
|
{"current_steps": 1740, "total_steps": 3573, "loss": 1.2323, "lr": 3.0464308888489936e-05, "epoch": 1.4609571788413098, "percentage": 48.7, "elapsed_time": "0:38:05", "remaining_time": "0:40:07"} |
|
{"current_steps": 1750, "total_steps": 3573, "loss": 1.228, "lr": 3.022566678875446e-05, "epoch": 1.4693534844668346, "percentage": 48.98, "elapsed_time": "0:38:17", "remaining_time": "0:39:53"} |
|
{"current_steps": 1760, "total_steps": 3573, "loss": 1.2025, "lr": 2.9986525717164694e-05, "epoch": 1.4777497900923593, "percentage": 49.26, "elapsed_time": "0:38:29", "remaining_time": "0:39:39"} |
|
{"current_steps": 1770, "total_steps": 3573, "loss": 1.2585, "lr": 2.974690850806287e-05, "epoch": 1.486146095717884, "percentage": 49.54, "elapsed_time": "0:38:41", "remaining_time": "0:39:25"} |
|
{"current_steps": 1780, "total_steps": 3573, "loss": 1.2438, "lr": 2.9506838041255147e-05, "epoch": 1.4945424013434088, "percentage": 49.82, "elapsed_time": "0:38:54", "remaining_time": "0:39:11"} |
|
{"current_steps": 1790, "total_steps": 3573, "loss": 1.23, "lr": 2.926633723982692e-05, "epoch": 1.5029387069689337, "percentage": 50.1, "elapsed_time": "0:39:06", "remaining_time": "0:38:57"} |
|
{"current_steps": 1800, "total_steps": 3573, "loss": 1.2089, "lr": 2.9025429067953975e-05, "epoch": 1.5113350125944585, "percentage": 50.38, "elapsed_time": "0:39:18", "remaining_time": "0:38:43"} |
|
{"current_steps": 1800, "total_steps": 3573, "eval_loss": 1.3161499500274658, "epoch": 1.5113350125944585, "percentage": 50.38, "elapsed_time": "0:39:55", "remaining_time": "0:39:20"} |
|
{"current_steps": 1810, "total_steps": 3573, "loss": 1.2452, "lr": 2.878413652870983e-05, "epoch": 1.5197313182199832, "percentage": 50.66, "elapsed_time": "0:40:08", "remaining_time": "0:39:05"} |
|
{"current_steps": 1820, "total_steps": 3573, "loss": 1.2335, "lr": 2.8542482661869228e-05, "epoch": 1.528127623845508, "percentage": 50.94, "elapsed_time": "0:40:20", "remaining_time": "0:38:51"} |
|
{"current_steps": 1830, "total_steps": 3573, "loss": 1.2107, "lr": 2.8300490541708226e-05, "epoch": 1.536523929471033, "percentage": 51.22, "elapsed_time": "0:40:32", "remaining_time": "0:38:36"} |
|
{"current_steps": 1840, "total_steps": 3573, "loss": 1.2323, "lr": 2.8058183274800933e-05, "epoch": 1.5449202350965576, "percentage": 51.5, "elapsed_time": "0:40:44", "remaining_time": "0:38:22"} |
|
{"current_steps": 1850, "total_steps": 3573, "loss": 1.2208, "lr": 2.7815583997813176e-05, "epoch": 1.5533165407220824, "percentage": 51.78, "elapsed_time": "0:40:56", "remaining_time": "0:38:08"} |
|
{"current_steps": 1860, "total_steps": 3573, "loss": 1.2519, "lr": 2.7572715875293336e-05, "epoch": 1.561712846347607, "percentage": 52.06, "elapsed_time": "0:41:09", "remaining_time": "0:37:53"} |
|
{"current_steps": 1870, "total_steps": 3573, "loss": 1.2072, "lr": 2.7329602097460453e-05, "epoch": 1.5701091519731318, "percentage": 52.34, "elapsed_time": "0:41:21", "remaining_time": "0:37:39"} |
|
{"current_steps": 1880, "total_steps": 3573, "loss": 1.2171, "lr": 2.7086265877989907e-05, "epoch": 1.5785054575986566, "percentage": 52.62, "elapsed_time": "0:41:33", "remaining_time": "0:37:25"} |
|
{"current_steps": 1890, "total_steps": 3573, "loss": 1.2032, "lr": 2.68427304517969e-05, "epoch": 1.5869017632241813, "percentage": 52.9, "elapsed_time": "0:41:45", "remaining_time": "0:37:11"} |
|
{"current_steps": 1900, "total_steps": 3573, "loss": 1.2233, "lr": 2.6599019072817823e-05, "epoch": 1.595298068849706, "percentage": 53.18, "elapsed_time": "0:41:58", "remaining_time": "0:36:57"} |
|
{"current_steps": 1910, "total_steps": 3573, "loss": 1.2302, "lr": 2.6355155011789918e-05, "epoch": 1.6036943744752308, "percentage": 53.46, "elapsed_time": "0:42:10", "remaining_time": "0:36:43"} |
|
{"current_steps": 1920, "total_steps": 3573, "loss": 1.2237, "lr": 2.6111161554029216e-05, "epoch": 1.6120906801007555, "percentage": 53.74, "elapsed_time": "0:42:22", "remaining_time": "0:36:28"} |
|
{"current_steps": 1930, "total_steps": 3573, "loss": 1.2373, "lr": 2.5867061997207208e-05, "epoch": 1.6204869857262805, "percentage": 54.02, "elapsed_time": "0:42:34", "remaining_time": "0:36:14"} |
|
{"current_steps": 1940, "total_steps": 3573, "loss": 1.2366, "lr": 2.5622879649126204e-05, "epoch": 1.6288832913518052, "percentage": 54.3, "elapsed_time": "0:42:46", "remaining_time": "0:36:00"} |
|
{"current_steps": 1950, "total_steps": 3573, "loss": 1.2175, "lr": 2.5378637825493827e-05, "epoch": 1.63727959697733, "percentage": 54.58, "elapsed_time": "0:42:58", "remaining_time": "0:35:46"} |
|
{"current_steps": 1960, "total_steps": 3573, "loss": 1.2226, "lr": 2.5134359847696725e-05, "epoch": 1.645675902602855, "percentage": 54.86, "elapsed_time": "0:43:11", "remaining_time": "0:35:32"} |
|
{"current_steps": 1970, "total_steps": 3573, "loss": 1.2354, "lr": 2.48900690405737e-05, "epoch": 1.6540722082283796, "percentage": 55.14, "elapsed_time": "0:43:23", "remaining_time": "0:35:18"} |
|
{"current_steps": 1980, "total_steps": 3573, "loss": 1.2346, "lr": 2.4645788730188595e-05, "epoch": 1.6624685138539044, "percentage": 55.42, "elapsed_time": "0:43:35", "remaining_time": "0:35:04"} |
|
{"current_steps": 1990, "total_steps": 3573, "loss": 1.2266, "lr": 2.4401542241602936e-05, "epoch": 1.670864819479429, "percentage": 55.7, "elapsed_time": "0:43:47", "remaining_time": "0:34:50"} |
|
{"current_steps": 2000, "total_steps": 3573, "loss": 1.2489, "lr": 2.4157352896648785e-05, "epoch": 1.6792611251049538, "percentage": 55.98, "elapsed_time": "0:43:59", "remaining_time": "0:34:36"} |
|
{"current_steps": 2010, "total_steps": 3573, "loss": 1.2321, "lr": 2.391324401170189e-05, "epoch": 1.6876574307304786, "percentage": 56.26, "elapsed_time": "0:44:34", "remaining_time": "0:34:40"} |
|
{"current_steps": 2020, "total_steps": 3573, "loss": 1.2133, "lr": 2.3669238895455257e-05, "epoch": 1.6960537363560033, "percentage": 56.54, "elapsed_time": "0:44:47", "remaining_time": "0:34:25"} |
|
{"current_steps": 2030, "total_steps": 3573, "loss": 1.1832, "lr": 2.3425360846693546e-05, "epoch": 1.704450041981528, "percentage": 56.82, "elapsed_time": "0:44:59", "remaining_time": "0:34:11"} |
|
{"current_steps": 2040, "total_steps": 3573, "loss": 1.1978, "lr": 2.3181633152068444e-05, "epoch": 1.7128463476070528, "percentage": 57.09, "elapsed_time": "0:45:11", "remaining_time": "0:33:57"} |
|
{"current_steps": 2050, "total_steps": 3573, "loss": 1.2274, "lr": 2.293807908387507e-05, "epoch": 1.7212426532325775, "percentage": 57.37, "elapsed_time": "0:45:23", "remaining_time": "0:33:43"} |
|
{"current_steps": 2060, "total_steps": 3573, "loss": 1.2107, "lr": 2.269472189782984e-05, "epoch": 1.7296389588581025, "percentage": 57.65, "elapsed_time": "0:45:35", "remaining_time": "0:33:29"} |
|
{"current_steps": 2070, "total_steps": 3573, "loss": 1.2453, "lr": 2.2451584830849963e-05, "epoch": 1.7380352644836272, "percentage": 57.93, "elapsed_time": "0:45:48", "remaining_time": "0:33:15"} |
|
{"current_steps": 2080, "total_steps": 3573, "loss": 1.2112, "lr": 2.2208691098834574e-05, "epoch": 1.746431570109152, "percentage": 58.21, "elapsed_time": "0:46:00", "remaining_time": "0:33:01"} |
|
{"current_steps": 2090, "total_steps": 3573, "loss": 1.2301, "lr": 2.196606389444802e-05, "epoch": 1.7548278757346767, "percentage": 58.49, "elapsed_time": "0:46:12", "remaining_time": "0:32:47"} |
|
{"current_steps": 2100, "total_steps": 3573, "loss": 1.2254, "lr": 2.1723726384905332e-05, "epoch": 1.7632241813602016, "percentage": 58.77, "elapsed_time": "0:46:25", "remaining_time": "0:32:33"} |
|
{"current_steps": 2110, "total_steps": 3573, "loss": 1.2191, "lr": 2.1481701709760054e-05, "epoch": 1.7716204869857264, "percentage": 59.05, "elapsed_time": "0:46:37", "remaining_time": "0:32:19"} |
|
{"current_steps": 2120, "total_steps": 3573, "loss": 1.1897, "lr": 2.1240012978694786e-05, "epoch": 1.7800167926112511, "percentage": 59.33, "elapsed_time": "0:46:49", "remaining_time": "0:32:05"} |
|
{"current_steps": 2130, "total_steps": 3573, "loss": 1.1936, "lr": 2.0998683269314613e-05, "epoch": 1.7884130982367759, "percentage": 59.61, "elapsed_time": "0:47:01", "remaining_time": "0:31:51"} |
|
{"current_steps": 2140, "total_steps": 3573, "loss": 1.2248, "lr": 2.0757735624943448e-05, "epoch": 1.7968094038623006, "percentage": 59.89, "elapsed_time": "0:47:13", "remaining_time": "0:31:37"} |
|
{"current_steps": 2150, "total_steps": 3573, "loss": 1.2022, "lr": 2.0517193052423823e-05, "epoch": 1.8052057094878253, "percentage": 60.17, "elapsed_time": "0:47:26", "remaining_time": "0:31:23"} |
|
{"current_steps": 2160, "total_steps": 3573, "loss": 1.1938, "lr": 2.0277078519920044e-05, "epoch": 1.81360201511335, "percentage": 60.45, "elapsed_time": "0:47:38", "remaining_time": "0:31:09"} |
|
{"current_steps": 2170, "total_steps": 3573, "loss": 1.1825, "lr": 2.0037414954725117e-05, "epoch": 1.8219983207388748, "percentage": 60.73, "elapsed_time": "0:47:50", "remaining_time": "0:30:55"} |
|
{"current_steps": 2180, "total_steps": 3573, "loss": 1.2092, "lr": 1.979822524107148e-05, "epoch": 1.8303946263643995, "percentage": 61.01, "elapsed_time": "0:48:02", "remaining_time": "0:30:42"} |
|
{"current_steps": 2190, "total_steps": 3573, "loss": 1.2378, "lr": 1.9559532217945974e-05, "epoch": 1.8387909319899243, "percentage": 61.29, "elapsed_time": "0:48:15", "remaining_time": "0:30:28"} |
|
{"current_steps": 2200, "total_steps": 3573, "loss": 1.2142, "lr": 1.932135867690901e-05, "epoch": 1.8471872376154492, "percentage": 61.57, "elapsed_time": "0:48:27", "remaining_time": "0:30:14"} |
|
{"current_steps": 2210, "total_steps": 3573, "loss": 1.2003, "lr": 1.908372735991836e-05, "epoch": 1.855583543240974, "percentage": 61.85, "elapsed_time": "0:48:39", "remaining_time": "0:30:00"} |
|
{"current_steps": 2220, "total_steps": 3573, "loss": 1.2279, "lr": 1.8846660957157626e-05, "epoch": 1.8639798488664987, "percentage": 62.13, "elapsed_time": "0:48:51", "remaining_time": "0:29:46"} |
|
{"current_steps": 2230, "total_steps": 3573, "loss": 1.2175, "lr": 1.8610182104869676e-05, "epoch": 1.8723761544920237, "percentage": 62.41, "elapsed_time": "0:49:03", "remaining_time": "0:29:32"} |
|
{"current_steps": 2240, "total_steps": 3573, "loss": 1.1965, "lr": 1.837431338319523e-05, "epoch": 1.8807724601175484, "percentage": 62.69, "elapsed_time": "0:49:16", "remaining_time": "0:29:19"} |
|
{"current_steps": 2250, "total_steps": 3573, "loss": 1.2082, "lr": 1.813907731401677e-05, "epoch": 1.8891687657430731, "percentage": 62.97, "elapsed_time": "0:49:28", "remaining_time": "0:29:05"} |
|
{"current_steps": 2260, "total_steps": 3573, "loss": 1.1969, "lr": 1.790449635880813e-05, "epoch": 1.8975650713685979, "percentage": 63.25, "elapsed_time": "0:49:40", "remaining_time": "0:28:51"} |
|
{"current_steps": 2270, "total_steps": 3573, "loss": 1.2094, "lr": 1.7670592916489637e-05, "epoch": 1.9059613769941226, "percentage": 63.53, "elapsed_time": "0:49:52", "remaining_time": "0:28:37"} |
|
{"current_steps": 2280, "total_steps": 3573, "loss": 1.2171, "lr": 1.743738932128945e-05, "epoch": 1.9143576826196473, "percentage": 63.81, "elapsed_time": "0:50:05", "remaining_time": "0:28:24"} |
|
{"current_steps": 2290, "total_steps": 3573, "loss": 1.1902, "lr": 1.7204907840610968e-05, "epoch": 1.922753988245172, "percentage": 64.09, "elapsed_time": "0:50:17", "remaining_time": "0:28:10"} |
|
{"current_steps": 2300, "total_steps": 3573, "loss": 1.1915, "lr": 1.6973170672906592e-05, "epoch": 1.9311502938706968, "percentage": 64.37, "elapsed_time": "0:50:29", "remaining_time": "0:27:56"} |
|
{"current_steps": 2310, "total_steps": 3573, "loss": 1.2018, "lr": 1.6742199945558116e-05, "epoch": 1.9395465994962215, "percentage": 64.65, "elapsed_time": "0:50:41", "remaining_time": "0:27:43"} |
|
{"current_steps": 2320, "total_steps": 3573, "loss": 1.1742, "lr": 1.651201771276397e-05, "epoch": 1.9479429051217463, "percentage": 64.93, "elapsed_time": "0:50:54", "remaining_time": "0:27:29"} |
|
{"current_steps": 2330, "total_steps": 3573, "loss": 1.2024, "lr": 1.6282645953433278e-05, "epoch": 1.9563392107472712, "percentage": 65.21, "elapsed_time": "0:51:06", "remaining_time": "0:27:15"} |
|
{"current_steps": 2340, "total_steps": 3573, "loss": 1.2072, "lr": 1.6054106569087247e-05, "epoch": 1.964735516372796, "percentage": 65.49, "elapsed_time": "0:51:18", "remaining_time": "0:27:02"} |
|
{"current_steps": 2350, "total_steps": 3573, "loss": 1.1996, "lr": 1.5826421381767943e-05, "epoch": 1.9731318219983207, "percentage": 65.77, "elapsed_time": "0:51:30", "remaining_time": "0:26:48"} |
|
{"current_steps": 2360, "total_steps": 3573, "loss": 1.1963, "lr": 1.5599612131954562e-05, "epoch": 1.9815281276238457, "percentage": 66.05, "elapsed_time": "0:51:42", "remaining_time": "0:26:34"} |
|
{"current_steps": 2370, "total_steps": 3573, "loss": 1.1909, "lr": 1.537370047648755e-05, "epoch": 1.9899244332493704, "percentage": 66.33, "elapsed_time": "0:51:55", "remaining_time": "0:26:21"} |
|
{"current_steps": 2380, "total_steps": 3573, "loss": 1.1934, "lr": 1.5148707986500754e-05, "epoch": 1.9983207388748951, "percentage": 66.61, "elapsed_time": "0:52:07", "remaining_time": "0:26:07"} |
|
{"current_steps": 2390, "total_steps": 3573, "loss": 1.1015, "lr": 1.4924656145361642e-05, "epoch": 2.00671704450042, "percentage": 66.89, "elapsed_time": "0:52:19", "remaining_time": "0:25:53"} |
|
{"current_steps": 2400, "total_steps": 3573, "loss": 1.0911, "lr": 1.4701566346619994e-05, "epoch": 2.0151133501259446, "percentage": 67.17, "elapsed_time": "0:52:31", "remaining_time": "0:25:40"} |
|
{"current_steps": 2400, "total_steps": 3573, "eval_loss": 1.288699746131897, "epoch": 2.0151133501259446, "percentage": 67.17, "elapsed_time": "0:53:09", "remaining_time": "0:25:58"} |
|
{"current_steps": 2410, "total_steps": 3573, "loss": 1.0922, "lr": 1.447945989196518e-05, "epoch": 2.0235096557514693, "percentage": 67.45, "elapsed_time": "0:53:21", "remaining_time": "0:25:45"} |
|
{"current_steps": 2420, "total_steps": 3573, "loss": 1.0882, "lr": 1.4258357989192089e-05, "epoch": 2.031905961376994, "percentage": 67.73, "elapsed_time": "0:53:33", "remaining_time": "0:25:31"} |
|
{"current_steps": 2430, "total_steps": 3573, "loss": 1.0976, "lr": 1.403828175017618e-05, "epoch": 2.040302267002519, "percentage": 68.01, "elapsed_time": "0:53:46", "remaining_time": "0:25:17"} |
|
{"current_steps": 2440, "total_steps": 3573, "loss": 1.0999, "lr": 1.381925218885759e-05, "epoch": 2.0486985726280436, "percentage": 68.29, "elapsed_time": "0:53:58", "remaining_time": "0:25:03"} |
|
{"current_steps": 2450, "total_steps": 3573, "loss": 1.0848, "lr": 1.3601290219234642e-05, "epoch": 2.0570948782535683, "percentage": 68.57, "elapsed_time": "0:54:10", "remaining_time": "0:24:49"} |
|
{"current_steps": 2460, "total_steps": 3573, "loss": 1.1053, "lr": 1.3384416653366796e-05, "epoch": 2.065491183879093, "percentage": 68.85, "elapsed_time": "0:54:22", "remaining_time": "0:24:36"} |
|
{"current_steps": 2470, "total_steps": 3573, "loss": 1.0565, "lr": 1.3168652199387565e-05, "epoch": 2.0738874895046178, "percentage": 69.13, "elapsed_time": "0:54:34", "remaining_time": "0:24:22"} |
|
{"current_steps": 2480, "total_steps": 3573, "loss": 1.1135, "lr": 1.2954017459527037e-05, "epoch": 2.082283795130143, "percentage": 69.41, "elapsed_time": "0:54:46", "remaining_time": "0:24:08"} |
|
{"current_steps": 2490, "total_steps": 3573, "loss": 1.0978, "lr": 1.2740532928144785e-05, "epoch": 2.0906801007556677, "percentage": 69.69, "elapsed_time": "0:54:59", "remaining_time": "0:23:54"} |
|
{"current_steps": 2500, "total_steps": 3573, "loss": 1.0924, "lr": 1.2528218989772928e-05, "epoch": 2.0990764063811924, "percentage": 69.97, "elapsed_time": "0:55:11", "remaining_time": "0:23:41"} |
|
{"current_steps": 2510, "total_steps": 3573, "loss": 1.1122, "lr": 1.2317095917169729e-05, "epoch": 2.107472712006717, "percentage": 70.25, "elapsed_time": "0:55:45", "remaining_time": "0:23:36"} |
|
{"current_steps": 2520, "total_steps": 3573, "loss": 1.0654, "lr": 1.2107183869383817e-05, "epoch": 2.115869017632242, "percentage": 70.53, "elapsed_time": "0:55:57", "remaining_time": "0:23:23"} |
|
{"current_steps": 2530, "total_steps": 3573, "loss": 1.0885, "lr": 1.1898502889829367e-05, "epoch": 2.1242653232577666, "percentage": 70.81, "elapsed_time": "0:56:09", "remaining_time": "0:23:09"} |
|
{"current_steps": 2540, "total_steps": 3573, "loss": 1.0814, "lr": 1.1691072904372211e-05, "epoch": 2.1326616288832914, "percentage": 71.09, "elapsed_time": "0:56:22", "remaining_time": "0:22:55"} |
|
{"current_steps": 2550, "total_steps": 3573, "loss": 1.1074, "lr": 1.1484913719427245e-05, "epoch": 2.141057934508816, "percentage": 71.37, "elapsed_time": "0:56:34", "remaining_time": "0:22:41"} |
|
{"current_steps": 2560, "total_steps": 3573, "loss": 1.0624, "lr": 1.1280045020067173e-05, "epoch": 2.149454240134341, "percentage": 71.65, "elapsed_time": "0:56:46", "remaining_time": "0:22:27"} |
|
{"current_steps": 2570, "total_steps": 3573, "loss": 1.075, "lr": 1.1076486368142974e-05, "epoch": 2.1578505457598656, "percentage": 71.93, "elapsed_time": "0:56:58", "remaining_time": "0:22:14"} |
|
{"current_steps": 2580, "total_steps": 3573, "loss": 1.1239, "lr": 1.0874257200415921e-05, "epoch": 2.1662468513853903, "percentage": 72.21, "elapsed_time": "0:57:10", "remaining_time": "0:22:00"} |
|
{"current_steps": 2590, "total_steps": 3573, "loss": 1.0855, "lr": 1.0673376826701764e-05, "epoch": 2.174643157010915, "percentage": 72.49, "elapsed_time": "0:57:22", "remaining_time": "0:21:46"} |
|
{"current_steps": 2600, "total_steps": 3573, "loss": 1.0613, "lr": 1.0473864428026903e-05, "epoch": 2.1830394626364398, "percentage": 72.77, "elapsed_time": "0:57:34", "remaining_time": "0:21:32"} |
|
{"current_steps": 2610, "total_steps": 3573, "loss": 1.0874, "lr": 1.0275739054796849e-05, "epoch": 2.1914357682619645, "percentage": 73.05, "elapsed_time": "0:57:47", "remaining_time": "0:21:19"} |
|
{"current_steps": 2620, "total_steps": 3573, "loss": 1.093, "lr": 1.0079019624977277e-05, "epoch": 2.1998320738874897, "percentage": 73.33, "elapsed_time": "0:57:59", "remaining_time": "0:21:05"} |
|
{"current_steps": 2630, "total_steps": 3573, "loss": 1.0792, "lr": 9.883724922287593e-06, "epoch": 2.2082283795130144, "percentage": 73.61, "elapsed_time": "0:58:11", "remaining_time": "0:20:51"} |
|
{"current_steps": 2640, "total_steps": 3573, "loss": 1.0513, "lr": 9.689873594407398e-06, "epoch": 2.216624685138539, "percentage": 73.89, "elapsed_time": "0:58:23", "remaining_time": "0:20:38"} |
|
{"current_steps": 2650, "total_steps": 3573, "loss": 1.0663, "lr": 9.497484151195874e-06, "epoch": 2.225020990764064, "percentage": 74.17, "elapsed_time": "0:58:35", "remaining_time": "0:20:24"} |
|
{"current_steps": 2660, "total_steps": 3573, "loss": 1.0787, "lr": 9.30657496292447e-06, "epoch": 2.2334172963895886, "percentage": 74.45, "elapsed_time": "0:58:48", "remaining_time": "0:20:10"} |
|
{"current_steps": 2670, "total_steps": 3573, "loss": 1.0579, "lr": 9.117164258522695e-06, "epoch": 2.2418136020151134, "percentage": 74.73, "elapsed_time": "0:59:00", "remaining_time": "0:19:57"} |
|
{"current_steps": 2680, "total_steps": 3573, "loss": 1.0512, "lr": 8.929270123837632e-06, "epoch": 2.250209907640638, "percentage": 75.01, "elapsed_time": "0:59:12", "remaining_time": "0:19:43"} |
|
{"current_steps": 2690, "total_steps": 3573, "loss": 1.0658, "lr": 8.742910499906973e-06, "epoch": 2.258606213266163, "percentage": 75.29, "elapsed_time": "0:59:24", "remaining_time": "0:19:30"} |
|
{"current_steps": 2700, "total_steps": 3573, "loss": 1.0696, "lr": 8.558103181245921e-06, "epoch": 2.2670025188916876, "percentage": 75.57, "elapsed_time": "0:59:36", "remaining_time": "0:19:16"} |
|
{"current_steps": 2710, "total_steps": 3573, "loss": 1.092, "lr": 8.374865814148073e-06, "epoch": 2.2753988245172123, "percentage": 75.85, "elapsed_time": "0:59:48", "remaining_time": "0:19:02"} |
|
{"current_steps": 2720, "total_steps": 3573, "loss": 1.0822, "lr": 8.193215895000526e-06, "epoch": 2.283795130142737, "percentage": 76.13, "elapsed_time": "1:00:01", "remaining_time": "0:18:49"} |
|
{"current_steps": 2730, "total_steps": 3573, "loss": 1.0568, "lr": 8.013170768613146e-06, "epoch": 2.292191435768262, "percentage": 76.41, "elapsed_time": "1:00:13", "remaining_time": "0:18:35"} |
|
{"current_steps": 2740, "total_steps": 3573, "loss": 1.0731, "lr": 7.834747626562484e-06, "epoch": 2.3005877413937865, "percentage": 76.69, "elapsed_time": "1:00:25", "remaining_time": "0:18:22"} |
|
{"current_steps": 2750, "total_steps": 3573, "loss": 1.075, "lr": 7.657963505550189e-06, "epoch": 2.3089840470193117, "percentage": 76.97, "elapsed_time": "1:00:37", "remaining_time": "0:18:08"} |
|
{"current_steps": 2760, "total_steps": 3573, "loss": 1.0854, "lr": 7.482835285776305e-06, "epoch": 2.3173803526448364, "percentage": 77.25, "elapsed_time": "1:00:49", "remaining_time": "0:17:55"} |
|
{"current_steps": 2770, "total_steps": 3573, "loss": 1.093, "lr": 7.309379689327409e-06, "epoch": 2.325776658270361, "percentage": 77.53, "elapsed_time": "1:01:01", "remaining_time": "0:17:41"} |
|
{"current_steps": 2780, "total_steps": 3573, "loss": 1.0926, "lr": 7.137613278579964e-06, "epoch": 2.334172963895886, "percentage": 77.81, "elapsed_time": "1:01:14", "remaining_time": "0:17:28"} |
|
{"current_steps": 2790, "total_steps": 3573, "loss": 1.1078, "lr": 6.967552454618839e-06, "epoch": 2.3425692695214106, "percentage": 78.09, "elapsed_time": "1:01:26", "remaining_time": "0:17:14"} |
|
{"current_steps": 2800, "total_steps": 3573, "loss": 1.0781, "lr": 6.799213455671255e-06, "epoch": 2.3509655751469354, "percentage": 78.37, "elapsed_time": "1:01:38", "remaining_time": "0:17:00"} |
|
{"current_steps": 2810, "total_steps": 3573, "loss": 1.0824, "lr": 6.632612355556256e-06, "epoch": 2.35936188077246, "percentage": 78.65, "elapsed_time": "1:01:50", "remaining_time": "0:16:47"} |
|
{"current_steps": 2820, "total_steps": 3573, "loss": 1.0686, "lr": 6.467765062149977e-06, "epoch": 2.367758186397985, "percentage": 78.93, "elapsed_time": "1:02:02", "remaining_time": "0:16:34"} |
|
{"current_steps": 2830, "total_steps": 3573, "loss": 1.0902, "lr": 6.304687315866589e-06, "epoch": 2.3761544920235096, "percentage": 79.21, "elapsed_time": "1:02:14", "remaining_time": "0:16:20"} |
|
{"current_steps": 2840, "total_steps": 3573, "loss": 1.0704, "lr": 6.143394688155396e-06, "epoch": 2.3845507976490343, "percentage": 79.49, "elapsed_time": "1:02:26", "remaining_time": "0:16:07"} |
|
{"current_steps": 2850, "total_steps": 3573, "loss": 1.0824, "lr": 5.98390258001397e-06, "epoch": 2.392947103274559, "percentage": 79.76, "elapsed_time": "1:02:39", "remaining_time": "0:15:53"} |
|
{"current_steps": 2860, "total_steps": 3573, "loss": 1.0549, "lr": 5.826226220517606e-06, "epoch": 2.401343408900084, "percentage": 80.04, "elapsed_time": "1:02:51", "remaining_time": "0:15:40"} |
|
{"current_steps": 2870, "total_steps": 3573, "loss": 1.0999, "lr": 5.670380665365144e-06, "epoch": 2.4097397145256085, "percentage": 80.32, "elapsed_time": "1:03:03", "remaining_time": "0:15:26"} |
|
{"current_steps": 2880, "total_steps": 3573, "loss": 1.0929, "lr": 5.516380795441417e-06, "epoch": 2.4181360201511337, "percentage": 80.6, "elapsed_time": "1:03:15", "remaining_time": "0:15:13"} |
|
{"current_steps": 2890, "total_steps": 3573, "loss": 1.0857, "lr": 5.364241315396335e-06, "epoch": 2.4265323257766584, "percentage": 80.88, "elapsed_time": "1:03:27", "remaining_time": "0:14:59"} |
|
{"current_steps": 2900, "total_steps": 3573, "loss": 1.0763, "lr": 5.21397675224081e-06, "epoch": 2.434928631402183, "percentage": 81.16, "elapsed_time": "1:03:40", "remaining_time": "0:14:46"} |
|
{"current_steps": 2910, "total_steps": 3573, "loss": 1.0837, "lr": 5.065601453959659e-06, "epoch": 2.443324937027708, "percentage": 81.44, "elapsed_time": "1:03:52", "remaining_time": "0:14:33"} |
|
{"current_steps": 2920, "total_steps": 3573, "loss": 1.0655, "lr": 4.919129588141563e-06, "epoch": 2.4517212426532327, "percentage": 81.72, "elapsed_time": "1:04:04", "remaining_time": "0:14:19"} |
|
{"current_steps": 2930, "total_steps": 3573, "loss": 1.0604, "lr": 4.7745751406263165e-06, "epoch": 2.4601175482787574, "percentage": 82.0, "elapsed_time": "1:04:16", "remaining_time": "0:14:06"} |
|
{"current_steps": 2940, "total_steps": 3573, "loss": 1.0635, "lr": 4.631951914169363e-06, "epoch": 2.468513853904282, "percentage": 82.28, "elapsed_time": "1:04:28", "remaining_time": "0:13:52"} |
|
{"current_steps": 2950, "total_steps": 3573, "loss": 1.0838, "lr": 4.491273527123866e-06, "epoch": 2.476910159529807, "percentage": 82.56, "elapsed_time": "1:04:40", "remaining_time": "0:13:39"} |
|
{"current_steps": 2960, "total_steps": 3573, "loss": 1.06, "lr": 4.352553412140303e-06, "epoch": 2.4853064651553316, "percentage": 82.84, "elapsed_time": "1:04:53", "remaining_time": "0:13:26"} |
|
{"current_steps": 2970, "total_steps": 3573, "loss": 1.0728, "lr": 4.215804814883959e-06, "epoch": 2.4937027707808563, "percentage": 83.12, "elapsed_time": "1:05:05", "remaining_time": "0:13:12"} |
|
{"current_steps": 2980, "total_steps": 3573, "loss": 1.0567, "lr": 4.08104079277005e-06, "epoch": 2.502099076406381, "percentage": 83.4, "elapsed_time": "1:05:17", "remaining_time": "0:12:59"} |
|
{"current_steps": 2990, "total_steps": 3573, "loss": 1.0833, "lr": 3.948274213717015e-06, "epoch": 2.510495382031906, "percentage": 83.68, "elapsed_time": "1:05:29", "remaining_time": "0:12:46"} |
|
{"current_steps": 3000, "total_steps": 3573, "loss": 1.0794, "lr": 3.817517754917802e-06, "epoch": 2.5188916876574305, "percentage": 83.96, "elapsed_time": "1:05:41", "remaining_time": "0:12:32"} |
|
{"current_steps": 3000, "total_steps": 3573, "eval_loss": 1.271108627319336, "epoch": 2.5188916876574305, "percentage": 83.96, "elapsed_time": "1:06:19", "remaining_time": "0:12:40"} |
|
{"current_steps": 3010, "total_steps": 3573, "loss": 1.0797, "lr": 3.6887839016293807e-06, "epoch": 2.5272879932829557, "percentage": 84.24, "elapsed_time": "1:06:53", "remaining_time": "0:12:30"} |
|
{"current_steps": 3020, "total_steps": 3573, "loss": 1.0809, "lr": 3.5620849459805983e-06, "epoch": 2.53568429890848, "percentage": 84.52, "elapsed_time": "1:07:05", "remaining_time": "0:12:17"} |
|
{"current_steps": 3030, "total_steps": 3573, "loss": 1.0841, "lr": 3.4374329857984637e-06, "epoch": 2.544080604534005, "percentage": 84.8, "elapsed_time": "1:07:17", "remaining_time": "0:12:03"} |
|
{"current_steps": 3040, "total_steps": 3573, "loss": 1.0783, "lr": 3.314839923453003e-06, "epoch": 2.55247691015953, "percentage": 85.08, "elapsed_time": "1:07:29", "remaining_time": "0:11:50"} |
|
{"current_steps": 3050, "total_steps": 3573, "loss": 1.0657, "lr": 3.1943174647207474e-06, "epoch": 2.5608732157850547, "percentage": 85.36, "elapsed_time": "1:07:42", "remaining_time": "0:11:36"} |
|
{"current_steps": 3060, "total_steps": 3573, "loss": 1.0811, "lr": 3.0758771176669948e-06, "epoch": 2.5692695214105794, "percentage": 85.64, "elapsed_time": "1:07:54", "remaining_time": "0:11:23"} |
|
{"current_steps": 3070, "total_steps": 3573, "loss": 1.085, "lr": 2.9595301915470246e-06, "epoch": 2.577665827036104, "percentage": 85.92, "elapsed_time": "1:08:06", "remaining_time": "0:11:09"} |
|
{"current_steps": 3080, "total_steps": 3573, "loss": 1.0682, "lr": 2.8452877957261537e-06, "epoch": 2.586062132661629, "percentage": 86.2, "elapsed_time": "1:08:18", "remaining_time": "0:10:56"} |
|
{"current_steps": 3090, "total_steps": 3573, "loss": 1.0705, "lr": 2.73316083861902e-06, "epoch": 2.5944584382871536, "percentage": 86.48, "elapsed_time": "1:08:31", "remaining_time": "0:10:42"} |
|
{"current_steps": 3100, "total_steps": 3573, "loss": 1.08, "lr": 2.623160026647978e-06, "epoch": 2.6028547439126783, "percentage": 86.76, "elapsed_time": "1:08:43", "remaining_time": "0:10:29"} |
|
{"current_steps": 3110, "total_steps": 3573, "loss": 1.055, "lr": 2.515295863220796e-06, "epoch": 2.611251049538203, "percentage": 87.04, "elapsed_time": "1:08:55", "remaining_time": "0:10:15"} |
|
{"current_steps": 3120, "total_steps": 3573, "loss": 1.0541, "lr": 2.4095786477277253e-06, "epoch": 2.619647355163728, "percentage": 87.32, "elapsed_time": "1:09:07", "remaining_time": "0:10:02"} |
|
{"current_steps": 3130, "total_steps": 3573, "loss": 1.0712, "lr": 2.3060184745580972e-06, "epoch": 2.6280436607892526, "percentage": 87.6, "elapsed_time": "1:09:20", "remaining_time": "0:09:48"} |
|
{"current_steps": 3140, "total_steps": 3573, "loss": 1.0785, "lr": 2.2046252321364368e-06, "epoch": 2.6364399664147777, "percentage": 87.88, "elapsed_time": "1:09:32", "remaining_time": "0:09:35"} |
|
{"current_steps": 3150, "total_steps": 3573, "loss": 1.0623, "lr": 2.1054086019782785e-06, "epoch": 2.644836272040302, "percentage": 88.16, "elapsed_time": "1:09:44", "remaining_time": "0:09:21"} |
|
{"current_steps": 3160, "total_steps": 3573, "loss": 1.0629, "lr": 2.008378057765725e-06, "epoch": 2.653232577665827, "percentage": 88.44, "elapsed_time": "1:09:56", "remaining_time": "0:09:08"} |
|
{"current_steps": 3170, "total_steps": 3573, "loss": 1.0682, "lr": 1.913542864442849e-06, "epoch": 2.661628883291352, "percentage": 88.72, "elapsed_time": "1:10:08", "remaining_time": "0:08:55"} |
|
{"current_steps": 3180, "total_steps": 3573, "loss": 1.0352, "lr": 1.8209120773310468e-06, "epoch": 2.6700251889168767, "percentage": 89.0, "elapsed_time": "1:10:21", "remaining_time": "0:08:41"} |
|
{"current_steps": 3190, "total_steps": 3573, "loss": 1.0617, "lr": 1.7304945412643825e-06, "epoch": 2.6784214945424014, "percentage": 89.28, "elapsed_time": "1:10:33", "remaining_time": "0:08:28"} |
|
{"current_steps": 3200, "total_steps": 3573, "loss": 1.0712, "lr": 1.6422988897450392e-06, "epoch": 2.686817800167926, "percentage": 89.56, "elapsed_time": "1:10:45", "remaining_time": "0:08:14"} |
|
{"current_steps": 3210, "total_steps": 3573, "loss": 1.0735, "lr": 1.5563335441189458e-06, "epoch": 2.695214105793451, "percentage": 89.84, "elapsed_time": "1:10:57", "remaining_time": "0:08:01"} |
|
{"current_steps": 3220, "total_steps": 3573, "loss": 1.0621, "lr": 1.4726067127716958e-06, "epoch": 2.7036104114189756, "percentage": 90.12, "elapsed_time": "1:11:10", "remaining_time": "0:07:48"} |
|
{"current_steps": 3230, "total_steps": 3573, "loss": 1.0652, "lr": 1.3911263903447241e-06, "epoch": 2.7120067170445004, "percentage": 90.4, "elapsed_time": "1:11:22", "remaining_time": "0:07:34"} |
|
{"current_steps": 3240, "total_steps": 3573, "loss": 1.0622, "lr": 1.3119003569719789e-06, "epoch": 2.720403022670025, "percentage": 90.68, "elapsed_time": "1:11:34", "remaining_time": "0:07:21"} |
|
{"current_steps": 3250, "total_steps": 3573, "loss": 1.063, "lr": 1.2349361775370245e-06, "epoch": 2.72879932829555, "percentage": 90.96, "elapsed_time": "1:11:46", "remaining_time": "0:07:08"} |
|
{"current_steps": 3260, "total_steps": 3573, "loss": 1.0598, "lr": 1.1602412009507014e-06, "epoch": 2.7371956339210746, "percentage": 91.24, "elapsed_time": "1:11:59", "remaining_time": "0:06:54"} |
|
{"current_steps": 3270, "total_steps": 3573, "loss": 1.037, "lr": 1.087822559449425e-06, "epoch": 2.7455919395465997, "percentage": 91.52, "elapsed_time": "1:12:11", "remaining_time": "0:06:41"} |
|
{"current_steps": 3280, "total_steps": 3573, "loss": 1.0721, "lr": 1.0176871679141664e-06, "epoch": 2.753988245172124, "percentage": 91.8, "elapsed_time": "1:12:23", "remaining_time": "0:06:28"} |
|
{"current_steps": 3290, "total_steps": 3573, "loss": 1.0624, "lr": 9.49841723210182e-07, "epoch": 2.762384550797649, "percentage": 92.08, "elapsed_time": "1:12:35", "remaining_time": "0:06:14"} |
|
{"current_steps": 3300, "total_steps": 3573, "loss": 1.0868, "lr": 8.842927035475763e-07, "epoch": 2.770780856423174, "percentage": 92.36, "elapsed_time": "1:12:48", "remaining_time": "0:06:01"} |
|
{"current_steps": 3310, "total_steps": 3573, "loss": 1.0509, "lr": 8.210463678626989e-07, "epoch": 2.7791771620486987, "percentage": 92.64, "elapsed_time": "1:13:00", "remaining_time": "0:05:48"} |
|
{"current_steps": 3320, "total_steps": 3573, "loss": 1.0568, "lr": 7.601087552205621e-07, "epoch": 2.7875734676742234, "percentage": 92.92, "elapsed_time": "1:13:12", "remaining_time": "0:05:34"} |
|
{"current_steps": 3330, "total_steps": 3573, "loss": 1.0745, "lr": 7.014856842381484e-07, "epoch": 2.795969773299748, "percentage": 93.2, "elapsed_time": "1:13:24", "remaining_time": "0:05:21"} |
|
{"current_steps": 3340, "total_steps": 3573, "loss": 1.0708, "lr": 6.451827525288612e-07, "epoch": 2.804366078925273, "percentage": 93.48, "elapsed_time": "1:13:36", "remaining_time": "0:05:08"} |
|
{"current_steps": 3350, "total_steps": 3573, "loss": 1.0772, "lr": 5.912053361680159e-07, "epoch": 2.8127623845507976, "percentage": 93.76, "elapsed_time": "1:13:48", "remaining_time": "0:04:54"} |
|
{"current_steps": 3360, "total_steps": 3573, "loss": 1.0437, "lr": 5.395585891795174e-07, "epoch": 2.8211586901763224, "percentage": 94.04, "elapsed_time": "1:14:01", "remaining_time": "0:04:41"} |
|
{"current_steps": 3370, "total_steps": 3573, "loss": 1.064, "lr": 4.90247443043712e-07, "epoch": 2.829554995801847, "percentage": 94.32, "elapsed_time": "1:14:13", "remaining_time": "0:04:28"} |
|
{"current_steps": 3380, "total_steps": 3573, "loss": 1.0702, "lr": 4.43276606226542e-07, "epoch": 2.837951301427372, "percentage": 94.6, "elapsed_time": "1:14:25", "remaining_time": "0:04:14"} |
|
{"current_steps": 3390, "total_steps": 3573, "loss": 1.0731, "lr": 3.9865056372990763e-07, "epoch": 2.8463476070528966, "percentage": 94.88, "elapsed_time": "1:14:37", "remaining_time": "0:04:01"} |
|
{"current_steps": 3400, "total_steps": 3573, "loss": 1.0576, "lr": 3.563735766634629e-07, "epoch": 2.8547439126784218, "percentage": 95.16, "elapsed_time": "1:14:49", "remaining_time": "0:03:48"} |
|
{"current_steps": 3410, "total_steps": 3573, "loss": 1.0526, "lr": 3.164496818377188e-07, "epoch": 2.863140218303946, "percentage": 95.44, "elapsed_time": "1:15:01", "remaining_time": "0:03:35"} |
|
{"current_steps": 3420, "total_steps": 3573, "loss": 1.0631, "lr": 2.7888269137860413e-07, "epoch": 2.8715365239294712, "percentage": 95.72, "elapsed_time": "1:15:14", "remaining_time": "0:03:21"} |
|
{"current_steps": 3430, "total_steps": 3573, "loss": 1.1013, "lr": 2.436761923634456e-07, "epoch": 2.879932829554996, "percentage": 96.0, "elapsed_time": "1:15:26", "remaining_time": "0:03:08"} |
|
{"current_steps": 3440, "total_steps": 3573, "loss": 1.0737, "lr": 2.108335464784811e-07, "epoch": 2.8883291351805207, "percentage": 96.28, "elapsed_time": "1:15:38", "remaining_time": "0:02:55"} |
|
{"current_steps": 3450, "total_steps": 3573, "loss": 1.0823, "lr": 1.8035788969784638e-07, "epoch": 2.8967254408060454, "percentage": 96.56, "elapsed_time": "1:15:50", "remaining_time": "0:02:42"} |
|
{"current_steps": 3460, "total_steps": 3573, "loss": 1.0692, "lr": 1.522521319841541e-07, "epoch": 2.90512174643157, "percentage": 96.84, "elapsed_time": "1:16:03", "remaining_time": "0:02:29"} |
|
{"current_steps": 3470, "total_steps": 3573, "loss": 1.0698, "lr": 1.2651895701063233e-07, "epoch": 2.913518052057095, "percentage": 97.12, "elapsed_time": "1:16:15", "remaining_time": "0:02:15"} |
|
{"current_steps": 3480, "total_steps": 3573, "loss": 1.0746, "lr": 1.0316082190486298e-07, "epoch": 2.9219143576826196, "percentage": 97.4, "elapsed_time": "1:16:27", "remaining_time": "0:02:02"} |
|
{"current_steps": 3490, "total_steps": 3573, "loss": 1.0454, "lr": 8.217995701418624e-08, "epoch": 2.9303106633081444, "percentage": 97.68, "elapsed_time": "1:16:39", "remaining_time": "0:01:49"} |
|
{"current_steps": 3500, "total_steps": 3573, "loss": 1.056, "lr": 6.35783656927097e-08, "epoch": 2.938706968933669, "percentage": 97.96, "elapsed_time": "1:16:51", "remaining_time": "0:01:36"} |
|
{"current_steps": 3510, "total_steps": 3573, "loss": 1.0689, "lr": 4.7357824110044743e-08, "epoch": 2.947103274559194, "percentage": 98.24, "elapsed_time": "1:17:24", "remaining_time": "0:01:23"} |
|
{"current_steps": 3520, "total_steps": 3573, "loss": 1.0603, "lr": 3.351988108168391e-08, "epoch": 2.9554995801847186, "percentage": 98.52, "elapsed_time": "1:17:37", "remaining_time": "0:01:10"} |
|
{"current_steps": 3530, "total_steps": 3573, "loss": 1.0822, "lr": 2.2065857921133025e-08, "epoch": 2.9638958858102438, "percentage": 98.8, "elapsed_time": "1:17:49", "remaining_time": "0:00:56"} |
|
{"current_steps": 3540, "total_steps": 3573, "loss": 1.075, "lr": 1.2996848313734378e-08, "epoch": 2.972292191435768, "percentage": 99.08, "elapsed_time": "1:18:01", "remaining_time": "0:00:43"} |
|
{"current_steps": 3550, "total_steps": 3573, "loss": 1.0692, "lr": 6.31371821224469e-09, "epoch": 2.9806884970612932, "percentage": 99.36, "elapsed_time": "1:18:13", "remaining_time": "0:00:30"} |
|
{"current_steps": 3560, "total_steps": 3573, "loss": 1.0895, "lr": 2.017105754134607e-09, "epoch": 2.9890848026868175, "percentage": 99.64, "elapsed_time": "1:18:25", "remaining_time": "0:00:17"} |
|
{"current_steps": 3570, "total_steps": 3573, "loss": 1.0465, "lr": 1.0742120067630535e-10, "epoch": 2.9974811083123427, "percentage": 99.92, "elapsed_time": "1:18:37", "remaining_time": "0:00:03"} |
|
{"current_steps": 3573, "total_steps": 3573, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:19:00", "remaining_time": "0:00:00"} |
|
|