File size: 13,265 Bytes
56f1801
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
{"current_steps": 10, "total_steps": 2022, "loss": 0.6862, "learning_rate": 5e-06, "epoch": 0.014825796886582653, "percentage": 0.49, "elapsed_time": "0:01:32", "remaining_time": "5:09:22"}
{"current_steps": 20, "total_steps": 2022, "loss": 0.6305, "learning_rate": 5e-06, "epoch": 0.029651593773165306, "percentage": 0.99, "elapsed_time": "0:02:54", "remaining_time": "4:51:51"}
{"current_steps": 30, "total_steps": 2022, "loss": 0.5946, "learning_rate": 5e-06, "epoch": 0.04447739065974796, "percentage": 1.48, "elapsed_time": "0:04:17", "remaining_time": "4:45:26"}
{"current_steps": 40, "total_steps": 2022, "loss": 0.5858, "learning_rate": 5e-06, "epoch": 0.05930318754633061, "percentage": 1.98, "elapsed_time": "0:05:41", "remaining_time": "4:41:42"}
{"current_steps": 50, "total_steps": 2022, "loss": 0.5662, "learning_rate": 5e-06, "epoch": 0.07412898443291327, "percentage": 2.47, "elapsed_time": "0:07:03", "remaining_time": "4:38:37"}
{"current_steps": 60, "total_steps": 2022, "loss": 0.564, "learning_rate": 5e-06, "epoch": 0.08895478131949593, "percentage": 2.97, "elapsed_time": "0:08:26", "remaining_time": "4:36:12"}
{"current_steps": 70, "total_steps": 2022, "loss": 0.5536, "learning_rate": 5e-06, "epoch": 0.10378057820607858, "percentage": 3.46, "elapsed_time": "0:09:50", "remaining_time": "4:34:22"}
{"current_steps": 80, "total_steps": 2022, "loss": 0.5447, "learning_rate": 5e-06, "epoch": 0.11860637509266123, "percentage": 3.96, "elapsed_time": "0:11:14", "remaining_time": "4:32:44"}
{"current_steps": 90, "total_steps": 2022, "loss": 0.5466, "learning_rate": 5e-06, "epoch": 0.1334321719792439, "percentage": 4.45, "elapsed_time": "0:12:37", "remaining_time": "4:31:07"}
{"current_steps": 100, "total_steps": 2022, "loss": 0.5354, "learning_rate": 5e-06, "epoch": 0.14825796886582654, "percentage": 4.95, "elapsed_time": "0:14:01", "remaining_time": "4:29:33"}
{"current_steps": 110, "total_steps": 2022, "loss": 0.535, "learning_rate": 5e-06, "epoch": 0.16308376575240918, "percentage": 5.44, "elapsed_time": "0:15:25", "remaining_time": "4:28:02"}
{"current_steps": 120, "total_steps": 2022, "loss": 0.5338, "learning_rate": 5e-06, "epoch": 0.17790956263899185, "percentage": 5.93, "elapsed_time": "0:16:48", "remaining_time": "4:26:28"}
{"current_steps": 130, "total_steps": 2022, "loss": 0.5301, "learning_rate": 5e-06, "epoch": 0.1927353595255745, "percentage": 6.43, "elapsed_time": "0:18:11", "remaining_time": "4:24:39"}
{"current_steps": 140, "total_steps": 2022, "loss": 0.5263, "learning_rate": 5e-06, "epoch": 0.20756115641215717, "percentage": 6.92, "elapsed_time": "0:19:33", "remaining_time": "4:22:57"}
{"current_steps": 150, "total_steps": 2022, "loss": 0.5248, "learning_rate": 5e-06, "epoch": 0.2223869532987398, "percentage": 7.42, "elapsed_time": "0:20:56", "remaining_time": "4:21:21"}
{"current_steps": 160, "total_steps": 2022, "loss": 0.5279, "learning_rate": 5e-06, "epoch": 0.23721275018532245, "percentage": 7.91, "elapsed_time": "0:22:19", "remaining_time": "4:19:48"}
{"current_steps": 170, "total_steps": 2022, "loss": 0.526, "learning_rate": 5e-06, "epoch": 0.2520385470719051, "percentage": 8.41, "elapsed_time": "0:23:42", "remaining_time": "4:18:21"}
{"current_steps": 180, "total_steps": 2022, "loss": 0.5224, "learning_rate": 5e-06, "epoch": 0.2668643439584878, "percentage": 8.9, "elapsed_time": "0:25:06", "remaining_time": "4:16:51"}
{"current_steps": 190, "total_steps": 2022, "loss": 0.52, "learning_rate": 5e-06, "epoch": 0.28169014084507044, "percentage": 9.4, "elapsed_time": "0:26:29", "remaining_time": "4:15:26"}
{"current_steps": 200, "total_steps": 2022, "loss": 0.5179, "learning_rate": 5e-06, "epoch": 0.2965159377316531, "percentage": 9.89, "elapsed_time": "0:27:53", "remaining_time": "4:14:05"}
{"current_steps": 210, "total_steps": 2022, "loss": 0.5182, "learning_rate": 5e-06, "epoch": 0.3113417346182357, "percentage": 10.39, "elapsed_time": "0:29:17", "remaining_time": "4:12:40"}
{"current_steps": 220, "total_steps": 2022, "loss": 0.5104, "learning_rate": 5e-06, "epoch": 0.32616753150481836, "percentage": 10.88, "elapsed_time": "0:30:40", "remaining_time": "4:11:13"}
{"current_steps": 230, "total_steps": 2022, "loss": 0.5131, "learning_rate": 5e-06, "epoch": 0.34099332839140106, "percentage": 11.37, "elapsed_time": "0:32:03", "remaining_time": "4:09:46"}
{"current_steps": 240, "total_steps": 2022, "loss": 0.5191, "learning_rate": 5e-06, "epoch": 0.3558191252779837, "percentage": 11.87, "elapsed_time": "0:33:26", "remaining_time": "4:08:18"}
{"current_steps": 250, "total_steps": 2022, "loss": 0.5093, "learning_rate": 5e-06, "epoch": 0.37064492216456635, "percentage": 12.36, "elapsed_time": "0:34:49", "remaining_time": "4:06:52"}
{"current_steps": 260, "total_steps": 2022, "loss": 0.5161, "learning_rate": 5e-06, "epoch": 0.385470719051149, "percentage": 12.86, "elapsed_time": "0:36:13", "remaining_time": "4:05:26"}
{"current_steps": 270, "total_steps": 2022, "loss": 0.5178, "learning_rate": 5e-06, "epoch": 0.40029651593773163, "percentage": 13.35, "elapsed_time": "0:37:36", "remaining_time": "4:04:01"}
{"current_steps": 280, "total_steps": 2022, "loss": 0.5142, "learning_rate": 5e-06, "epoch": 0.41512231282431433, "percentage": 13.85, "elapsed_time": "0:38:59", "remaining_time": "4:02:36"}
{"current_steps": 290, "total_steps": 2022, "loss": 0.5125, "learning_rate": 5e-06, "epoch": 0.429948109710897, "percentage": 14.34, "elapsed_time": "0:40:22", "remaining_time": "4:01:09"}
{"current_steps": 300, "total_steps": 2022, "loss": 0.5078, "learning_rate": 5e-06, "epoch": 0.4447739065974796, "percentage": 14.84, "elapsed_time": "0:41:45", "remaining_time": "3:59:43"}
{"current_steps": 310, "total_steps": 2022, "loss": 0.5045, "learning_rate": 5e-06, "epoch": 0.45959970348406226, "percentage": 15.33, "elapsed_time": "0:43:08", "remaining_time": "3:58:17"}
{"current_steps": 320, "total_steps": 2022, "loss": 0.5047, "learning_rate": 5e-06, "epoch": 0.4744255003706449, "percentage": 15.83, "elapsed_time": "0:44:32", "remaining_time": "3:56:51"}
{"current_steps": 330, "total_steps": 2022, "loss": 0.5067, "learning_rate": 5e-06, "epoch": 0.4892512972572276, "percentage": 16.32, "elapsed_time": "0:45:55", "remaining_time": "3:55:26"}
{"current_steps": 340, "total_steps": 2022, "loss": 0.5135, "learning_rate": 5e-06, "epoch": 0.5040770941438102, "percentage": 16.82, "elapsed_time": "0:47:18", "remaining_time": "3:54:01"}
{"current_steps": 350, "total_steps": 2022, "loss": 0.5034, "learning_rate": 5e-06, "epoch": 0.5189028910303929, "percentage": 17.31, "elapsed_time": "0:48:41", "remaining_time": "3:52:36"}
{"current_steps": 360, "total_steps": 2022, "loss": 0.5048, "learning_rate": 5e-06, "epoch": 0.5337286879169756, "percentage": 17.8, "elapsed_time": "0:50:04", "remaining_time": "3:51:12"}
{"current_steps": 370, "total_steps": 2022, "loss": 0.4991, "learning_rate": 5e-06, "epoch": 0.5485544848035582, "percentage": 18.3, "elapsed_time": "0:51:27", "remaining_time": "3:49:47"}
{"current_steps": 380, "total_steps": 2022, "loss": 0.5025, "learning_rate": 5e-06, "epoch": 0.5633802816901409, "percentage": 18.79, "elapsed_time": "0:52:51", "remaining_time": "3:48:25"}
{"current_steps": 390, "total_steps": 2022, "loss": 0.5072, "learning_rate": 5e-06, "epoch": 0.5782060785767235, "percentage": 19.29, "elapsed_time": "0:54:15", "remaining_time": "3:47:02"}
{"current_steps": 400, "total_steps": 2022, "loss": 0.4948, "learning_rate": 5e-06, "epoch": 0.5930318754633062, "percentage": 19.78, "elapsed_time": "0:55:38", "remaining_time": "3:45:37"}
{"current_steps": 410, "total_steps": 2022, "loss": 0.5024, "learning_rate": 5e-06, "epoch": 0.6078576723498889, "percentage": 20.28, "elapsed_time": "0:57:01", "remaining_time": "3:44:13"}
{"current_steps": 420, "total_steps": 2022, "loss": 0.5034, "learning_rate": 5e-06, "epoch": 0.6226834692364714, "percentage": 20.77, "elapsed_time": "0:58:25", "remaining_time": "3:42:51"}
{"current_steps": 430, "total_steps": 2022, "loss": 0.4912, "learning_rate": 5e-06, "epoch": 0.6375092661230541, "percentage": 21.27, "elapsed_time": "0:59:48", "remaining_time": "3:41:26"}
{"current_steps": 440, "total_steps": 2022, "loss": 0.4898, "learning_rate": 5e-06, "epoch": 0.6523350630096367, "percentage": 21.76, "elapsed_time": "1:01:11", "remaining_time": "3:40:01"}
{"current_steps": 450, "total_steps": 2022, "loss": 0.5027, "learning_rate": 5e-06, "epoch": 0.6671608598962194, "percentage": 22.26, "elapsed_time": "1:02:35", "remaining_time": "3:38:38"}
{"current_steps": 460, "total_steps": 2022, "loss": 0.49, "learning_rate": 5e-06, "epoch": 0.6819866567828021, "percentage": 22.75, "elapsed_time": "1:03:58", "remaining_time": "3:37:13"}
{"current_steps": 470, "total_steps": 2022, "loss": 0.4962, "learning_rate": 5e-06, "epoch": 0.6968124536693847, "percentage": 23.24, "elapsed_time": "1:05:21", "remaining_time": "3:35:49"}
{"current_steps": 480, "total_steps": 2022, "loss": 0.4979, "learning_rate": 5e-06, "epoch": 0.7116382505559674, "percentage": 23.74, "elapsed_time": "1:06:44", "remaining_time": "3:34:24"}
{"current_steps": 490, "total_steps": 2022, "loss": 0.4982, "learning_rate": 5e-06, "epoch": 0.72646404744255, "percentage": 24.23, "elapsed_time": "1:08:07", "remaining_time": "3:33:00"}
{"current_steps": 500, "total_steps": 2022, "loss": 0.4891, "learning_rate": 5e-06, "epoch": 0.7412898443291327, "percentage": 24.73, "elapsed_time": "1:09:30", "remaining_time": "3:31:35"}
{"current_steps": 510, "total_steps": 2022, "loss": 0.5006, "learning_rate": 5e-06, "epoch": 0.7561156412157154, "percentage": 25.22, "elapsed_time": "1:10:53", "remaining_time": "3:30:11"}
{"current_steps": 520, "total_steps": 2022, "loss": 0.4966, "learning_rate": 5e-06, "epoch": 0.770941438102298, "percentage": 25.72, "elapsed_time": "1:12:16", "remaining_time": "3:28:46"}
{"current_steps": 530, "total_steps": 2022, "loss": 0.4962, "learning_rate": 5e-06, "epoch": 0.7857672349888807, "percentage": 26.21, "elapsed_time": "1:13:39", "remaining_time": "3:27:21"}
{"current_steps": 540, "total_steps": 2022, "loss": 0.4947, "learning_rate": 5e-06, "epoch": 0.8005930318754633, "percentage": 26.71, "elapsed_time": "1:15:02", "remaining_time": "3:25:57"}
{"current_steps": 550, "total_steps": 2022, "loss": 0.4919, "learning_rate": 5e-06, "epoch": 0.815418828762046, "percentage": 27.2, "elapsed_time": "1:16:25", "remaining_time": "3:24:32"}
{"current_steps": 560, "total_steps": 2022, "loss": 0.4864, "learning_rate": 5e-06, "epoch": 0.8302446256486287, "percentage": 27.7, "elapsed_time": "1:17:48", "remaining_time": "3:23:08"}
{"current_steps": 570, "total_steps": 2022, "loss": 0.4926, "learning_rate": 5e-06, "epoch": 0.8450704225352113, "percentage": 28.19, "elapsed_time": "1:19:11", "remaining_time": "3:21:43"}
{"current_steps": 580, "total_steps": 2022, "loss": 0.4877, "learning_rate": 5e-06, "epoch": 0.859896219421794, "percentage": 28.68, "elapsed_time": "1:20:34", "remaining_time": "3:20:20"}
{"current_steps": 590, "total_steps": 2022, "loss": 0.4903, "learning_rate": 5e-06, "epoch": 0.8747220163083765, "percentage": 29.18, "elapsed_time": "1:21:58", "remaining_time": "3:18:57"}
{"current_steps": 600, "total_steps": 2022, "loss": 0.4945, "learning_rate": 5e-06, "epoch": 0.8895478131949592, "percentage": 29.67, "elapsed_time": "1:23:21", "remaining_time": "3:17:33"}
{"current_steps": 610, "total_steps": 2022, "loss": 0.4898, "learning_rate": 5e-06, "epoch": 0.9043736100815419, "percentage": 30.17, "elapsed_time": "1:24:45", "remaining_time": "3:16:10"}
{"current_steps": 620, "total_steps": 2022, "loss": 0.4916, "learning_rate": 5e-06, "epoch": 0.9191994069681245, "percentage": 30.66, "elapsed_time": "1:26:08", "remaining_time": "3:14:48"}
{"current_steps": 630, "total_steps": 2022, "loss": 0.4876, "learning_rate": 5e-06, "epoch": 0.9340252038547072, "percentage": 31.16, "elapsed_time": "1:27:32", "remaining_time": "3:13:24"}
{"current_steps": 640, "total_steps": 2022, "loss": 0.4911, "learning_rate": 5e-06, "epoch": 0.9488510007412898, "percentage": 31.65, "elapsed_time": "1:28:55", "remaining_time": "3:12:00"}
{"current_steps": 650, "total_steps": 2022, "loss": 0.4907, "learning_rate": 5e-06, "epoch": 0.9636767976278725, "percentage": 32.15, "elapsed_time": "1:30:18", "remaining_time": "3:10:36"}
{"current_steps": 660, "total_steps": 2022, "loss": 0.4864, "learning_rate": 5e-06, "epoch": 0.9785025945144552, "percentage": 32.64, "elapsed_time": "1:31:41", "remaining_time": "3:09:12"}
{"current_steps": 670, "total_steps": 2022, "loss": 0.4886, "learning_rate": 5e-06, "epoch": 0.9933283914010378, "percentage": 33.14, "elapsed_time": "1:33:03", "remaining_time": "3:07:47"}
{"current_steps": 674, "total_steps": 2022, "eval_loss": 0.489400178194046, "epoch": 0.9992587101556709, "percentage": 33.33, "elapsed_time": "1:35:39", "remaining_time": "3:11:18"}
{"current_steps": 680, "total_steps": 2022, "loss": 0.4775, "learning_rate": 5e-06, "epoch": 1.0081541882876204, "percentage": 33.63, "elapsed_time": "1:37:17", "remaining_time": "3:12:01"}
{"current_steps": 690, "total_steps": 2022, "loss": 0.4344, "learning_rate": 5e-06, "epoch": 1.0229799851742032, "percentage": 34.12, "elapsed_time": "1:38:40", "remaining_time": "3:10:28"}