open-lilm-v2 / trainer_log.jsonl
0xtaipoian's picture
Upload folder using huggingface_hub
05012b5 verified
{"current_steps": 10, "total_steps": 445, "loss": 3.8476, "learning_rate": 2.222222222222222e-06, "epoch": 0.02244210955829848, "percentage": 2.25, "elapsed_time": "0:13:44", "remaining_time": "9:57:47", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 20, "total_steps": 445, "loss": 3.2218, "learning_rate": 4.444444444444444e-06, "epoch": 0.04488421911659696, "percentage": 4.49, "elapsed_time": "0:27:04", "remaining_time": "9:35:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 30, "total_steps": 445, "loss": 2.9756, "learning_rate": 6.666666666666667e-06, "epoch": 0.06732632867489544, "percentage": 6.74, "elapsed_time": "0:40:32", "remaining_time": "9:20:53", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 40, "total_steps": 445, "loss": 2.88, "learning_rate": 8.888888888888888e-06, "epoch": 0.08976843823319391, "percentage": 8.99, "elapsed_time": "0:54:05", "remaining_time": "9:07:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 50, "total_steps": 445, "loss": 2.8198, "learning_rate": 9.996145181203616e-06, "epoch": 0.11221054779149241, "percentage": 11.24, "elapsed_time": "1:08:29", "remaining_time": "9:01:03", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 60, "total_steps": 445, "loss": 2.8122, "learning_rate": 9.965342284774633e-06, "epoch": 0.13465265734979087, "percentage": 13.48, "elapsed_time": "1:22:54", "remaining_time": "8:51:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 70, "total_steps": 445, "loss": 2.7806, "learning_rate": 9.903926402016153e-06, "epoch": 0.15709476690808935, "percentage": 15.73, "elapsed_time": "1:36:58", "remaining_time": "8:39:31", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 80, "total_steps": 445, "loss": 2.7422, "learning_rate": 9.812276182268236e-06, "epoch": 0.17953687646638783, "percentage": 17.98, "elapsed_time": "1:50:49", "remaining_time": "8:25:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 90, "total_steps": 445, "loss": 2.736, "learning_rate": 9.690956679612422e-06, "epoch": 0.2019789860246863, "percentage": 20.22, "elapsed_time": "2:04:30", "remaining_time": "8:11:08", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 100, "total_steps": 445, "loss": 2.7361, "learning_rate": 9.540715869125407e-06, "epoch": 0.22442109558298481, "percentage": 22.47, "elapsed_time": "2:18:35", "remaining_time": "7:58:07", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 110, "total_steps": 445, "loss": 2.7135, "learning_rate": 9.362480035363987e-06, "epoch": 0.2468632051412833, "percentage": 24.72, "elapsed_time": "2:32:40", "remaining_time": "7:44:59", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 120, "total_steps": 445, "loss": 2.7064, "learning_rate": 9.157348061512728e-06, "epoch": 0.26930531469958174, "percentage": 26.97, "elapsed_time": "2:46:38", "remaining_time": "7:31:19", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 130, "total_steps": 445, "loss": 2.7018, "learning_rate": 8.926584654403725e-06, "epoch": 0.29174742425788025, "percentage": 29.21, "elapsed_time": "3:00:35", "remaining_time": "7:17:36", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 140, "total_steps": 445, "loss": 2.6961, "learning_rate": 8.671612547178428e-06, "epoch": 0.3141895338161787, "percentage": 31.46, "elapsed_time": "3:14:28", "remaining_time": "7:03:40", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 150, "total_steps": 445, "loss": 2.6968, "learning_rate": 8.39400372766471e-06, "epoch": 0.3366316433744772, "percentage": 33.71, "elapsed_time": "3:28:14", "remaining_time": "6:49:33", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 160, "total_steps": 445, "loss": 2.6879, "learning_rate": 8.095469746549172e-06, "epoch": 0.35907375293277566, "percentage": 35.96, "elapsed_time": "3:42:09", "remaining_time": "6:35:43", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 170, "total_steps": 445, "loss": 2.6686, "learning_rate": 7.777851165098012e-06, "epoch": 0.38151586249107416, "percentage": 38.2, "elapsed_time": "3:56:01", "remaining_time": "6:21:48", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 180, "total_steps": 445, "loss": 2.6497, "learning_rate": 7.443106207484776e-06, "epoch": 0.4039579720493726, "percentage": 40.45, "elapsed_time": "4:09:47", "remaining_time": "6:07:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 190, "total_steps": 445, "loss": 2.6413, "learning_rate": 7.093298687687141e-06, "epoch": 0.4264000816076711, "percentage": 42.7, "elapsed_time": "4:23:56", "remaining_time": "5:54:14", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 445, "loss": 2.6472, "learning_rate": 6.730585285387465e-06, "epoch": 0.44884219116596963, "percentage": 44.94, "elapsed_time": "4:37:58", "remaining_time": "5:40:30", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 200, "total_steps": 445, "eval_loss": 2.642993450164795, "epoch": 0.44884219116596963, "percentage": 44.94, "elapsed_time": "4:59:33", "remaining_time": "6:06:57", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 210, "total_steps": 445, "loss": 2.6369, "learning_rate": 6.3572022493253715e-06, "epoch": 0.4712843007242681, "percentage": 47.19, "elapsed_time": "5:13:34", "remaining_time": "5:50:54", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 220, "total_steps": 445, "loss": 2.63, "learning_rate": 5.975451610080643e-06, "epoch": 0.4937264102825666, "percentage": 49.44, "elapsed_time": "5:27:23", "remaining_time": "5:34:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 230, "total_steps": 445, "loss": 2.6209, "learning_rate": 5.587686987289189e-06, "epoch": 0.5161685198408651, "percentage": 51.69, "elapsed_time": "5:41:21", "remaining_time": "5:19:06", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 240, "total_steps": 445, "loss": 2.6318, "learning_rate": 5.1962990787953436e-06, "epoch": 0.5386106293991635, "percentage": 53.93, "elapsed_time": "5:55:03", "remaining_time": "5:03:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 250, "total_steps": 445, "loss": 2.621, "learning_rate": 4.803700921204659e-06, "epoch": 0.561052738957462, "percentage": 56.18, "elapsed_time": "6:08:55", "remaining_time": "4:47:45", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 260, "total_steps": 445, "loss": 2.6161, "learning_rate": 4.4123130127108125e-06, "epoch": 0.5834948485157605, "percentage": 58.43, "elapsed_time": "6:22:39", "remaining_time": "4:32:16", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 270, "total_steps": 445, "loss": 2.6164, "learning_rate": 4.02454838991936e-06, "epoch": 0.605936958074059, "percentage": 60.67, "elapsed_time": "6:36:39", "remaining_time": "4:17:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 280, "total_steps": 445, "loss": 2.6091, "learning_rate": 3.6427977506746293e-06, "epoch": 0.6283790676323574, "percentage": 62.92, "elapsed_time": "6:50:40", "remaining_time": "4:02:00", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 290, "total_steps": 445, "loss": 2.5967, "learning_rate": 3.269414714612534e-06, "epoch": 0.6508211771906559, "percentage": 65.17, "elapsed_time": "7:04:34", "remaining_time": "3:46:55", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 300, "total_steps": 445, "loss": 2.6031, "learning_rate": 2.906701312312861e-06, "epoch": 0.6732632867489544, "percentage": 67.42, "elapsed_time": "7:18:40", "remaining_time": "3:32:01", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 310, "total_steps": 445, "loss": 2.6014, "learning_rate": 2.5568937925152272e-06, "epoch": 0.6957053963072529, "percentage": 69.66, "elapsed_time": "7:32:32", "remaining_time": "3:17:04", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 320, "total_steps": 445, "loss": 2.5978, "learning_rate": 2.2221488349019903e-06, "epoch": 0.7181475058655513, "percentage": 71.91, "elapsed_time": "7:46:30", "remaining_time": "3:02:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 330, "total_steps": 445, "loss": 2.5911, "learning_rate": 1.9045302534508298e-06, "epoch": 0.7405896154238498, "percentage": 74.16, "elapsed_time": "8:00:23", "remaining_time": "2:47:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 340, "total_steps": 445, "loss": 2.5913, "learning_rate": 1.6059962723352912e-06, "epoch": 0.7630317249821483, "percentage": 76.4, "elapsed_time": "8:14:27", "remaining_time": "2:32:42", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 350, "total_steps": 445, "loss": 2.5819, "learning_rate": 1.3283874528215735e-06, "epoch": 0.7854738345404468, "percentage": 78.65, "elapsed_time": "8:28:44", "remaining_time": "2:18:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 360, "total_steps": 445, "loss": 2.5833, "learning_rate": 1.0734153455962765e-06, "epoch": 0.8079159440987452, "percentage": 80.9, "elapsed_time": "8:42:44", "remaining_time": "2:03:25", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 370, "total_steps": 445, "loss": 2.5851, "learning_rate": 8.426519384872733e-07, "epoch": 0.8303580536570437, "percentage": 83.15, "elapsed_time": "8:56:50", "remaining_time": "1:48:49", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 380, "total_steps": 445, "loss": 2.5853, "learning_rate": 6.375199646360142e-07, "epoch": 0.8528001632153422, "percentage": 85.39, "elapsed_time": "9:10:53", "remaining_time": "1:34:13", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 390, "total_steps": 445, "loss": 2.5832, "learning_rate": 4.5928413087459325e-07, "epoch": 0.8752422727736408, "percentage": 87.64, "elapsed_time": "9:24:43", "remaining_time": "1:19:38", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 400, "total_steps": 445, "loss": 2.5779, "learning_rate": 3.0904332038757977e-07, "epoch": 0.8976843823319393, "percentage": 89.89, "elapsed_time": "9:38:32", "remaining_time": "1:05:05", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 400, "total_steps": 445, "eval_loss": 2.582942485809326, "epoch": 0.8976843823319393, "percentage": 89.89, "elapsed_time": "9:59:46", "remaining_time": "1:07:28", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 410, "total_steps": 445, "loss": 2.5833, "learning_rate": 1.8772381773176417e-07, "epoch": 0.9201264918902377, "percentage": 92.13, "elapsed_time": "10:13:48", "remaining_time": "0:52:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 420, "total_steps": 445, "loss": 2.597, "learning_rate": 9.607359798384785e-08, "epoch": 0.9425686014485362, "percentage": 94.38, "elapsed_time": "10:28:05", "remaining_time": "0:37:23", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 430, "total_steps": 445, "loss": 2.5725, "learning_rate": 3.465771522536854e-08, "epoch": 0.9650107110068347, "percentage": 96.63, "elapsed_time": "10:42:08", "remaining_time": "0:22:24", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 440, "total_steps": 445, "loss": 2.575, "learning_rate": 3.854818796385495e-09, "epoch": 0.9874528205651332, "percentage": 98.88, "elapsed_time": "10:55:58", "remaining_time": "0:07:27", "throughput": "0.00", "total_tokens": 0}
{"current_steps": 445, "total_steps": 445, "epoch": 0.9986738753442823, "percentage": 100.0, "elapsed_time": "11:05:37", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}