TianyiQ's picture
Upload folder using huggingface_hub
05ee955 verified
raw
history blame
20 kB
{"current_steps": 1, "total_steps": 192, "loss": 0.8766, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0, "epoch": 0.020833333333333332, "percentage": 0.52, "elapsed_time": "0:00:03", "remaining_time": "0:09:41"}
{"current_steps": 5, "total_steps": 192, "loss": 0.8675, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.25e-06, "epoch": 0.10416666666666667, "percentage": 2.6, "elapsed_time": "0:00:08", "remaining_time": "0:05:18"}
{"current_steps": 5, "total_steps": 192, "loss": null, "eval_loss": 0.8584801554679871, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.10416666666666667, "percentage": 2.6, "elapsed_time": "0:00:08", "remaining_time": "0:05:18"}
{"current_steps": 10, "total_steps": 192, "loss": 0.8415, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.25e-06, "epoch": 0.20833333333333334, "percentage": 5.21, "elapsed_time": "0:00:59", "remaining_time": "0:18:00"}
{"current_steps": 10, "total_steps": 192, "loss": null, "eval_loss": 0.8062803149223328, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.20833333333333334, "percentage": 5.21, "elapsed_time": "0:00:59", "remaining_time": "0:18:00"}
{"current_steps": 15, "total_steps": 192, "loss": 0.8225, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.25e-06, "epoch": 0.3125, "percentage": 7.81, "elapsed_time": "0:01:52", "remaining_time": "0:22:11"}
{"current_steps": 15, "total_steps": 192, "loss": null, "eval_loss": 0.820951521396637, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.3125, "percentage": 7.81, "elapsed_time": "0:01:52", "remaining_time": "0:22:11"}
{"current_steps": 20, "total_steps": 192, "loss": 0.806, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2e-05, "epoch": 0.4166666666666667, "percentage": 10.42, "elapsed_time": "0:03:49", "remaining_time": "0:32:56"}
{"current_steps": 20, "total_steps": 192, "loss": null, "eval_loss": 0.8412486910820007, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.4166666666666667, "percentage": 10.42, "elapsed_time": "0:03:49", "remaining_time": "0:32:56"}
{"current_steps": 25, "total_steps": 192, "loss": 0.8139, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4071209905461127e-05, "epoch": 0.5208333333333334, "percentage": 13.02, "elapsed_time": "0:05:44", "remaining_time": "0:38:20"}
{"current_steps": 25, "total_steps": 192, "loss": null, "eval_loss": 0.8701534867286682, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.5208333333333334, "percentage": 13.02, "elapsed_time": "0:05:44", "remaining_time": "0:38:20"}
{"current_steps": 30, "total_steps": 192, "loss": 0.8978, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0166196232101288e-05, "epoch": 0.625, "percentage": 15.62, "elapsed_time": "0:07:41", "remaining_time": "0:41:30"}
{"current_steps": 30, "total_steps": 192, "loss": null, "eval_loss": 0.8630704879760742, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.625, "percentage": 15.62, "elapsed_time": "0:07:41", "remaining_time": "0:41:30"}
{"current_steps": 35, "total_steps": 192, "loss": 0.814, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.276248845991498e-06, "epoch": 0.7291666666666666, "percentage": 18.23, "elapsed_time": "0:09:38", "remaining_time": "0:43:14"}
{"current_steps": 35, "total_steps": 192, "loss": null, "eval_loss": 0.8549697995185852, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.7291666666666666, "percentage": 18.23, "elapsed_time": "0:09:38", "remaining_time": "0:43:14"}
{"current_steps": 40, "total_steps": 192, "loss": 0.7989, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.157388080190487e-06, "epoch": 0.8333333333333334, "percentage": 20.83, "elapsed_time": "0:11:33", "remaining_time": "0:43:56"}
{"current_steps": 40, "total_steps": 192, "loss": null, "eval_loss": 0.8472943902015686, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.8333333333333334, "percentage": 20.83, "elapsed_time": "0:11:33", "remaining_time": "0:43:56"}
{"current_steps": 45, "total_steps": 192, "loss": 0.8769, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6192313334626905e-06, "epoch": 0.9375, "percentage": 23.44, "elapsed_time": "0:13:28", "remaining_time": "0:44:01"}
{"current_steps": 45, "total_steps": 192, "loss": null, "eval_loss": 0.8382811546325684, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.9375, "percentage": 23.44, "elapsed_time": "0:13:28", "remaining_time": "0:44:01"}
{"current_steps": 50, "total_steps": 192, "loss": 0.7244, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.514391432582838e-06, "epoch": 1.0416666666666667, "percentage": 26.04, "elapsed_time": "0:15:23", "remaining_time": "0:43:43"}
{"current_steps": 50, "total_steps": 192, "loss": null, "eval_loss": 0.8277742266654968, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.0416666666666667, "percentage": 26.04, "elapsed_time": "0:15:23", "remaining_time": "0:43:43"}
{"current_steps": 55, "total_steps": 192, "loss": 0.4644, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7297262757656213e-06, "epoch": 1.1458333333333333, "percentage": 28.65, "elapsed_time": "0:17:17", "remaining_time": "0:43:05"}
{"current_steps": 55, "total_steps": 192, "loss": null, "eval_loss": 0.8387134671211243, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.1458333333333333, "percentage": 28.65, "elapsed_time": "0:17:17", "remaining_time": "0:43:05"}
{"current_steps": 60, "total_steps": 192, "loss": 0.4488, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.1791620375982074e-06, "epoch": 1.25, "percentage": 31.25, "elapsed_time": "0:19:12", "remaining_time": "0:42:16"}
{"current_steps": 60, "total_steps": 192, "loss": null, "eval_loss": 0.8680305480957031, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.25, "percentage": 31.25, "elapsed_time": "0:19:12", "remaining_time": "0:42:16"}
{"current_steps": 65, "total_steps": 192, "loss": 0.3973, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.978466092394693e-07, "epoch": 1.3541666666666667, "percentage": 33.85, "elapsed_time": "0:21:07", "remaining_time": "0:41:15"}
{"current_steps": 65, "total_steps": 192, "loss": null, "eval_loss": 0.8717625737190247, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.3541666666666667, "percentage": 33.85, "elapsed_time": "0:21:07", "remaining_time": "0:41:15"}
{"current_steps": 70, "total_steps": 192, "loss": 0.443, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.374210410959207e-07, "epoch": 1.4583333333333333, "percentage": 36.46, "elapsed_time": "0:22:59", "remaining_time": "0:40:03"}
{"current_steps": 70, "total_steps": 192, "loss": null, "eval_loss": 0.8596016764640808, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.4583333333333333, "percentage": 36.46, "elapsed_time": "0:22:59", "remaining_time": "0:40:03"}
{"current_steps": 75, "total_steps": 192, "loss": 0.4346, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6222476698215175e-07, "epoch": 1.5625, "percentage": 39.06, "elapsed_time": "0:24:51", "remaining_time": "0:38:46"}
{"current_steps": 75, "total_steps": 192, "loss": null, "eval_loss": 0.8514222502708435, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.5625, "percentage": 39.06, "elapsed_time": "0:24:51", "remaining_time": "0:38:46"}
{"current_steps": 80, "total_steps": 192, "loss": 0.4701, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.462755297384099e-07, "epoch": 1.6666666666666665, "percentage": 41.67, "elapsed_time": "0:26:44", "remaining_time": "0:37:25"}
{"current_steps": 80, "total_steps": 192, "loss": null, "eval_loss": 0.8461114764213562, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.6666666666666665, "percentage": 41.67, "elapsed_time": "0:26:44", "remaining_time": "0:37:25"}
{"current_steps": 85, "total_steps": 192, "loss": 0.4344, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7088740175034947e-07, "epoch": 1.7708333333333335, "percentage": 44.27, "elapsed_time": "0:28:36", "remaining_time": "0:36:00"}
{"current_steps": 85, "total_steps": 192, "loss": null, "eval_loss": 0.8437052369117737, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.7708333333333335, "percentage": 44.27, "elapsed_time": "0:28:36", "remaining_time": "0:36:00"}
{"current_steps": 90, "total_steps": 192, "loss": 0.4274, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.228102956599465e-07, "epoch": 1.875, "percentage": 46.88, "elapsed_time": "0:30:27", "remaining_time": "0:34:31"}
{"current_steps": 90, "total_steps": 192, "loss": null, "eval_loss": 0.8434357643127441, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.875, "percentage": 46.88, "elapsed_time": "0:30:27", "remaining_time": "0:34:31"}
{"current_steps": 95, "total_steps": 192, "loss": 0.4771, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.279207916081227e-08, "epoch": 1.9791666666666665, "percentage": 49.48, "elapsed_time": "0:32:20", "remaining_time": "0:33:01"}
{"current_steps": 95, "total_steps": 192, "loss": null, "eval_loss": 0.8434197902679443, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.9791666666666665, "percentage": 49.48, "elapsed_time": "0:32:20", "remaining_time": "0:33:01"}
{"current_steps": 100, "total_steps": 192, "loss": 0.3876, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.448002404850094e-08, "epoch": 2.0833333333333335, "percentage": 52.08, "elapsed_time": "0:34:12", "remaining_time": "0:31:28"}
{"current_steps": 100, "total_steps": 192, "loss": null, "eval_loss": 0.8438728451728821, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.0833333333333335, "percentage": 52.08, "elapsed_time": "0:34:12", "remaining_time": "0:31:28"}
{"current_steps": 105, "total_steps": 192, "loss": 0.3698, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.35920070839697e-08, "epoch": 2.1875, "percentage": 54.69, "elapsed_time": "0:36:01", "remaining_time": "0:29:51"}
{"current_steps": 105, "total_steps": 192, "loss": null, "eval_loss": 0.845079243183136, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.1875, "percentage": 54.69, "elapsed_time": "0:36:01", "remaining_time": "0:29:51"}
{"current_steps": 110, "total_steps": 192, "loss": 0.407, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.7299804687499997e-08, "epoch": 2.2916666666666665, "percentage": 57.29, "elapsed_time": "0:37:49", "remaining_time": "0:28:12"}
{"current_steps": 110, "total_steps": 192, "loss": null, "eval_loss": 0.8465444445610046, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.2916666666666665, "percentage": 57.29, "elapsed_time": "0:37:49", "remaining_time": "0:28:12"}
{"current_steps": 115, "total_steps": 192, "loss": 0.374, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.37771434967624e-08, "epoch": 2.3958333333333335, "percentage": 59.9, "elapsed_time": "0:39:40", "remaining_time": "0:26:33"}
{"current_steps": 115, "total_steps": 192, "loss": null, "eval_loss": 0.8481599688529968, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.3958333333333335, "percentage": 59.9, "elapsed_time": "0:39:40", "remaining_time": "0:26:33"}
{"current_steps": 120, "total_steps": 192, "loss": 0.3945, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.187403540619925e-08, "epoch": 2.5, "percentage": 62.5, "elapsed_time": "0:41:28", "remaining_time": "0:24:53"}
{"current_steps": 120, "total_steps": 192, "loss": null, "eval_loss": 0.8498236536979675, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.5, "percentage": 62.5, "elapsed_time": "0:41:28", "remaining_time": "0:24:53"}
{"current_steps": 125, "total_steps": 192, "loss": 0.3753, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.088648238966908e-08, "epoch": 2.6041666666666665, "percentage": 65.1, "elapsed_time": "0:43:19", "remaining_time": "0:23:13"}
{"current_steps": 125, "total_steps": 192, "loss": null, "eval_loss": 0.8512565493583679, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.6041666666666665, "percentage": 65.1, "elapsed_time": "0:43:19", "remaining_time": "0:23:13"}
{"current_steps": 130, "total_steps": 192, "loss": 0.3721, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.039701925276604e-08, "epoch": 2.7083333333333335, "percentage": 67.71, "elapsed_time": "0:45:11", "remaining_time": "0:21:32"}
{"current_steps": 130, "total_steps": 192, "loss": null, "eval_loss": 0.8527700304985046, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.7083333333333335, "percentage": 67.71, "elapsed_time": "0:45:11", "remaining_time": "0:21:32"}
{"current_steps": 135, "total_steps": 192, "loss": 0.3718, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0166900048082497e-08, "epoch": 2.8125, "percentage": 70.31, "elapsed_time": "0:47:01", "remaining_time": "0:19:51"}
{"current_steps": 135, "total_steps": 192, "loss": null, "eval_loss": 0.8541720509529114, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.8125, "percentage": 70.31, "elapsed_time": "0:47:01", "remaining_time": "0:19:51"}
{"current_steps": 140, "total_steps": 192, "loss": 0.3773, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0065147322870076e-08, "epoch": 2.9166666666666665, "percentage": 72.92, "elapsed_time": "0:48:51", "remaining_time": "0:18:09"}
{"current_steps": 140, "total_steps": 192, "loss": null, "eval_loss": 0.8555252552032471, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.9166666666666665, "percentage": 72.92, "elapsed_time": "0:48:51", "remaining_time": "0:18:09"}
{"current_steps": 145, "total_steps": 192, "loss": 0.3723, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.002328628528332e-08, "epoch": 3.0208333333333335, "percentage": 75.52, "elapsed_time": "0:50:40", "remaining_time": "0:16:25"}
{"current_steps": 145, "total_steps": 192, "loss": null, "eval_loss": 0.8565484881401062, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.0208333333333335, "percentage": 75.52, "elapsed_time": "0:50:40", "remaining_time": "0:16:25"}
{"current_steps": 150, "total_steps": 192, "loss": 0.374, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0007484528133236e-08, "epoch": 3.125, "percentage": 78.12, "elapsed_time": "0:52:32", "remaining_time": "0:14:42"}
{"current_steps": 150, "total_steps": 192, "loss": null, "eval_loss": 0.8576194643974304, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.125, "percentage": 78.12, "elapsed_time": "0:52:32", "remaining_time": "0:14:42"}
{"current_steps": 155, "total_steps": 192, "loss": 0.3728, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0002110817570477e-08, "epoch": 3.2291666666666665, "percentage": 80.73, "elapsed_time": "0:54:21", "remaining_time": "0:12:58"}
{"current_steps": 155, "total_steps": 192, "loss": null, "eval_loss": 0.8588044047355652, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.2291666666666665, "percentage": 80.73, "elapsed_time": "0:54:21", "remaining_time": "0:12:58"}
{"current_steps": 160, "total_steps": 192, "loss": 0.3686, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000504842356326e-08, "epoch": 3.3333333333333335, "percentage": 83.33, "elapsed_time": "0:56:13", "remaining_time": "0:11:14"}
{"current_steps": 160, "total_steps": 192, "loss": null, "eval_loss": 0.859791100025177, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.3333333333333335, "percentage": 83.33, "elapsed_time": "0:56:13", "remaining_time": "0:11:14"}
{"current_steps": 165, "total_steps": 192, "loss": 0.3617, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000009745562451e-08, "epoch": 3.4375, "percentage": 85.94, "elapsed_time": "0:58:03", "remaining_time": "0:09:29"}
{"current_steps": 165, "total_steps": 192, "loss": null, "eval_loss": 0.8607122302055359, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.4375, "percentage": 85.94, "elapsed_time": "0:58:03", "remaining_time": "0:09:29"}
{"current_steps": 170, "total_steps": 192, "loss": 0.3546, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000014077810156e-08, "epoch": 3.5416666666666665, "percentage": 88.54, "elapsed_time": "0:59:52", "remaining_time": "0:07:44"}
{"current_steps": 170, "total_steps": 192, "loss": null, "eval_loss": 0.8613293170928955, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.5416666666666665, "percentage": 88.54, "elapsed_time": "0:59:52", "remaining_time": "0:07:44"}
{"current_steps": 175, "total_steps": 192, "loss": 0.3707, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000001343508807e-08, "epoch": 3.6458333333333335, "percentage": 91.15, "elapsed_time": "1:01:40", "remaining_time": "0:05:59"}
{"current_steps": 175, "total_steps": 192, "loss": null, "eval_loss": 0.8619220852851868, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.6458333333333335, "percentage": 91.15, "elapsed_time": "1:01:40", "remaining_time": "0:05:59"}
{"current_steps": 180, "total_steps": 192, "loss": 0.3739, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000000006747581e-08, "epoch": 3.75, "percentage": 93.75, "elapsed_time": "1:03:31", "remaining_time": "0:04:14"}
{"current_steps": 180, "total_steps": 192, "loss": null, "eval_loss": 0.862490177154541, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.75, "percentage": 93.75, "elapsed_time": "1:03:31", "remaining_time": "0:04:14"}
{"current_steps": 185, "total_steps": 192, "loss": 0.3617, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000000001094325e-08, "epoch": 3.8541666666666665, "percentage": 96.35, "elapsed_time": "1:05:21", "remaining_time": "0:02:28"}
{"current_steps": 185, "total_steps": 192, "loss": null, "eval_loss": 0.8631939888000488, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.8541666666666665, "percentage": 96.35, "elapsed_time": "1:05:21", "remaining_time": "0:02:28"}
{"current_steps": 190, "total_steps": 192, "loss": 0.3591, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000000000000139e-08, "epoch": 3.9583333333333335, "percentage": 98.96, "elapsed_time": "1:07:12", "remaining_time": "0:00:42"}
{"current_steps": 190, "total_steps": 192, "loss": null, "eval_loss": 0.8637197613716125, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.9583333333333335, "percentage": 98.96, "elapsed_time": "1:07:12", "remaining_time": "0:00:42"}
{"current_steps": 192, "total_steps": 192, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "1:08:56", "remaining_time": "0:00:00"}
{"current_steps": 3, "total_steps": 3, "loss": null, "eval_loss": 0.8062803149223328, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "1:09:34", "remaining_time": "0:00:00"}