TianyiQ's picture
Upload folder using huggingface_hub
aeb3166 verified
{"current_steps": 1, "total_steps": 192, "loss": 0.9805, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0, "epoch": 0.020833333333333332, "percentage": 0.52, "elapsed_time": "0:00:21", "remaining_time": "1:08:51"}
{"current_steps": 1, "total_steps": 192, "loss": null, "eval_loss": 0.9736970067024231, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.020833333333333332, "percentage": 0.52, "elapsed_time": "0:00:21", "remaining_time": "1:08:51"}
{"current_steps": 5, "total_steps": 192, "loss": 0.9446, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5e-06, "epoch": 0.10416666666666667, "percentage": 2.6, "elapsed_time": "0:01:25", "remaining_time": "0:53:13"}
{"current_steps": 5, "total_steps": 192, "loss": null, "eval_loss": 0.9454841613769531, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.10416666666666667, "percentage": 2.6, "elapsed_time": "0:01:25", "remaining_time": "0:53:13"}
{"current_steps": 10, "total_steps": 192, "loss": 0.8481, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.25e-06, "epoch": 0.20833333333333334, "percentage": 5.21, "elapsed_time": "0:04:04", "remaining_time": "1:14:01"}
{"current_steps": 10, "total_steps": 192, "loss": null, "eval_loss": 0.8153812289237976, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.20833333333333334, "percentage": 5.21, "elapsed_time": "0:04:04", "remaining_time": "1:14:01"}
{"current_steps": 15, "total_steps": 192, "loss": 0.7794, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9e-06, "epoch": 0.3125, "percentage": 7.81, "elapsed_time": "0:06:37", "remaining_time": "1:18:10"}
{"current_steps": 15, "total_steps": 192, "loss": null, "eval_loss": 0.8123041987419128, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.3125, "percentage": 7.81, "elapsed_time": "0:06:37", "remaining_time": "1:18:10"}
{"current_steps": 20, "total_steps": 192, "loss": 0.7798, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.275e-05, "epoch": 0.4166666666666667, "percentage": 10.42, "elapsed_time": "0:09:16", "remaining_time": "1:19:44"}
{"current_steps": 20, "total_steps": 192, "loss": null, "eval_loss": 0.8410752415657043, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.4166666666666667, "percentage": 10.42, "elapsed_time": "0:09:16", "remaining_time": "1:19:44"}
{"current_steps": 25, "total_steps": 192, "loss": 0.8576, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.3195176200175283e-05, "epoch": 0.5208333333333334, "percentage": 13.02, "elapsed_time": "0:11:57", "remaining_time": "1:19:51"}
{"current_steps": 25, "total_steps": 192, "loss": null, "eval_loss": 0.8676239848136902, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.5208333333333334, "percentage": 13.02, "elapsed_time": "0:11:57", "remaining_time": "1:19:51"}
{"current_steps": 30, "total_steps": 192, "loss": 0.8852, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.515676612044427e-06, "epoch": 0.625, "percentage": 15.62, "elapsed_time": "0:14:41", "remaining_time": "1:19:17"}
{"current_steps": 30, "total_steps": 192, "loss": null, "eval_loss": 0.867268979549408, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.625, "percentage": 15.62, "elapsed_time": "0:14:41", "remaining_time": "1:19:17"}
{"current_steps": 35, "total_steps": 192, "loss": 0.8529, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.797580677308734e-06, "epoch": 0.7291666666666666, "percentage": 18.23, "elapsed_time": "0:17:12", "remaining_time": "1:17:10"}
{"current_steps": 35, "total_steps": 192, "loss": null, "eval_loss": 0.8560981154441833, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.7291666666666666, "percentage": 18.23, "elapsed_time": "0:17:12", "remaining_time": "1:17:10"}
{"current_steps": 40, "total_steps": 192, "loss": 0.8224, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.808575415542887e-06, "epoch": 0.8333333333333334, "percentage": 20.83, "elapsed_time": "0:19:49", "remaining_time": "1:15:19"}
{"current_steps": 40, "total_steps": 192, "loss": null, "eval_loss": 0.8470456004142761, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.8333333333333334, "percentage": 20.83, "elapsed_time": "0:19:49", "remaining_time": "1:15:19"}
{"current_steps": 45, "total_steps": 192, "loss": 0.8536, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.3676619069852654e-06, "epoch": 0.9375, "percentage": 23.44, "elapsed_time": "0:22:24", "remaining_time": "1:13:13"}
{"current_steps": 45, "total_steps": 192, "loss": null, "eval_loss": 0.8378292918205261, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.9375, "percentage": 23.44, "elapsed_time": "0:22:24", "remaining_time": "1:13:13"}
{"current_steps": 50, "total_steps": 192, "loss": 0.662, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.334947896124909e-06, "epoch": 1.0416666666666667, "percentage": 26.04, "elapsed_time": "0:25:01", "remaining_time": "1:11:05"}
{"current_steps": 50, "total_steps": 192, "loss": null, "eval_loss": 0.8293696045875549, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.0416666666666667, "percentage": 26.04, "elapsed_time": "0:25:01", "remaining_time": "1:11:05"}
{"current_steps": 55, "total_steps": 192, "loss": 0.437, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.603233215095547e-06, "epoch": 1.1458333333333333, "percentage": 28.65, "elapsed_time": "0:27:38", "remaining_time": "1:08:51"}
{"current_steps": 55, "total_steps": 192, "loss": null, "eval_loss": 0.8531150817871094, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.1458333333333333, "percentage": 28.65, "elapsed_time": "0:27:38", "remaining_time": "1:08:51"}
{"current_steps": 60, "total_steps": 192, "loss": 0.4402, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0911174606561334e-06, "epoch": 1.25, "percentage": 31.25, "elapsed_time": "0:30:17", "remaining_time": "1:06:37"}
{"current_steps": 60, "total_steps": 192, "loss": null, "eval_loss": 0.8569180369377136, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.25, "percentage": 31.25, "elapsed_time": "0:30:17", "remaining_time": "1:06:37"}
{"current_steps": 65, "total_steps": 192, "loss": 0.4244, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.373930741131784e-07, "epoch": 1.3541666666666667, "percentage": 33.85, "elapsed_time": "0:32:53", "remaining_time": "1:04:15"}
{"current_steps": 65, "total_steps": 192, "loss": null, "eval_loss": 0.8569238185882568, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.3541666666666667, "percentage": 33.85, "elapsed_time": "0:32:53", "remaining_time": "1:04:15"}
{"current_steps": 70, "total_steps": 192, "loss": 0.4495, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.374210410959207e-07, "epoch": 1.4583333333333333, "percentage": 36.46, "elapsed_time": "0:35:28", "remaining_time": "1:01:50"}
{"current_steps": 70, "total_steps": 192, "loss": null, "eval_loss": 0.8547163605690002, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.4583333333333333, "percentage": 36.46, "elapsed_time": "0:35:28", "remaining_time": "1:01:50"}
{"current_steps": 75, "total_steps": 192, "loss": 0.4689, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6222476698215175e-07, "epoch": 1.5625, "percentage": 39.06, "elapsed_time": "0:38:03", "remaining_time": "0:59:22"}
{"current_steps": 75, "total_steps": 192, "loss": null, "eval_loss": 0.8493571877479553, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.5625, "percentage": 39.06, "elapsed_time": "0:38:03", "remaining_time": "0:59:22"}
{"current_steps": 80, "total_steps": 192, "loss": 0.4309, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.462755297384099e-07, "epoch": 1.6666666666666665, "percentage": 41.67, "elapsed_time": "0:40:43", "remaining_time": "0:57:00"}
{"current_steps": 80, "total_steps": 192, "loss": null, "eval_loss": 0.846055269241333, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.6666666666666665, "percentage": 41.67, "elapsed_time": "0:40:43", "remaining_time": "0:57:00"}
{"current_steps": 85, "total_steps": 192, "loss": 0.4299, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7088740175034947e-07, "epoch": 1.7708333333333335, "percentage": 44.27, "elapsed_time": "0:43:19", "remaining_time": "0:54:32"}
{"current_steps": 85, "total_steps": 192, "loss": null, "eval_loss": 0.8445951342582703, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.7708333333333335, "percentage": 44.27, "elapsed_time": "0:43:19", "remaining_time": "0:54:32"}
{"current_steps": 90, "total_steps": 192, "loss": 0.4461, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.228102956599465e-07, "epoch": 1.875, "percentage": 46.88, "elapsed_time": "0:45:54", "remaining_time": "0:52:01"}
{"current_steps": 90, "total_steps": 192, "loss": null, "eval_loss": 0.8440027832984924, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.875, "percentage": 46.88, "elapsed_time": "0:45:54", "remaining_time": "0:52:01"}
{"current_steps": 95, "total_steps": 192, "loss": 0.4474, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.279207916081227e-08, "epoch": 1.9791666666666665, "percentage": 49.48, "elapsed_time": "0:48:29", "remaining_time": "0:49:30"}
{"current_steps": 95, "total_steps": 192, "loss": null, "eval_loss": 0.8438854217529297, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.9791666666666665, "percentage": 49.48, "elapsed_time": "0:48:29", "remaining_time": "0:49:30"}
{"current_steps": 100, "total_steps": 192, "loss": 0.3614, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.448002404850094e-08, "epoch": 2.0833333333333335, "percentage": 52.08, "elapsed_time": "0:51:06", "remaining_time": "0:47:00"}
{"current_steps": 100, "total_steps": 192, "loss": null, "eval_loss": 0.8445320725440979, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.0833333333333335, "percentage": 52.08, "elapsed_time": "0:51:06", "remaining_time": "0:47:00"}
{"current_steps": 105, "total_steps": 192, "loss": 0.3861, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.35920070839697e-08, "epoch": 2.1875, "percentage": 54.69, "elapsed_time": "0:53:39", "remaining_time": "0:44:27"}
{"current_steps": 105, "total_steps": 192, "loss": null, "eval_loss": 0.8457441926002502, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.1875, "percentage": 54.69, "elapsed_time": "0:53:39", "remaining_time": "0:44:27"}
{"current_steps": 110, "total_steps": 192, "loss": 0.3829, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.7299804687499997e-08, "epoch": 2.2916666666666665, "percentage": 57.29, "elapsed_time": "0:56:16", "remaining_time": "0:41:57"}
{"current_steps": 110, "total_steps": 192, "loss": null, "eval_loss": 0.847288191318512, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.2916666666666665, "percentage": 57.29, "elapsed_time": "0:56:16", "remaining_time": "0:41:57"}
{"current_steps": 115, "total_steps": 192, "loss": 0.3764, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.37771434967624e-08, "epoch": 2.3958333333333335, "percentage": 59.9, "elapsed_time": "0:58:52", "remaining_time": "0:39:24"}
{"current_steps": 115, "total_steps": 192, "loss": null, "eval_loss": 0.8487641215324402, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.3958333333333335, "percentage": 59.9, "elapsed_time": "0:58:52", "remaining_time": "0:39:24"}
{"current_steps": 120, "total_steps": 192, "loss": 0.3655, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.187403540619925e-08, "epoch": 2.5, "percentage": 62.5, "elapsed_time": "1:01:27", "remaining_time": "0:36:52"}
{"current_steps": 120, "total_steps": 192, "loss": null, "eval_loss": 0.8499611020088196, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.5, "percentage": 62.5, "elapsed_time": "1:01:27", "remaining_time": "0:36:52"}
{"current_steps": 125, "total_steps": 192, "loss": 0.4243, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.088648238966908e-08, "epoch": 2.6041666666666665, "percentage": 65.1, "elapsed_time": "1:04:01", "remaining_time": "0:34:19"}
{"current_steps": 125, "total_steps": 192, "loss": null, "eval_loss": 0.8510637879371643, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.6041666666666665, "percentage": 65.1, "elapsed_time": "1:04:01", "remaining_time": "0:34:19"}
{"current_steps": 130, "total_steps": 192, "loss": 0.3884, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.039701925276604e-08, "epoch": 2.7083333333333335, "percentage": 67.71, "elapsed_time": "1:06:38", "remaining_time": "0:31:46"}
{"current_steps": 130, "total_steps": 192, "loss": null, "eval_loss": 0.8520172238349915, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.7083333333333335, "percentage": 67.71, "elapsed_time": "1:06:38", "remaining_time": "0:31:46"}
{"current_steps": 135, "total_steps": 192, "loss": 0.3634, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0166900048082497e-08, "epoch": 2.8125, "percentage": 70.31, "elapsed_time": "1:09:13", "remaining_time": "0:29:13"}
{"current_steps": 135, "total_steps": 192, "loss": null, "eval_loss": 0.8528143763542175, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.8125, "percentage": 70.31, "elapsed_time": "1:09:13", "remaining_time": "0:29:13"}
{"current_steps": 140, "total_steps": 192, "loss": 0.3846, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0065147322870076e-08, "epoch": 2.9166666666666665, "percentage": 72.92, "elapsed_time": "1:11:49", "remaining_time": "0:26:40"}
{"current_steps": 140, "total_steps": 192, "loss": null, "eval_loss": 0.8537066578865051, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.9166666666666665, "percentage": 72.92, "elapsed_time": "1:11:49", "remaining_time": "0:26:40"}
{"current_steps": 145, "total_steps": 192, "loss": 0.3872, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.002328628528332e-08, "epoch": 3.0208333333333335, "percentage": 75.52, "elapsed_time": "1:14:24", "remaining_time": "0:24:06"}
{"current_steps": 145, "total_steps": 192, "loss": null, "eval_loss": 0.8547406196594238, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.0208333333333335, "percentage": 75.52, "elapsed_time": "1:14:24", "remaining_time": "0:24:06"}
{"current_steps": 150, "total_steps": 192, "loss": 0.3869, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0007484528133236e-08, "epoch": 3.125, "percentage": 78.12, "elapsed_time": "1:17:02", "remaining_time": "0:21:34"}
{"current_steps": 150, "total_steps": 192, "loss": null, "eval_loss": 0.8557960391044617, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.125, "percentage": 78.12, "elapsed_time": "1:17:02", "remaining_time": "0:21:34"}
{"current_steps": 155, "total_steps": 192, "loss": 0.3876, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0002110817570477e-08, "epoch": 3.2291666666666665, "percentage": 80.73, "elapsed_time": "1:19:36", "remaining_time": "0:19:00"}
{"current_steps": 155, "total_steps": 192, "loss": null, "eval_loss": 0.8566272854804993, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.2291666666666665, "percentage": 80.73, "elapsed_time": "1:19:36", "remaining_time": "0:19:00"}
{"current_steps": 160, "total_steps": 192, "loss": 0.3844, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000504842356326e-08, "epoch": 3.3333333333333335, "percentage": 83.33, "elapsed_time": "1:22:13", "remaining_time": "0:16:26"}
{"current_steps": 160, "total_steps": 192, "loss": null, "eval_loss": 0.8572790026664734, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.3333333333333335, "percentage": 83.33, "elapsed_time": "1:22:13", "remaining_time": "0:16:26"}
{"current_steps": 165, "total_steps": 192, "loss": 0.3535, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000009745562451e-08, "epoch": 3.4375, "percentage": 85.94, "elapsed_time": "1:24:48", "remaining_time": "0:13:52"}
{"current_steps": 165, "total_steps": 192, "loss": null, "eval_loss": 0.8578632473945618, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.4375, "percentage": 85.94, "elapsed_time": "1:24:48", "remaining_time": "0:13:52"}
{"current_steps": 170, "total_steps": 192, "loss": 0.3488, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000014077810156e-08, "epoch": 3.5416666666666665, "percentage": 88.54, "elapsed_time": "1:27:24", "remaining_time": "0:11:18"}
{"current_steps": 170, "total_steps": 192, "loss": null, "eval_loss": 0.85884028673172, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.5416666666666665, "percentage": 88.54, "elapsed_time": "1:27:24", "remaining_time": "0:11:18"}
{"current_steps": 175, "total_steps": 192, "loss": 0.3464, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000001343508807e-08, "epoch": 3.6458333333333335, "percentage": 91.15, "elapsed_time": "1:30:00", "remaining_time": "0:08:44"}
{"current_steps": 175, "total_steps": 192, "loss": null, "eval_loss": 0.8598365783691406, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.6458333333333335, "percentage": 91.15, "elapsed_time": "1:30:00", "remaining_time": "0:08:44"}
{"current_steps": 180, "total_steps": 192, "loss": 0.361, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000000006747581e-08, "epoch": 3.75, "percentage": 93.75, "elapsed_time": "1:32:36", "remaining_time": "0:06:10"}
{"current_steps": 180, "total_steps": 192, "loss": null, "eval_loss": 0.8606703877449036, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.75, "percentage": 93.75, "elapsed_time": "1:32:36", "remaining_time": "0:06:10"}
{"current_steps": 185, "total_steps": 192, "loss": 0.3674, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000000001094325e-08, "epoch": 3.8541666666666665, "percentage": 96.35, "elapsed_time": "1:35:11", "remaining_time": "0:03:36"}
{"current_steps": 185, "total_steps": 192, "loss": null, "eval_loss": 0.8611735701560974, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.8541666666666665, "percentage": 96.35, "elapsed_time": "1:35:11", "remaining_time": "0:03:36"}
{"current_steps": 190, "total_steps": 192, "loss": 0.3988, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000000000000139e-08, "epoch": 3.9583333333333335, "percentage": 98.96, "elapsed_time": "1:37:48", "remaining_time": "0:01:01"}
{"current_steps": 190, "total_steps": 192, "loss": null, "eval_loss": 0.8612277507781982, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.9583333333333335, "percentage": 98.96, "elapsed_time": "1:37:48", "remaining_time": "0:01:01"}
{"current_steps": 192, "total_steps": 192, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "1:39:43", "remaining_time": "0:00:00"}
{"current_steps": 3, "total_steps": 3, "loss": null, "eval_loss": 0.8123041987419128, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "1:40:42", "remaining_time": "0:00:00"}