Gemma-2-9B-It-SFT / trainer_log.jsonl
chchen's picture
Training in progress, step 168
c8a49ca verified
raw
history blame
3.4 kB
{"current_steps": 10, "total_steps": 168, "loss": 2.8371, "learning_rate": 2.9411764705882355e-06, "epoch": 0.17777777777777778, "percentage": 5.95, "elapsed_time": "0:00:37", "remaining_time": "0:09:52"}
{"current_steps": 20, "total_steps": 168, "loss": 2.5866, "learning_rate": 4.995131923687488e-06, "epoch": 0.35555555555555557, "percentage": 11.9, "elapsed_time": "0:01:13", "remaining_time": "0:09:06"}
{"current_steps": 30, "total_steps": 168, "loss": 2.1317, "learning_rate": 4.90911473983908e-06, "epoch": 0.5333333333333333, "percentage": 17.86, "elapsed_time": "0:01:50", "remaining_time": "0:08:28"}
{"current_steps": 40, "total_steps": 168, "loss": 1.6483, "learning_rate": 4.71919261421297e-06, "epoch": 0.7111111111111111, "percentage": 23.81, "elapsed_time": "0:02:27", "remaining_time": "0:07:50"}
{"current_steps": 50, "total_steps": 168, "loss": 1.258, "learning_rate": 4.43355687413747e-06, "epoch": 0.8888888888888888, "percentage": 29.76, "elapsed_time": "0:03:03", "remaining_time": "0:07:12"}
{"current_steps": 60, "total_steps": 168, "loss": 0.9961, "learning_rate": 4.064526968101844e-06, "epoch": 1.0666666666666667, "percentage": 35.71, "elapsed_time": "0:03:39", "remaining_time": "0:06:35"}
{"current_steps": 70, "total_steps": 168, "loss": 0.6742, "learning_rate": 3.6280191288478437e-06, "epoch": 1.2444444444444445, "percentage": 41.67, "elapsed_time": "0:04:16", "remaining_time": "0:05:58"}
{"current_steps": 80, "total_steps": 168, "loss": 0.4521, "learning_rate": 3.142859907420615e-06, "epoch": 1.4222222222222223, "percentage": 47.62, "elapsed_time": "0:04:52", "remaining_time": "0:05:21"}
{"current_steps": 90, "total_steps": 168, "loss": 0.3905, "learning_rate": 2.629974185404951e-06, "epoch": 1.6, "percentage": 53.57, "elapsed_time": "0:05:28", "remaining_time": "0:04:44"}
{"current_steps": 100, "total_steps": 168, "loss": 0.2197, "learning_rate": 2.1114826863194882e-06, "epoch": 1.7777777777777777, "percentage": 59.52, "elapsed_time": "0:06:04", "remaining_time": "0:04:08"}
{"current_steps": 110, "total_steps": 168, "loss": 0.235, "learning_rate": 1.6097479104361328e-06, "epoch": 1.9555555555555557, "percentage": 65.48, "elapsed_time": "0:06:40", "remaining_time": "0:03:31"}
{"current_steps": 120, "total_steps": 168, "loss": 0.177, "learning_rate": 1.1464096417858821e-06, "epoch": 2.1333333333333333, "percentage": 71.43, "elapsed_time": "0:07:17", "remaining_time": "0:02:54"}
{"current_steps": 130, "total_steps": 168, "loss": 0.1756, "learning_rate": 7.414516258630245e-07, "epoch": 2.311111111111111, "percentage": 77.38, "elapsed_time": "0:07:53", "remaining_time": "0:02:18"}
{"current_steps": 140, "total_steps": 168, "loss": 0.1916, "learning_rate": 4.123396721497977e-07, "epoch": 2.488888888888889, "percentage": 83.33, "elapsed_time": "0:08:29", "remaining_time": "0:01:41"}
{"current_steps": 150, "total_steps": 168, "loss": 0.1296, "learning_rate": 1.7326835503629542e-07, "epoch": 2.6666666666666665, "percentage": 89.29, "elapsed_time": "0:09:05", "remaining_time": "0:01:05"}
{"current_steps": 160, "total_steps": 168, "loss": 0.1469, "learning_rate": 3.4548802869627806e-08, "epoch": 2.8444444444444446, "percentage": 95.24, "elapsed_time": "0:09:41", "remaining_time": "0:00:29"}
{"current_steps": 168, "total_steps": 168, "epoch": 2.986666666666667, "percentage": 100.0, "elapsed_time": "0:10:12", "remaining_time": "0:00:00"}