Training in progress, epoch 3

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:064843fdd202f923a17d6b23dfdd83bf1704b4dc40476dd0d973421c42ea4af6
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:f3d4486ead5e47a9a114029b12ff4543c7eeb81b2890e52b677d4b6d9e30c196
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:05e9af8806620d65be64b2c9555838a129c7b0310fcf44bedf667dd258c43fb2
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:fa5168e17cfd0a249022e2854175aaec2a8ded94346662ba672f86bc8a43ef22
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:35bbf4a8a2627505f83d512bbeb6a96732e3e80aea4764c0e9a24df35cbc620e
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:6af0e268c68b4b2102ff5582d74e1bdcffbb0f40b05972e278fe4b12ce53d505
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5593fa10ba8c2eaf4349e7420e4995d40981fc3177768c1e886ba8a4a2369e72
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:541b951dd05c81d8e45884d423786498305ea9b26047a6418558bf60a0ac0fd5
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -3,3 +3,6 @@
 {"current_steps": 20, "total_steps": 48, "loss": 0.7853, "learning_rate": 5e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:11:47", "remaining_time": "0:16:30"}
 {"current_steps": 30, "total_steps": 48, "loss": 0.7293, "learning_rate": 5e-06, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "0:17:07", "remaining_time": "0:10:16"}
 {"current_steps": 32, "total_steps": 48, "eval_loss": 0.7811707258224487, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:18:22", "remaining_time": "0:09:11"}

 {"current_steps": 20, "total_steps": 48, "loss": 0.7853, "learning_rate": 5e-06, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:11:47", "remaining_time": "0:16:30"}
 {"current_steps": 30, "total_steps": 48, "loss": 0.7293, "learning_rate": 5e-06, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "0:17:07", "remaining_time": "0:10:16"}
 {"current_steps": 32, "total_steps": 48, "eval_loss": 0.7811707258224487, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:18:22", "remaining_time": "0:09:11"}
+{"current_steps": 40, "total_steps": 48, "loss": 0.677, "learning_rate": 5e-06, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "0:23:31", "remaining_time": "0:04:42"}
+{"current_steps": 48, "total_steps": 48, "eval_loss": 0.765191376209259, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:28:53", "remaining_time": "0:00:00"}
+{"current_steps": 48, "total_steps": 48, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:29:50", "remaining_time": "0:00:00"}