esfrankel17
committed on
Commit
•
ae9846b
1
Parent(s):
3119434
Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76f9d1b113ac6306fe1f7cff1e7eaf0cd199642d3456726c7de30b843997c500
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea75547d43f74d420897b2e70f75133c5f1f1fee187bb5277213be1dd229c0dc
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95fc91e1dd89cc48d865d81c6a14cc8b9837fe63e9b50c160d64c10f3b427bde
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecf865bbbd3d1e6d4abb3b5b23ac05fdf477c81c145ccc082258c0e7499527eb
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -10,3 +10,15 @@
|
|
10 |
{"current_steps": 100, "total_steps": 321, "loss": 0.6853, "learning_rate": 5e-06, "epoch": 0.9313154831199069, "percentage": 31.15, "elapsed_time": "0:51:26", "remaining_time": "1:53:41"}
|
11 |
{"current_steps": 107, "total_steps": 321, "eval_loss": 0.6684155464172363, "epoch": 0.9965075669383003, "percentage": 33.33, "elapsed_time": "0:56:25", "remaining_time": "1:52:50"}
|
12 |
{"current_steps": 110, "total_steps": 321, "loss": 0.7062, "learning_rate": 5e-06, "epoch": 1.0244470314318976, "percentage": 34.27, "elapsed_time": "0:58:46", "remaining_time": "1:52:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
{"current_steps": 100, "total_steps": 321, "loss": 0.6853, "learning_rate": 5e-06, "epoch": 0.9313154831199069, "percentage": 31.15, "elapsed_time": "0:51:26", "remaining_time": "1:53:41"}
|
11 |
{"current_steps": 107, "total_steps": 321, "eval_loss": 0.6684155464172363, "epoch": 0.9965075669383003, "percentage": 33.33, "elapsed_time": "0:56:25", "remaining_time": "1:52:50"}
|
12 |
{"current_steps": 110, "total_steps": 321, "loss": 0.7062, "learning_rate": 5e-06, "epoch": 1.0244470314318976, "percentage": 34.27, "elapsed_time": "0:58:46", "remaining_time": "1:52:43"}
|
13 |
+
{"current_steps": 120, "total_steps": 321, "loss": 0.6098, "learning_rate": 5e-06, "epoch": 1.1175785797438882, "percentage": 37.38, "elapsed_time": "1:03:54", "remaining_time": "1:47:03"}
|
14 |
+
{"current_steps": 130, "total_steps": 321, "loss": 0.6019, "learning_rate": 5e-06, "epoch": 1.210710128055879, "percentage": 40.5, "elapsed_time": "1:09:01", "remaining_time": "1:41:24"}
|
15 |
+
{"current_steps": 140, "total_steps": 321, "loss": 0.6043, "learning_rate": 5e-06, "epoch": 1.3038416763678695, "percentage": 43.61, "elapsed_time": "1:14:10", "remaining_time": "1:35:53"}
|
16 |
+
{"current_steps": 150, "total_steps": 321, "loss": 0.6023, "learning_rate": 5e-06, "epoch": 1.3969732246798603, "percentage": 46.73, "elapsed_time": "1:19:18", "remaining_time": "1:30:24"}
|
17 |
+
{"current_steps": 160, "total_steps": 321, "loss": 0.6021, "learning_rate": 5e-06, "epoch": 1.490104772991851, "percentage": 49.84, "elapsed_time": "1:24:27", "remaining_time": "1:24:59"}
|
18 |
+
{"current_steps": 170, "total_steps": 321, "loss": 0.6002, "learning_rate": 5e-06, "epoch": 1.5832363213038416, "percentage": 52.96, "elapsed_time": "1:29:34", "remaining_time": "1:19:33"}
|
19 |
+
{"current_steps": 180, "total_steps": 321, "loss": 0.5935, "learning_rate": 5e-06, "epoch": 1.6763678696158324, "percentage": 56.07, "elapsed_time": "1:34:41", "remaining_time": "1:14:10"}
|
20 |
+
{"current_steps": 190, "total_steps": 321, "loss": 0.589, "learning_rate": 5e-06, "epoch": 1.7694994179278232, "percentage": 59.19, "elapsed_time": "1:39:50", "remaining_time": "1:08:50"}
|
21 |
+
{"current_steps": 200, "total_steps": 321, "loss": 0.5954, "learning_rate": 5e-06, "epoch": 1.8626309662398137, "percentage": 62.31, "elapsed_time": "1:44:57", "remaining_time": "1:03:30"}
|
22 |
+
{"current_steps": 210, "total_steps": 321, "loss": 0.591, "learning_rate": 5e-06, "epoch": 1.9557625145518043, "percentage": 65.42, "elapsed_time": "1:50:05", "remaining_time": "0:58:11"}
|
23 |
+
{"current_steps": 214, "total_steps": 321, "eval_loss": 0.6565061807632446, "epoch": 1.9930151338766007, "percentage": 66.67, "elapsed_time": "1:53:44", "remaining_time": "0:56:52"}
|
24 |
+
{"current_steps": 220, "total_steps": 321, "loss": 0.5986, "learning_rate": 5e-06, "epoch": 2.0488940628637953, "percentage": 68.54, "elapsed_time": "1:57:39", "remaining_time": "0:54:00"}
|