Rakancorle1
commited on
Commit
•
b62f7b7
1
Parent(s):
5421ea7
Training in progress, step 1500
Browse files
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 42002584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:100738da090b0fc9c43406df36f7954c39510f42e3a1137f5eac1b4fe48a8ebe
|
3 |
size 42002584
|
runs/Dec15_23-48-47_COE-CS-sv003/events.out.tfevents.1734306542.COE-CS-sv003.1994217.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ea9afd6010bc836a711ab3992a824f04a85252669d33c3b45286602246aa71f8
|
3 |
+
size 37088
|
trainer_log.jsonl
CHANGED
@@ -98,3 +98,53 @@
|
|
98 |
{"current_steps": 980, "total_steps": 1875, "loss": 0.259, "lr": 4.6442536626561675e-05, "epoch": 1.568, "percentage": 52.27, "elapsed_time": "2:31:27", "remaining_time": "2:18:19"}
|
99 |
{"current_steps": 990, "total_steps": 1875, "loss": 0.2623, "lr": 4.560744017246284e-05, "epoch": 1.584, "percentage": 52.8, "elapsed_time": "2:32:59", "remaining_time": "2:16:46"}
|
100 |
{"current_steps": 1000, "total_steps": 1875, "loss": 0.2867, "lr": 4.477357683661734e-05, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "2:34:32", "remaining_time": "2:15:13"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
98 |
{"current_steps": 980, "total_steps": 1875, "loss": 0.259, "lr": 4.6442536626561675e-05, "epoch": 1.568, "percentage": 52.27, "elapsed_time": "2:31:27", "remaining_time": "2:18:19"}
|
99 |
{"current_steps": 990, "total_steps": 1875, "loss": 0.2623, "lr": 4.560744017246284e-05, "epoch": 1.584, "percentage": 52.8, "elapsed_time": "2:32:59", "remaining_time": "2:16:46"}
|
100 |
{"current_steps": 1000, "total_steps": 1875, "loss": 0.2867, "lr": 4.477357683661734e-05, "epoch": 1.6, "percentage": 53.33, "elapsed_time": "2:34:32", "remaining_time": "2:15:13"}
|
101 |
+
{"current_steps": 1010, "total_steps": 1875, "loss": 0.2851, "lr": 4.394118070851749e-05, "epoch": 1.616, "percentage": 53.87, "elapsed_time": "2:36:12", "remaining_time": "2:13:47"}
|
102 |
+
{"current_steps": 1020, "total_steps": 1875, "loss": 0.269, "lr": 4.31104854657681e-05, "epoch": 1.6320000000000001, "percentage": 54.4, "elapsed_time": "2:37:44", "remaining_time": "2:12:13"}
|
103 |
+
{"current_steps": 1030, "total_steps": 1875, "loss": 0.2526, "lr": 4.228172430848644e-05, "epoch": 1.6480000000000001, "percentage": 54.93, "elapsed_time": "2:39:16", "remaining_time": "2:10:39"}
|
104 |
+
{"current_steps": 1040, "total_steps": 1875, "loss": 0.2788, "lr": 4.1455129893836174e-05, "epoch": 1.6640000000000001, "percentage": 55.47, "elapsed_time": "2:40:48", "remaining_time": "2:09:06"}
|
105 |
+
{"current_steps": 1050, "total_steps": 1875, "loss": 0.2439, "lr": 4.063093427071376e-05, "epoch": 1.6800000000000002, "percentage": 56.0, "elapsed_time": "2:42:19", "remaining_time": "2:07:32"}
|
106 |
+
{"current_steps": 1060, "total_steps": 1875, "loss": 0.2701, "lr": 3.9809368814605766e-05, "epoch": 1.696, "percentage": 56.53, "elapsed_time": "2:43:51", "remaining_time": "2:05:59"}
|
107 |
+
{"current_steps": 1070, "total_steps": 1875, "loss": 0.2665, "lr": 3.899066416263493e-05, "epoch": 1.712, "percentage": 57.07, "elapsed_time": "2:45:23", "remaining_time": "2:04:25"}
|
108 |
+
{"current_steps": 1080, "total_steps": 1875, "loss": 0.3048, "lr": 3.817505014881378e-05, "epoch": 1.728, "percentage": 57.6, "elapsed_time": "2:46:54", "remaining_time": "2:02:52"}
|
109 |
+
{"current_steps": 1090, "total_steps": 1875, "loss": 0.2298, "lr": 3.736275573952354e-05, "epoch": 1.744, "percentage": 58.13, "elapsed_time": "2:48:26", "remaining_time": "2:01:18"}
|
110 |
+
{"current_steps": 1100, "total_steps": 1875, "loss": 0.2568, "lr": 3.655400896923672e-05, "epoch": 1.76, "percentage": 58.67, "elapsed_time": "2:49:58", "remaining_time": "1:59:45"}
|
111 |
+
{"current_steps": 1110, "total_steps": 1875, "loss": 0.2685, "lr": 3.5749036876501194e-05, "epoch": 1.776, "percentage": 59.2, "elapsed_time": "2:51:30", "remaining_time": "1:58:11"}
|
112 |
+
{"current_steps": 1120, "total_steps": 1875, "loss": 0.2675, "lr": 3.494806544020398e-05, "epoch": 1.792, "percentage": 59.73, "elapsed_time": "2:53:01", "remaining_time": "1:56:38"}
|
113 |
+
{"current_steps": 1130, "total_steps": 1875, "loss": 0.2539, "lr": 3.4151319516132416e-05, "epoch": 1.808, "percentage": 60.27, "elapsed_time": "2:54:33", "remaining_time": "1:55:05"}
|
114 |
+
{"current_steps": 1140, "total_steps": 1875, "loss": 0.26, "lr": 3.335902277385067e-05, "epoch": 1.8239999999999998, "percentage": 60.8, "elapsed_time": "2:56:05", "remaining_time": "1:53:32"}
|
115 |
+
{"current_steps": 1150, "total_steps": 1875, "loss": 0.262, "lr": 3.257139763390925e-05, "epoch": 1.8399999999999999, "percentage": 61.33, "elapsed_time": "2:57:37", "remaining_time": "1:51:58"}
|
116 |
+
{"current_steps": 1160, "total_steps": 1875, "loss": 0.2381, "lr": 3.178866520540509e-05, "epoch": 1.8559999999999999, "percentage": 61.87, "elapsed_time": "2:59:09", "remaining_time": "1:50:25"}
|
117 |
+
{"current_steps": 1170, "total_steps": 1875, "loss": 0.2682, "lr": 3.101104522390995e-05, "epoch": 1.8719999999999999, "percentage": 62.4, "elapsed_time": "3:00:40", "remaining_time": "1:48:52"}
|
118 |
+
{"current_steps": 1180, "total_steps": 1875, "loss": 0.2902, "lr": 3.023875598978419e-05, "epoch": 1.888, "percentage": 62.93, "elapsed_time": "3:02:12", "remaining_time": "1:47:19"}
|
119 |
+
{"current_steps": 1190, "total_steps": 1875, "loss": 0.2624, "lr": 2.9472014306893603e-05, "epoch": 1.904, "percentage": 63.47, "elapsed_time": "3:03:44", "remaining_time": "1:45:45"}
|
120 |
+
{"current_steps": 1200, "total_steps": 1875, "loss": 0.2686, "lr": 2.8711035421746367e-05, "epoch": 1.92, "percentage": 64.0, "elapsed_time": "3:05:15", "remaining_time": "1:44:12"}
|
121 |
+
{"current_steps": 1210, "total_steps": 1875, "loss": 0.2443, "lr": 2.795603296306708e-05, "epoch": 1.936, "percentage": 64.53, "elapsed_time": "3:06:47", "remaining_time": "1:42:39"}
|
122 |
+
{"current_steps": 1220, "total_steps": 1875, "loss": 0.2752, "lr": 2.7207218881825014e-05, "epoch": 1.952, "percentage": 65.07, "elapsed_time": "3:08:19", "remaining_time": "1:41:06"}
|
123 |
+
{"current_steps": 1230, "total_steps": 1875, "loss": 0.3108, "lr": 2.6464803391733374e-05, "epoch": 1.968, "percentage": 65.6, "elapsed_time": "3:09:51", "remaining_time": "1:39:33"}
|
124 |
+
{"current_steps": 1240, "total_steps": 1875, "loss": 0.2517, "lr": 2.5728994910236304e-05, "epoch": 1.984, "percentage": 66.13, "elapsed_time": "3:11:22", "remaining_time": "1:38:00"}
|
125 |
+
{"current_steps": 1250, "total_steps": 1875, "loss": 0.2494, "lr": 2.500000000000001e-05, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:12:54", "remaining_time": "1:36:27"}
|
126 |
+
{"current_steps": 1260, "total_steps": 1875, "loss": 0.2276, "lr": 2.4278023310924673e-05, "epoch": 2.016, "percentage": 67.2, "elapsed_time": "3:14:26", "remaining_time": "1:34:54"}
|
127 |
+
{"current_steps": 1270, "total_steps": 1875, "loss": 0.2145, "lr": 2.3563267522693415e-05, "epoch": 2.032, "percentage": 67.73, "elapsed_time": "3:15:57", "remaining_time": "1:33:21"}
|
128 |
+
{"current_steps": 1280, "total_steps": 1875, "loss": 0.1993, "lr": 2.2855933287874138e-05, "epoch": 2.048, "percentage": 68.27, "elapsed_time": "3:17:29", "remaining_time": "1:31:48"}
|
129 |
+
{"current_steps": 1290, "total_steps": 1875, "loss": 0.2402, "lr": 2.215621917559062e-05, "epoch": 2.064, "percentage": 68.8, "elapsed_time": "3:19:00", "remaining_time": "1:30:15"}
|
130 |
+
{"current_steps": 1300, "total_steps": 1875, "loss": 0.198, "lr": 2.1464321615778422e-05, "epoch": 2.08, "percentage": 69.33, "elapsed_time": "3:20:32", "remaining_time": "1:28:42"}
|
131 |
+
{"current_steps": 1310, "total_steps": 1875, "loss": 0.1847, "lr": 2.07804348440414e-05, "epoch": 2.096, "percentage": 69.87, "elapsed_time": "3:22:04", "remaining_time": "1:27:09"}
|
132 |
+
{"current_steps": 1320, "total_steps": 1875, "loss": 0.2217, "lr": 2.0104750847124075e-05, "epoch": 2.112, "percentage": 70.4, "elapsed_time": "3:23:36", "remaining_time": "1:25:36"}
|
133 |
+
{"current_steps": 1330, "total_steps": 1875, "loss": 0.219, "lr": 1.9437459309015427e-05, "epoch": 2.128, "percentage": 70.93, "elapsed_time": "3:25:07", "remaining_time": "1:24:03"}
|
134 |
+
{"current_steps": 1340, "total_steps": 1875, "loss": 0.2219, "lr": 1.8778747557699224e-05, "epoch": 2.144, "percentage": 71.47, "elapsed_time": "3:26:39", "remaining_time": "1:22:30"}
|
135 |
+
{"current_steps": 1350, "total_steps": 1875, "loss": 0.2043, "lr": 1.8128800512565513e-05, "epoch": 2.16, "percentage": 72.0, "elapsed_time": "3:28:11", "remaining_time": "1:20:57"}
|
136 |
+
{"current_steps": 1360, "total_steps": 1875, "loss": 0.1848, "lr": 1.7487800632498545e-05, "epoch": 2.176, "percentage": 72.53, "elapsed_time": "3:29:42", "remaining_time": "1:19:24"}
|
137 |
+
{"current_steps": 1370, "total_steps": 1875, "loss": 0.2063, "lr": 1.685592786465524e-05, "epoch": 2.192, "percentage": 73.07, "elapsed_time": "3:31:14", "remaining_time": "1:17:51"}
|
138 |
+
{"current_steps": 1380, "total_steps": 1875, "loss": 0.203, "lr": 1.6233359593948777e-05, "epoch": 2.208, "percentage": 73.6, "elapsed_time": "3:32:46", "remaining_time": "1:16:19"}
|
139 |
+
{"current_steps": 1390, "total_steps": 1875, "loss": 0.1998, "lr": 1.5620270593251635e-05, "epoch": 2.224, "percentage": 74.13, "elapsed_time": "3:34:17", "remaining_time": "1:14:46"}
|
140 |
+
{"current_steps": 1400, "total_steps": 1875, "loss": 0.2029, "lr": 1.5016832974331724e-05, "epoch": 2.24, "percentage": 74.67, "elapsed_time": "3:35:49", "remaining_time": "1:13:13"}
|
141 |
+
{"current_steps": 1410, "total_steps": 1875, "loss": 0.1829, "lr": 1.4423216139535734e-05, "epoch": 2.2560000000000002, "percentage": 75.2, "elapsed_time": "3:37:21", "remaining_time": "1:11:40"}
|
142 |
+
{"current_steps": 1420, "total_steps": 1875, "loss": 0.2131, "lr": 1.3839586734232906e-05, "epoch": 2.2720000000000002, "percentage": 75.73, "elapsed_time": "3:38:53", "remaining_time": "1:10:08"}
|
143 |
+
{"current_steps": 1430, "total_steps": 1875, "loss": 0.2099, "lr": 1.3266108600032929e-05, "epoch": 2.288, "percentage": 76.27, "elapsed_time": "3:40:25", "remaining_time": "1:08:35"}
|
144 |
+
{"current_steps": 1440, "total_steps": 1875, "loss": 0.203, "lr": 1.2702942728790895e-05, "epoch": 2.304, "percentage": 76.8, "elapsed_time": "3:41:56", "remaining_time": "1:07:02"}
|
145 |
+
{"current_steps": 1450, "total_steps": 1875, "loss": 0.2154, "lr": 1.2150247217412186e-05, "epoch": 2.32, "percentage": 77.33, "elapsed_time": "3:43:28", "remaining_time": "1:05:30"}
|
146 |
+
{"current_steps": 1460, "total_steps": 1875, "loss": 0.1994, "lr": 1.160817722347014e-05, "epoch": 2.336, "percentage": 77.87, "elapsed_time": "3:44:59", "remaining_time": "1:03:57"}
|
147 |
+
{"current_steps": 1470, "total_steps": 1875, "loss": 0.2255, "lr": 1.1076884921648834e-05, "epoch": 2.352, "percentage": 78.4, "elapsed_time": "3:46:31", "remaining_time": "1:02:24"}
|
148 |
+
{"current_steps": 1480, "total_steps": 1875, "loss": 0.2216, "lr": 1.0556519461023301e-05, "epoch": 2.368, "percentage": 78.93, "elapsed_time": "3:48:03", "remaining_time": "1:00:51"}
|
149 |
+
{"current_steps": 1490, "total_steps": 1875, "loss": 0.1979, "lr": 1.0047226923189024e-05, "epoch": 2.384, "percentage": 79.47, "elapsed_time": "3:49:35", "remaining_time": "0:59:19"}
|
150 |
+
{"current_steps": 1500, "total_steps": 1875, "loss": 0.2081, "lr": 9.549150281252633e-06, "epoch": 2.4, "percentage": 80.0, "elapsed_time": "3:51:07", "remaining_time": "0:57:46"}
|