Rakancorle1
commited on
Commit
•
14dce9b
1
Parent(s):
f588c0f
Training in progress, step 2500
Browse files
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 42002584
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1574cad090827b614d1a03e4f742d066a93c4c282377ab48aa72cc55e1320a0
|
3 |
size 42002584
|
runs/Dec07_20-21-29_COE-CS-sv003/events.out.tfevents.1733602903.COE-CS-sv003.1598906.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6869e0028ab9968b77957dd6ee02303ef43a98ed65ea37dc2aa20549498c9a71
|
3 |
+
size 58176
|
trainer_log.jsonl
CHANGED
@@ -198,3 +198,53 @@
|
|
198 |
{"current_steps": 1980, "total_steps": 3543, "loss": 0.318, "lr": 4.080867881544826e-05, "epoch": 1.6761904761904762, "percentage": 55.88, "elapsed_time": "5:01:50", "remaining_time": "3:58:16"}
|
199 |
{"current_steps": 1990, "total_steps": 3543, "loss": 0.3076, "lr": 4.037324908737909e-05, "epoch": 1.6846560846560847, "percentage": 56.17, "elapsed_time": "5:03:21", "remaining_time": "3:56:44"}
|
200 |
{"current_steps": 2000, "total_steps": 3543, "loss": 0.3052, "lr": 3.9938576252033256e-05, "epoch": 1.693121693121693, "percentage": 56.45, "elapsed_time": "5:04:52", "remaining_time": "3:55:12"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
198 |
{"current_steps": 1980, "total_steps": 3543, "loss": 0.318, "lr": 4.080867881544826e-05, "epoch": 1.6761904761904762, "percentage": 55.88, "elapsed_time": "5:01:50", "remaining_time": "3:58:16"}
|
199 |
{"current_steps": 1990, "total_steps": 3543, "loss": 0.3076, "lr": 4.037324908737909e-05, "epoch": 1.6846560846560847, "percentage": 56.17, "elapsed_time": "5:03:21", "remaining_time": "3:56:44"}
|
200 |
{"current_steps": 2000, "total_steps": 3543, "loss": 0.3052, "lr": 3.9938576252033256e-05, "epoch": 1.693121693121693, "percentage": 56.45, "elapsed_time": "5:04:52", "remaining_time": "3:55:12"}
|
201 |
+
{"current_steps": 2010, "total_steps": 3543, "loss": 0.3095, "lr": 3.950469448508532e-05, "epoch": 1.7015873015873015, "percentage": 56.73, "elapsed_time": "5:06:31", "remaining_time": "3:53:46"}
|
202 |
+
{"current_steps": 2020, "total_steps": 3543, "loss": 0.3246, "lr": 3.907163790001292e-05, "epoch": 1.71005291005291, "percentage": 57.01, "elapsed_time": "5:08:02", "remaining_time": "3:52:15"}
|
203 |
+
{"current_steps": 2030, "total_steps": 3543, "loss": 0.3148, "lr": 3.863944054541474e-05, "epoch": 1.7185185185185186, "percentage": 57.3, "elapsed_time": "5:09:34", "remaining_time": "3:50:43"}
|
204 |
+
{"current_steps": 2040, "total_steps": 3543, "loss": 0.3256, "lr": 3.8208136402333314e-05, "epoch": 1.726984126984127, "percentage": 57.58, "elapsed_time": "5:11:05", "remaining_time": "3:49:12"}
|
205 |
+
{"current_steps": 2050, "total_steps": 3543, "loss": 0.2897, "lr": 3.7777759381583495e-05, "epoch": 1.7354497354497354, "percentage": 57.86, "elapsed_time": "5:12:37", "remaining_time": "3:47:40"}
|
206 |
+
{"current_steps": 2060, "total_steps": 3543, "loss": 0.3051, "lr": 3.73483433210861e-05, "epoch": 1.7439153439153439, "percentage": 58.14, "elapsed_time": "5:14:08", "remaining_time": "3:46:09"}
|
207 |
+
{"current_steps": 2070, "total_steps": 3543, "loss": 0.3165, "lr": 3.691992198320753e-05, "epoch": 1.7523809523809524, "percentage": 58.43, "elapsed_time": "5:15:39", "remaining_time": "3:44:37"}
|
208 |
+
{"current_steps": 2080, "total_steps": 3543, "loss": 0.2911, "lr": 3.649252905210519e-05, "epoch": 1.7608465608465609, "percentage": 58.71, "elapsed_time": "5:17:11", "remaining_time": "3:43:06"}
|
209 |
+
{"current_steps": 2090, "total_steps": 3543, "loss": 0.3129, "lr": 3.6066198131079146e-05, "epoch": 1.7693121693121694, "percentage": 58.99, "elapsed_time": "5:18:43", "remaining_time": "3:41:34"}
|
210 |
+
{"current_steps": 2100, "total_steps": 3543, "loss": 0.313, "lr": 3.564096273993012e-05, "epoch": 1.7777777777777777, "percentage": 59.27, "elapsed_time": "5:20:14", "remaining_time": "3:40:03"}
|
211 |
+
{"current_steps": 2110, "total_steps": 3543, "loss": 0.3202, "lr": 3.521685631232392e-05, "epoch": 1.7862433862433862, "percentage": 59.55, "elapsed_time": "5:21:46", "remaining_time": "3:38:31"}
|
212 |
+
{"current_steps": 2120, "total_steps": 3543, "loss": 0.3058, "lr": 3.479391219316291e-05, "epoch": 1.7947089947089947, "percentage": 59.84, "elapsed_time": "5:23:18", "remaining_time": "3:37:00"}
|
213 |
+
{"current_steps": 2130, "total_steps": 3543, "loss": 0.3192, "lr": 3.437216363596418e-05, "epoch": 1.8031746031746032, "percentage": 60.12, "elapsed_time": "5:24:49", "remaining_time": "3:35:28"}
|
214 |
+
{"current_steps": 2140, "total_steps": 3543, "loss": 0.3239, "lr": 3.395164380024512e-05, "epoch": 1.8116402116402117, "percentage": 60.4, "elapsed_time": "5:26:20", "remaining_time": "3:33:57"}
|
215 |
+
{"current_steps": 2150, "total_steps": 3543, "loss": 0.3229, "lr": 3.3532385748916164e-05, "epoch": 1.82010582010582, "percentage": 60.68, "elapsed_time": "5:27:52", "remaining_time": "3:32:25"}
|
216 |
+
{"current_steps": 2160, "total_steps": 3543, "loss": 0.3136, "lr": 3.3114422445681425e-05, "epoch": 1.8285714285714287, "percentage": 60.97, "elapsed_time": "5:29:23", "remaining_time": "3:30:54"}
|
217 |
+
{"current_steps": 2170, "total_steps": 3543, "loss": 0.2882, "lr": 3.269778675244684e-05, "epoch": 1.837037037037037, "percentage": 61.25, "elapsed_time": "5:30:55", "remaining_time": "3:29:22"}
|
218 |
+
{"current_steps": 2180, "total_steps": 3543, "loss": 0.295, "lr": 3.22825114267364e-05, "epoch": 1.8455026455026455, "percentage": 61.53, "elapsed_time": "5:32:26", "remaining_time": "3:27:51"}
|
219 |
+
{"current_steps": 2190, "total_steps": 3543, "loss": 0.3176, "lr": 3.1868629119116794e-05, "epoch": 1.853968253968254, "percentage": 61.81, "elapsed_time": "5:33:58", "remaining_time": "3:26:19"}
|
220 |
+
{"current_steps": 2200, "total_steps": 3543, "loss": 0.3324, "lr": 3.1456172370630124e-05, "epoch": 1.8624338624338623, "percentage": 62.09, "elapsed_time": "5:35:30", "remaining_time": "3:24:48"}
|
221 |
+
{"current_steps": 2210, "total_steps": 3543, "loss": 0.3091, "lr": 3.10451736102355e-05, "epoch": 1.870899470899471, "percentage": 62.38, "elapsed_time": "5:37:01", "remaining_time": "3:23:17"}
|
222 |
+
{"current_steps": 2220, "total_steps": 3543, "loss": 0.2955, "lr": 3.0635665152259295e-05, "epoch": 1.8793650793650793, "percentage": 62.66, "elapsed_time": "5:38:33", "remaining_time": "3:21:45"}
|
223 |
+
{"current_steps": 2230, "total_steps": 3543, "loss": 0.3195, "lr": 3.0227679193854513e-05, "epoch": 1.8878306878306879, "percentage": 62.94, "elapsed_time": "5:40:04", "remaining_time": "3:20:14"}
|
224 |
+
{"current_steps": 2240, "total_steps": 3543, "loss": 0.3039, "lr": 2.982124781246932e-05, "epoch": 1.8962962962962964, "percentage": 63.22, "elapsed_time": "5:41:36", "remaining_time": "3:18:42"}
|
225 |
+
{"current_steps": 2250, "total_steps": 3543, "loss": 0.2742, "lr": 2.9416402963324896e-05, "epoch": 1.9047619047619047, "percentage": 63.51, "elapsed_time": "5:43:07", "remaining_time": "3:17:10"}
|
226 |
+
{"current_steps": 2260, "total_steps": 3543, "loss": 0.3048, "lr": 2.9013176476903147e-05, "epoch": 1.9132275132275134, "percentage": 63.79, "elapsed_time": "5:44:38", "remaining_time": "3:15:39"}
|
227 |
+
{"current_steps": 2270, "total_steps": 3543, "loss": 0.3206, "lr": 2.8611600056443944e-05, "epoch": 1.9216931216931217, "percentage": 64.07, "elapsed_time": "5:46:09", "remaining_time": "3:14:07"}
|
228 |
+
{"current_steps": 2280, "total_steps": 3543, "loss": 0.2952, "lr": 2.821170527545254e-05, "epoch": 1.9301587301587302, "percentage": 64.35, "elapsed_time": "5:47:40", "remaining_time": "3:12:35"}
|
229 |
+
{"current_steps": 2290, "total_steps": 3543, "loss": 0.3037, "lr": 2.7813523575217103e-05, "epoch": 1.9386243386243387, "percentage": 64.63, "elapsed_time": "5:49:12", "remaining_time": "3:11:04"}
|
230 |
+
{"current_steps": 2300, "total_steps": 3543, "loss": 0.3054, "lr": 2.7417086262336777e-05, "epoch": 1.947089947089947, "percentage": 64.92, "elapsed_time": "5:50:43", "remaining_time": "3:09:32"}
|
231 |
+
{"current_steps": 2310, "total_steps": 3543, "loss": 0.3161, "lr": 2.7022424506260113e-05, "epoch": 1.9555555555555557, "percentage": 65.2, "elapsed_time": "5:52:14", "remaining_time": "3:08:00"}
|
232 |
+
{"current_steps": 2320, "total_steps": 3543, "loss": 0.3171, "lr": 2.662956933683443e-05, "epoch": 1.964021164021164, "percentage": 65.48, "elapsed_time": "5:53:45", "remaining_time": "3:06:28"}
|
233 |
+
{"current_steps": 2330, "total_steps": 3543, "loss": 0.2773, "lr": 2.623855164186625e-05, "epoch": 1.9724867724867725, "percentage": 65.76, "elapsed_time": "5:55:16", "remaining_time": "3:04:57"}
|
234 |
+
{"current_steps": 2340, "total_steps": 3543, "loss": 0.3122, "lr": 2.5849402164692593e-05, "epoch": 1.980952380952381, "percentage": 66.05, "elapsed_time": "5:56:47", "remaining_time": "3:03:25"}
|
235 |
+
{"current_steps": 2350, "total_steps": 3543, "loss": 0.3002, "lr": 2.546215150176394e-05, "epoch": 1.9894179894179893, "percentage": 66.33, "elapsed_time": "5:58:18", "remaining_time": "3:01:53"}
|
236 |
+
{"current_steps": 2360, "total_steps": 3543, "loss": 0.3006, "lr": 2.507683010023857e-05, "epoch": 1.997883597883598, "percentage": 66.61, "elapsed_time": "5:59:49", "remaining_time": "3:00:22"}
|
237 |
+
{"current_steps": 2370, "total_steps": 3543, "loss": 0.2681, "lr": 2.4693468255588752e-05, "epoch": 2.0063492063492063, "percentage": 66.89, "elapsed_time": "6:01:20", "remaining_time": "2:58:50"}
|
238 |
+
{"current_steps": 2380, "total_steps": 3543, "loss": 0.2509, "lr": 2.4312096109218684e-05, "epoch": 2.0148148148148146, "percentage": 67.17, "elapsed_time": "6:02:51", "remaining_time": "2:57:18"}
|
239 |
+
{"current_steps": 2390, "total_steps": 3543, "loss": 0.2495, "lr": 2.3932743646094736e-05, "epoch": 2.0232804232804233, "percentage": 67.46, "elapsed_time": "6:04:22", "remaining_time": "2:55:47"}
|
240 |
+
{"current_steps": 2400, "total_steps": 3543, "loss": 0.2394, "lr": 2.3555440692387947e-05, "epoch": 2.0317460317460316, "percentage": 67.74, "elapsed_time": "6:05:53", "remaining_time": "2:54:15"}
|
241 |
+
{"current_steps": 2410, "total_steps": 3543, "loss": 0.2344, "lr": 2.3180216913128872e-05, "epoch": 2.0402116402116404, "percentage": 68.02, "elapsed_time": "6:07:24", "remaining_time": "2:52:43"}
|
242 |
+
{"current_steps": 2420, "total_steps": 3543, "loss": 0.243, "lr": 2.2807101809875275e-05, "epoch": 2.0486772486772487, "percentage": 68.3, "elapsed_time": "6:08:55", "remaining_time": "2:51:12"}
|
243 |
+
{"current_steps": 2430, "total_steps": 3543, "loss": 0.248, "lr": 2.2436124718392565e-05, "epoch": 2.057142857142857, "percentage": 68.59, "elapsed_time": "6:10:26", "remaining_time": "2:49:40"}
|
244 |
+
{"current_steps": 2440, "total_steps": 3543, "loss": 0.2434, "lr": 2.206731480634739e-05, "epoch": 2.0656084656084657, "percentage": 68.87, "elapsed_time": "6:11:57", "remaining_time": "2:48:08"}
|
245 |
+
{"current_steps": 2450, "total_steps": 3543, "loss": 0.2417, "lr": 2.1700701071014222e-05, "epoch": 2.074074074074074, "percentage": 69.15, "elapsed_time": "6:13:28", "remaining_time": "2:46:37"}
|
246 |
+
{"current_steps": 2460, "total_steps": 3543, "loss": 0.2402, "lr": 2.1336312336995572e-05, "epoch": 2.0825396825396827, "percentage": 69.43, "elapsed_time": "6:14:59", "remaining_time": "2:45:05"}
|
247 |
+
{"current_steps": 2470, "total_steps": 3543, "loss": 0.2476, "lr": 2.0974177253955657e-05, "epoch": 2.091005291005291, "percentage": 69.71, "elapsed_time": "6:16:30", "remaining_time": "2:43:33"}
|
248 |
+
{"current_steps": 2480, "total_steps": 3543, "loss": 0.242, "lr": 2.0614324294367882e-05, "epoch": 2.0994708994708993, "percentage": 70.0, "elapsed_time": "6:18:02", "remaining_time": "2:42:02"}
|
249 |
+
{"current_steps": 2490, "total_steps": 3543, "loss": 0.247, "lr": 2.025678175127623e-05, "epoch": 2.107936507936508, "percentage": 70.28, "elapsed_time": "6:19:33", "remaining_time": "2:40:30"}
|
250 |
+
{"current_steps": 2500, "total_steps": 3543, "loss": 0.2418, "lr": 1.9901577736070598e-05, "epoch": 2.1164021164021163, "percentage": 70.56, "elapsed_time": "6:21:03", "remaining_time": "2:38:58"}
|