Training in progress, step 3500
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +50 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 645976488
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd8dd796d6baa0f42af20a5c6207b9d02fb58f2f4a5d0d0a02aaaac7e0cbdbb2
|
3 |
size 645976488
|
trainer_log.jsonl
CHANGED
@@ -303,3 +303,53 @@
|
|
303 |
{"current_steps": 2990, "total_steps": 3573, "loss": 1.0833, "lr": 3.948274213717015e-06, "epoch": 2.510495382031906, "percentage": 83.68, "elapsed_time": "1:05:29", "remaining_time": "0:12:46"}
|
304 |
{"current_steps": 3000, "total_steps": 3573, "loss": 1.0794, "lr": 3.817517754917802e-06, "epoch": 2.5188916876574305, "percentage": 83.96, "elapsed_time": "1:05:41", "remaining_time": "0:12:32"}
|
305 |
{"current_steps": 3000, "total_steps": 3573, "eval_loss": 1.271108627319336, "epoch": 2.5188916876574305, "percentage": 83.96, "elapsed_time": "1:06:19", "remaining_time": "0:12:40"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
303 |
{"current_steps": 2990, "total_steps": 3573, "loss": 1.0833, "lr": 3.948274213717015e-06, "epoch": 2.510495382031906, "percentage": 83.68, "elapsed_time": "1:05:29", "remaining_time": "0:12:46"}
|
304 |
{"current_steps": 3000, "total_steps": 3573, "loss": 1.0794, "lr": 3.817517754917802e-06, "epoch": 2.5188916876574305, "percentage": 83.96, "elapsed_time": "1:05:41", "remaining_time": "0:12:32"}
|
305 |
{"current_steps": 3000, "total_steps": 3573, "eval_loss": 1.271108627319336, "epoch": 2.5188916876574305, "percentage": 83.96, "elapsed_time": "1:06:19", "remaining_time": "0:12:40"}
|
306 |
+
{"current_steps": 3010, "total_steps": 3573, "loss": 1.0797, "lr": 3.6887839016293807e-06, "epoch": 2.5272879932829557, "percentage": 84.24, "elapsed_time": "1:06:53", "remaining_time": "0:12:30"}
|
307 |
+
{"current_steps": 3020, "total_steps": 3573, "loss": 1.0809, "lr": 3.5620849459805983e-06, "epoch": 2.53568429890848, "percentage": 84.52, "elapsed_time": "1:07:05", "remaining_time": "0:12:17"}
|
308 |
+
{"current_steps": 3030, "total_steps": 3573, "loss": 1.0841, "lr": 3.4374329857984637e-06, "epoch": 2.544080604534005, "percentage": 84.8, "elapsed_time": "1:07:17", "remaining_time": "0:12:03"}
|
309 |
+
{"current_steps": 3040, "total_steps": 3573, "loss": 1.0783, "lr": 3.314839923453003e-06, "epoch": 2.55247691015953, "percentage": 85.08, "elapsed_time": "1:07:29", "remaining_time": "0:11:50"}
|
310 |
+
{"current_steps": 3050, "total_steps": 3573, "loss": 1.0657, "lr": 3.1943174647207474e-06, "epoch": 2.5608732157850547, "percentage": 85.36, "elapsed_time": "1:07:42", "remaining_time": "0:11:36"}
|
311 |
+
{"current_steps": 3060, "total_steps": 3573, "loss": 1.0811, "lr": 3.0758771176669948e-06, "epoch": 2.5692695214105794, "percentage": 85.64, "elapsed_time": "1:07:54", "remaining_time": "0:11:23"}
|
312 |
+
{"current_steps": 3070, "total_steps": 3573, "loss": 1.085, "lr": 2.9595301915470246e-06, "epoch": 2.577665827036104, "percentage": 85.92, "elapsed_time": "1:08:06", "remaining_time": "0:11:09"}
|
313 |
+
{"current_steps": 3080, "total_steps": 3573, "loss": 1.0682, "lr": 2.8452877957261537e-06, "epoch": 2.586062132661629, "percentage": 86.2, "elapsed_time": "1:08:18", "remaining_time": "0:10:56"}
|
314 |
+
{"current_steps": 3090, "total_steps": 3573, "loss": 1.0705, "lr": 2.73316083861902e-06, "epoch": 2.5944584382871536, "percentage": 86.48, "elapsed_time": "1:08:31", "remaining_time": "0:10:42"}
|
315 |
+
{"current_steps": 3100, "total_steps": 3573, "loss": 1.08, "lr": 2.623160026647978e-06, "epoch": 2.6028547439126783, "percentage": 86.76, "elapsed_time": "1:08:43", "remaining_time": "0:10:29"}
|
316 |
+
{"current_steps": 3110, "total_steps": 3573, "loss": 1.055, "lr": 2.515295863220796e-06, "epoch": 2.611251049538203, "percentage": 87.04, "elapsed_time": "1:08:55", "remaining_time": "0:10:15"}
|
317 |
+
{"current_steps": 3120, "total_steps": 3573, "loss": 1.0541, "lr": 2.4095786477277253e-06, "epoch": 2.619647355163728, "percentage": 87.32, "elapsed_time": "1:09:07", "remaining_time": "0:10:02"}
|
318 |
+
{"current_steps": 3130, "total_steps": 3573, "loss": 1.0712, "lr": 2.3060184745580972e-06, "epoch": 2.6280436607892526, "percentage": 87.6, "elapsed_time": "1:09:20", "remaining_time": "0:09:48"}
|
319 |
+
{"current_steps": 3140, "total_steps": 3573, "loss": 1.0785, "lr": 2.2046252321364368e-06, "epoch": 2.6364399664147777, "percentage": 87.88, "elapsed_time": "1:09:32", "remaining_time": "0:09:35"}
|
320 |
+
{"current_steps": 3150, "total_steps": 3573, "loss": 1.0623, "lr": 2.1054086019782785e-06, "epoch": 2.644836272040302, "percentage": 88.16, "elapsed_time": "1:09:44", "remaining_time": "0:09:21"}
|
321 |
+
{"current_steps": 3160, "total_steps": 3573, "loss": 1.0629, "lr": 2.008378057765725e-06, "epoch": 2.653232577665827, "percentage": 88.44, "elapsed_time": "1:09:56", "remaining_time": "0:09:08"}
|
322 |
+
{"current_steps": 3170, "total_steps": 3573, "loss": 1.0682, "lr": 1.913542864442849e-06, "epoch": 2.661628883291352, "percentage": 88.72, "elapsed_time": "1:10:08", "remaining_time": "0:08:55"}
|
323 |
+
{"current_steps": 3180, "total_steps": 3573, "loss": 1.0352, "lr": 1.8209120773310468e-06, "epoch": 2.6700251889168767, "percentage": 89.0, "elapsed_time": "1:10:21", "remaining_time": "0:08:41"}
|
324 |
+
{"current_steps": 3190, "total_steps": 3573, "loss": 1.0617, "lr": 1.7304945412643825e-06, "epoch": 2.6784214945424014, "percentage": 89.28, "elapsed_time": "1:10:33", "remaining_time": "0:08:28"}
|
325 |
+
{"current_steps": 3200, "total_steps": 3573, "loss": 1.0712, "lr": 1.6422988897450392e-06, "epoch": 2.686817800167926, "percentage": 89.56, "elapsed_time": "1:10:45", "remaining_time": "0:08:14"}
|
326 |
+
{"current_steps": 3210, "total_steps": 3573, "loss": 1.0735, "lr": 1.5563335441189458e-06, "epoch": 2.695214105793451, "percentage": 89.84, "elapsed_time": "1:10:57", "remaining_time": "0:08:01"}
|
327 |
+
{"current_steps": 3220, "total_steps": 3573, "loss": 1.0621, "lr": 1.4726067127716958e-06, "epoch": 2.7036104114189756, "percentage": 90.12, "elapsed_time": "1:11:10", "remaining_time": "0:07:48"}
|
328 |
+
{"current_steps": 3230, "total_steps": 3573, "loss": 1.0652, "lr": 1.3911263903447241e-06, "epoch": 2.7120067170445004, "percentage": 90.4, "elapsed_time": "1:11:22", "remaining_time": "0:07:34"}
|
329 |
+
{"current_steps": 3240, "total_steps": 3573, "loss": 1.0622, "lr": 1.3119003569719789e-06, "epoch": 2.720403022670025, "percentage": 90.68, "elapsed_time": "1:11:34", "remaining_time": "0:07:21"}
|
330 |
+
{"current_steps": 3250, "total_steps": 3573, "loss": 1.063, "lr": 1.2349361775370245e-06, "epoch": 2.72879932829555, "percentage": 90.96, "elapsed_time": "1:11:46", "remaining_time": "0:07:08"}
|
331 |
+
{"current_steps": 3260, "total_steps": 3573, "loss": 1.0598, "lr": 1.1602412009507014e-06, "epoch": 2.7371956339210746, "percentage": 91.24, "elapsed_time": "1:11:59", "remaining_time": "0:06:54"}
|
332 |
+
{"current_steps": 3270, "total_steps": 3573, "loss": 1.037, "lr": 1.087822559449425e-06, "epoch": 2.7455919395465997, "percentage": 91.52, "elapsed_time": "1:12:11", "remaining_time": "0:06:41"}
|
333 |
+
{"current_steps": 3280, "total_steps": 3573, "loss": 1.0721, "lr": 1.0176871679141664e-06, "epoch": 2.753988245172124, "percentage": 91.8, "elapsed_time": "1:12:23", "remaining_time": "0:06:28"}
|
334 |
+
{"current_steps": 3290, "total_steps": 3573, "loss": 1.0624, "lr": 9.49841723210182e-07, "epoch": 2.762384550797649, "percentage": 92.08, "elapsed_time": "1:12:35", "remaining_time": "0:06:14"}
|
335 |
+
{"current_steps": 3300, "total_steps": 3573, "loss": 1.0868, "lr": 8.842927035475763e-07, "epoch": 2.770780856423174, "percentage": 92.36, "elapsed_time": "1:12:48", "remaining_time": "0:06:01"}
|
336 |
+
{"current_steps": 3310, "total_steps": 3573, "loss": 1.0509, "lr": 8.210463678626989e-07, "epoch": 2.7791771620486987, "percentage": 92.64, "elapsed_time": "1:13:00", "remaining_time": "0:05:48"}
|
337 |
+
{"current_steps": 3320, "total_steps": 3573, "loss": 1.0568, "lr": 7.601087552205621e-07, "epoch": 2.7875734676742234, "percentage": 92.92, "elapsed_time": "1:13:12", "remaining_time": "0:05:34"}
|
338 |
+
{"current_steps": 3330, "total_steps": 3573, "loss": 1.0745, "lr": 7.014856842381484e-07, "epoch": 2.795969773299748, "percentage": 93.2, "elapsed_time": "1:13:24", "remaining_time": "0:05:21"}
|
339 |
+
{"current_steps": 3340, "total_steps": 3573, "loss": 1.0708, "lr": 6.451827525288612e-07, "epoch": 2.804366078925273, "percentage": 93.48, "elapsed_time": "1:13:36", "remaining_time": "0:05:08"}
|
340 |
+
{"current_steps": 3350, "total_steps": 3573, "loss": 1.0772, "lr": 5.912053361680159e-07, "epoch": 2.8127623845507976, "percentage": 93.76, "elapsed_time": "1:13:48", "remaining_time": "0:04:54"}
|
341 |
+
{"current_steps": 3360, "total_steps": 3573, "loss": 1.0437, "lr": 5.395585891795174e-07, "epoch": 2.8211586901763224, "percentage": 94.04, "elapsed_time": "1:14:01", "remaining_time": "0:04:41"}
|
342 |
+
{"current_steps": 3370, "total_steps": 3573, "loss": 1.064, "lr": 4.90247443043712e-07, "epoch": 2.829554995801847, "percentage": 94.32, "elapsed_time": "1:14:13", "remaining_time": "0:04:28"}
|
343 |
+
{"current_steps": 3380, "total_steps": 3573, "loss": 1.0702, "lr": 4.43276606226542e-07, "epoch": 2.837951301427372, "percentage": 94.6, "elapsed_time": "1:14:25", "remaining_time": "0:04:14"}
|
344 |
+
{"current_steps": 3390, "total_steps": 3573, "loss": 1.0731, "lr": 3.9865056372990763e-07, "epoch": 2.8463476070528966, "percentage": 94.88, "elapsed_time": "1:14:37", "remaining_time": "0:04:01"}
|
345 |
+
{"current_steps": 3400, "total_steps": 3573, "loss": 1.0576, "lr": 3.563735766634629e-07, "epoch": 2.8547439126784218, "percentage": 95.16, "elapsed_time": "1:14:49", "remaining_time": "0:03:48"}
|
346 |
+
{"current_steps": 3410, "total_steps": 3573, "loss": 1.0526, "lr": 3.164496818377188e-07, "epoch": 2.863140218303946, "percentage": 95.44, "elapsed_time": "1:15:01", "remaining_time": "0:03:35"}
|
347 |
+
{"current_steps": 3420, "total_steps": 3573, "loss": 1.0631, "lr": 2.7888269137860413e-07, "epoch": 2.8715365239294712, "percentage": 95.72, "elapsed_time": "1:15:14", "remaining_time": "0:03:21"}
|
348 |
+
{"current_steps": 3430, "total_steps": 3573, "loss": 1.1013, "lr": 2.436761923634456e-07, "epoch": 2.879932829554996, "percentage": 96.0, "elapsed_time": "1:15:26", "remaining_time": "0:03:08"}
|
349 |
+
{"current_steps": 3440, "total_steps": 3573, "loss": 1.0737, "lr": 2.108335464784811e-07, "epoch": 2.8883291351805207, "percentage": 96.28, "elapsed_time": "1:15:38", "remaining_time": "0:02:55"}
|
350 |
+
{"current_steps": 3450, "total_steps": 3573, "loss": 1.0823, "lr": 1.8035788969784638e-07, "epoch": 2.8967254408060454, "percentage": 96.56, "elapsed_time": "1:15:50", "remaining_time": "0:02:42"}
|
351 |
+
{"current_steps": 3460, "total_steps": 3573, "loss": 1.0692, "lr": 1.522521319841541e-07, "epoch": 2.90512174643157, "percentage": 96.84, "elapsed_time": "1:16:03", "remaining_time": "0:02:29"}
|
352 |
+
{"current_steps": 3470, "total_steps": 3573, "loss": 1.0698, "lr": 1.2651895701063233e-07, "epoch": 2.913518052057095, "percentage": 97.12, "elapsed_time": "1:16:15", "remaining_time": "0:02:15"}
|
353 |
+
{"current_steps": 3480, "total_steps": 3573, "loss": 1.0746, "lr": 1.0316082190486298e-07, "epoch": 2.9219143576826196, "percentage": 97.4, "elapsed_time": "1:16:27", "remaining_time": "0:02:02"}
|
354 |
+
{"current_steps": 3490, "total_steps": 3573, "loss": 1.0454, "lr": 8.217995701418624e-08, "epoch": 2.9303106633081444, "percentage": 97.68, "elapsed_time": "1:16:39", "remaining_time": "0:01:49"}
|
355 |
+
{"current_steps": 3500, "total_steps": 3573, "loss": 1.056, "lr": 6.35783656927097e-08, "epoch": 2.938706968933669, "percentage": 97.96, "elapsed_time": "1:16:51", "remaining_time": "0:01:36"}
|