Rakancorle1 commited on
Commit
e961f72
1 Parent(s): 14dce9b

Training in progress, step 3000

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1574cad090827b614d1a03e4f742d066a93c4c282377ab48aa72cc55e1320a0
3
  size 42002584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4bfc7e3cbcda370ad03aaa2862e737045de8dad10bfd6823a46761cb2644e7c
3
  size 42002584
runs/Dec07_20-21-29_COE-CS-sv003/events.out.tfevents.1733602903.COE-CS-sv003.1598906.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6869e0028ab9968b77957dd6ee02303ef43a98ed65ea37dc2aa20549498c9a71
3
- size 58176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b06a449db1233c0490470cd5dfa26042a2e4dc712bdd5427bf209711579d3fee
3
+ size 68726
trainer_log.jsonl CHANGED
@@ -248,3 +248,53 @@
248
  {"current_steps": 2480, "total_steps": 3543, "loss": 0.242, "lr": 2.0614324294367882e-05, "epoch": 2.0994708994708993, "percentage": 70.0, "elapsed_time": "6:18:02", "remaining_time": "2:42:02"}
249
  {"current_steps": 2490, "total_steps": 3543, "loss": 0.247, "lr": 2.025678175127623e-05, "epoch": 2.107936507936508, "percentage": 70.28, "elapsed_time": "6:19:33", "remaining_time": "2:40:30"}
250
  {"current_steps": 2500, "total_steps": 3543, "loss": 0.2418, "lr": 1.9901577736070598e-05, "epoch": 2.1164021164021163, "percentage": 70.56, "elapsed_time": "6:21:03", "remaining_time": "2:38:58"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
248
  {"current_steps": 2480, "total_steps": 3543, "loss": 0.242, "lr": 2.0614324294367882e-05, "epoch": 2.0994708994708993, "percentage": 70.0, "elapsed_time": "6:18:02", "remaining_time": "2:42:02"}
249
  {"current_steps": 2490, "total_steps": 3543, "loss": 0.247, "lr": 2.025678175127623e-05, "epoch": 2.107936507936508, "percentage": 70.28, "elapsed_time": "6:19:33", "remaining_time": "2:40:30"}
250
  {"current_steps": 2500, "total_steps": 3543, "loss": 0.2418, "lr": 1.9901577736070598e-05, "epoch": 2.1164021164021163, "percentage": 70.56, "elapsed_time": "6:21:03", "remaining_time": "2:38:58"}
251
+ {"current_steps": 2510, "total_steps": 3543, "loss": 0.2504, "lr": 1.954874017627684e-05, "epoch": 2.124867724867725, "percentage": 70.84, "elapsed_time": "6:22:42", "remaining_time": "2:37:30"}
252
+ {"current_steps": 2520, "total_steps": 3543, "loss": 0.2442, "lr": 1.9198296813360777e-05, "epoch": 2.1333333333333333, "percentage": 71.13, "elapsed_time": "6:24:13", "remaining_time": "2:35:58"}
253
+ {"current_steps": 2530, "total_steps": 3543, "loss": 0.2453, "lr": 1.8850275200547142e-05, "epoch": 2.1417989417989416, "percentage": 71.41, "elapsed_time": "6:25:44", "remaining_time": "2:34:26"}
254
+ {"current_steps": 2540, "total_steps": 3543, "loss": 0.2488, "lr": 1.8504702700653194e-05, "epoch": 2.1502645502645503, "percentage": 71.69, "elapsed_time": "6:27:15", "remaining_time": "2:32:55"}
255
+ {"current_steps": 2550, "total_steps": 3543, "loss": 0.2377, "lr": 1.8161606483937433e-05, "epoch": 2.1587301587301586, "percentage": 71.97, "elapsed_time": "6:28:45", "remaining_time": "2:31:23"}
256
+ {"current_steps": 2560, "total_steps": 3543, "loss": 0.2571, "lr": 1.7821013525963316e-05, "epoch": 2.1671957671957673, "percentage": 72.26, "elapsed_time": "6:30:17", "remaining_time": "2:29:51"}
257
+ {"current_steps": 2570, "total_steps": 3543, "loss": 0.2449, "lr": 1.748295060547823e-05, "epoch": 2.1756613756613756, "percentage": 72.54, "elapsed_time": "6:31:48", "remaining_time": "2:28:20"}
258
+ {"current_steps": 2580, "total_steps": 3543, "loss": 0.2348, "lr": 1.7147444302308273e-05, "epoch": 2.1841269841269844, "percentage": 72.82, "elapsed_time": "6:33:19", "remaining_time": "2:26:48"}
259
+ {"current_steps": 2590, "total_steps": 3543, "loss": 0.2578, "lr": 1.6814520995268207e-05, "epoch": 2.1925925925925926, "percentage": 73.1, "elapsed_time": "6:34:50", "remaining_time": "2:25:16"}
260
+ {"current_steps": 2600, "total_steps": 3543, "loss": 0.2358, "lr": 1.6484206860087653e-05, "epoch": 2.201058201058201, "percentage": 73.38, "elapsed_time": "6:36:21", "remaining_time": "2:23:45"}
261
+ {"current_steps": 2610, "total_steps": 3543, "loss": 0.2288, "lr": 1.6156527867352845e-05, "epoch": 2.2095238095238097, "percentage": 73.67, "elapsed_time": "6:37:52", "remaining_time": "2:22:13"}
262
+ {"current_steps": 2620, "total_steps": 3543, "loss": 0.2478, "lr": 1.5831509780464947e-05, "epoch": 2.217989417989418, "percentage": 73.95, "elapsed_time": "6:39:23", "remaining_time": "2:20:42"}
263
+ {"current_steps": 2630, "total_steps": 3543, "loss": 0.2462, "lr": 1.5509178153614233e-05, "epoch": 2.2264550264550262, "percentage": 74.23, "elapsed_time": "6:40:54", "remaining_time": "2:19:10"}
264
+ {"current_steps": 2640, "total_steps": 3543, "loss": 0.2475, "lr": 1.5189558329771092e-05, "epoch": 2.234920634920635, "percentage": 74.51, "elapsed_time": "6:42:25", "remaining_time": "2:17:38"}
265
+ {"current_steps": 2650, "total_steps": 3543, "loss": 0.2577, "lr": 1.48726754386933e-05, "epoch": 2.2433862433862433, "percentage": 74.8, "elapsed_time": "6:43:56", "remaining_time": "2:16:07"}
266
+ {"current_steps": 2660, "total_steps": 3543, "loss": 0.2257, "lr": 1.4558554394950319e-05, "epoch": 2.251851851851852, "percentage": 75.08, "elapsed_time": "6:45:28", "remaining_time": "2:14:35"}
267
+ {"current_steps": 2670, "total_steps": 3543, "loss": 0.2366, "lr": 1.4247219895964458e-05, "epoch": 2.2603174603174603, "percentage": 75.36, "elapsed_time": "6:46:59", "remaining_time": "2:13:04"}
268
+ {"current_steps": 2680, "total_steps": 3543, "loss": 0.246, "lr": 1.3938696420068887e-05, "epoch": 2.268783068783069, "percentage": 75.64, "elapsed_time": "6:48:31", "remaining_time": "2:11:32"}
269
+ {"current_steps": 2690, "total_steps": 3543, "loss": 0.2362, "lr": 1.3633008224583276e-05, "epoch": 2.2772486772486773, "percentage": 75.92, "elapsed_time": "6:50:02", "remaining_time": "2:10:01"}
270
+ {"current_steps": 2700, "total_steps": 3543, "loss": 0.2271, "lr": 1.3330179343906424e-05, "epoch": 2.2857142857142856, "percentage": 76.21, "elapsed_time": "6:51:34", "remaining_time": "2:08:30"}
271
+ {"current_steps": 2710, "total_steps": 3543, "loss": 0.2349, "lr": 1.303023358762669e-05, "epoch": 2.2941798941798943, "percentage": 76.49, "elapsed_time": "6:53:05", "remaining_time": "2:06:58"}
272
+ {"current_steps": 2720, "total_steps": 3543, "loss": 0.2586, "lr": 1.27331945386499e-05, "epoch": 2.3026455026455026, "percentage": 76.77, "elapsed_time": "6:54:37", "remaining_time": "2:05:27"}
273
+ {"current_steps": 2730, "total_steps": 3543, "loss": 0.2417, "lr": 1.2439085551345209e-05, "epoch": 2.311111111111111, "percentage": 77.05, "elapsed_time": "6:56:08", "remaining_time": "2:03:55"}
274
+ {"current_steps": 2740, "total_steps": 3543, "loss": 0.2412, "lr": 1.2147929749708931e-05, "epoch": 2.3195767195767196, "percentage": 77.34, "elapsed_time": "6:57:40", "remaining_time": "2:02:24"}
275
+ {"current_steps": 2750, "total_steps": 3543, "loss": 0.235, "lr": 1.1859750025546362e-05, "epoch": 2.328042328042328, "percentage": 77.62, "elapsed_time": "6:59:11", "remaining_time": "2:00:52"}
276
+ {"current_steps": 2760, "total_steps": 3543, "loss": 0.2429, "lr": 1.1574569036671978e-05, "epoch": 2.3365079365079366, "percentage": 77.9, "elapsed_time": "7:00:43", "remaining_time": "1:59:21"}
277
+ {"current_steps": 2770, "total_steps": 3543, "loss": 0.2359, "lr": 1.129240920512798e-05, "epoch": 2.344973544973545, "percentage": 78.18, "elapsed_time": "7:02:14", "remaining_time": "1:57:49"}
278
+ {"current_steps": 2780, "total_steps": 3543, "loss": 0.2382, "lr": 1.101329271542143e-05, "epoch": 2.3534391534391537, "percentage": 78.46, "elapsed_time": "7:03:46", "remaining_time": "1:56:18"}
279
+ {"current_steps": 2790, "total_steps": 3543, "loss": 0.2458, "lr": 1.0737241512779928e-05, "epoch": 2.361904761904762, "percentage": 78.75, "elapsed_time": "7:05:17", "remaining_time": "1:54:47"}
280
+ {"current_steps": 2800, "total_steps": 3543, "loss": 0.2487, "lr": 1.046427730142625e-05, "epoch": 2.3703703703703702, "percentage": 79.03, "elapsed_time": "7:06:49", "remaining_time": "1:53:15"}
281
+ {"current_steps": 2810, "total_steps": 3543, "loss": 0.2369, "lr": 1.0194421542871918e-05, "epoch": 2.378835978835979, "percentage": 79.31, "elapsed_time": "7:08:20", "remaining_time": "1:51:44"}
282
+ {"current_steps": 2820, "total_steps": 3543, "loss": 0.2448, "lr": 9.927695454229713e-06, "epoch": 2.3873015873015873, "percentage": 79.59, "elapsed_time": "7:09:52", "remaining_time": "1:50:12"}
283
+ {"current_steps": 2830, "total_steps": 3543, "loss": 0.2419, "lr": 9.664120006545573e-06, "epoch": 2.3957671957671955, "percentage": 79.88, "elapsed_time": "7:11:24", "remaining_time": "1:48:41"}
284
+ {"current_steps": 2840, "total_steps": 3543, "loss": 0.2551, "lr": 9.403715923149742e-06, "epoch": 2.4042328042328043, "percentage": 80.16, "elapsed_time": "7:12:55", "remaining_time": "1:47:09"}
285
+ {"current_steps": 2850, "total_steps": 3543, "loss": 0.2178, "lr": 9.146503678027451e-06, "epoch": 2.4126984126984126, "percentage": 80.44, "elapsed_time": "7:14:26", "remaining_time": "1:45:38"}
286
+ {"current_steps": 2860, "total_steps": 3543, "loss": 0.227, "lr": 8.892503494209132e-06, "epoch": 2.4211640211640213, "percentage": 80.72, "elapsed_time": "7:15:58", "remaining_time": "1:44:06"}
287
+ {"current_steps": 2870, "total_steps": 3543, "loss": 0.2449, "lr": 8.641735342180402e-06, "epoch": 2.4296296296296296, "percentage": 81.0, "elapsed_time": "7:17:29", "remaining_time": "1:42:35"}
288
+ {"current_steps": 2880, "total_steps": 3543, "loss": 0.2287, "lr": 8.394218938311982e-06, "epoch": 2.4380952380952383, "percentage": 81.29, "elapsed_time": "7:19:01", "remaining_time": "1:41:03"}
289
+ {"current_steps": 2890, "total_steps": 3543, "loss": 0.2488, "lr": 8.149973743309414e-06, "epoch": 2.4465608465608466, "percentage": 81.57, "elapsed_time": "7:20:32", "remaining_time": "1:39:32"}
290
+ {"current_steps": 2900, "total_steps": 3543, "loss": 0.2339, "lr": 7.909018960683052e-06, "epoch": 2.455026455026455, "percentage": 81.85, "elapsed_time": "7:22:04", "remaining_time": "1:38:01"}
291
+ {"current_steps": 2910, "total_steps": 3543, "loss": 0.25, "lr": 7.671373535238168e-06, "epoch": 2.4634920634920636, "percentage": 82.13, "elapsed_time": "7:23:35", "remaining_time": "1:36:29"}
292
+ {"current_steps": 2920, "total_steps": 3543, "loss": 0.2348, "lr": 7.437056151585514e-06, "epoch": 2.471957671957672, "percentage": 82.42, "elapsed_time": "7:25:07", "remaining_time": "1:34:58"}
293
+ {"current_steps": 2930, "total_steps": 3543, "loss": 0.2319, "lr": 7.206085232672155e-06, "epoch": 2.48042328042328, "percentage": 82.7, "elapsed_time": "7:26:38", "remaining_time": "1:33:26"}
294
+ {"current_steps": 2940, "total_steps": 3543, "loss": 0.23, "lr": 6.978478938333055e-06, "epoch": 2.488888888888889, "percentage": 82.98, "elapsed_time": "7:28:10", "remaining_time": "1:31:55"}
295
+ {"current_steps": 2950, "total_steps": 3543, "loss": 0.2571, "lr": 6.75425516386326e-06, "epoch": 2.497354497354497, "percentage": 83.26, "elapsed_time": "7:29:41", "remaining_time": "1:30:23"}
296
+ {"current_steps": 2960, "total_steps": 3543, "loss": 0.2291, "lr": 6.533431538610923e-06, "epoch": 2.505820105820106, "percentage": 83.55, "elapsed_time": "7:31:13", "remaining_time": "1:28:52"}
297
+ {"current_steps": 2970, "total_steps": 3543, "loss": 0.2393, "lr": 6.3160254245911825e-06, "epoch": 2.5142857142857142, "percentage": 83.83, "elapsed_time": "7:32:45", "remaining_time": "1:27:20"}
298
+ {"current_steps": 2980, "total_steps": 3543, "loss": 0.2595, "lr": 6.102053915121092e-06, "epoch": 2.522751322751323, "percentage": 84.11, "elapsed_time": "7:34:16", "remaining_time": "1:25:49"}
299
+ {"current_steps": 2990, "total_steps": 3543, "loss": 0.2505, "lr": 5.891533833475732e-06, "epoch": 2.5312169312169313, "percentage": 84.39, "elapsed_time": "7:35:47", "remaining_time": "1:24:18"}
300
+ {"current_steps": 3000, "total_steps": 3543, "loss": 0.2415, "lr": 5.684481731565433e-06, "epoch": 2.5396825396825395, "percentage": 84.67, "elapsed_time": "7:37:19", "remaining_time": "1:22:46"}