Rakancorle1 commited on
Commit
84bdd16
1 Parent(s): eea8296

Training in progress, step 1500

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b983eca3e9d7567d6effd2767b03728dd61f9c14ad8dabb8c6e0bcfe8587e16
3
  size 42002584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa25ea539de469ee986d49b19492b15be1514ac82d19e087a8a1799ba0f802e5
3
  size 42002584
runs/Dec07_20-21-29_COE-CS-sv003/events.out.tfevents.1733602903.COE-CS-sv003.1598906.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd006138a112a346f9c6fca4de785b41eb794be9eb4ac94b5d0dcf9d35e3b0f6
3
- size 26526
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aefeb1c0dd1401b70880110fcca8f94736ba9c323249f77ccfe4fa4000e1dc02
3
+ size 37076
trainer_log.jsonl CHANGED
@@ -98,3 +98,53 @@
98
  {"current_steps": 980, "total_steps": 3543, "loss": 0.3968, "lr": 8.228067221736595e-05, "epoch": 0.8296296296296296, "percentage": 27.66, "elapsed_time": "2:29:39", "remaining_time": "6:31:24"}
99
  {"current_steps": 990, "total_steps": 3543, "loss": 0.4025, "lr": 8.19408354678804e-05, "epoch": 0.8380952380952381, "percentage": 27.94, "elapsed_time": "2:31:10", "remaining_time": "6:29:52"}
100
  {"current_steps": 1000, "total_steps": 3543, "loss": 0.4189, "lr": 8.159848740526723e-05, "epoch": 0.8465608465608465, "percentage": 28.22, "elapsed_time": "2:32:42", "remaining_time": "6:28:19"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
98
  {"current_steps": 980, "total_steps": 3543, "loss": 0.3968, "lr": 8.228067221736595e-05, "epoch": 0.8296296296296296, "percentage": 27.66, "elapsed_time": "2:29:39", "remaining_time": "6:31:24"}
99
  {"current_steps": 990, "total_steps": 3543, "loss": 0.4025, "lr": 8.19408354678804e-05, "epoch": 0.8380952380952381, "percentage": 27.94, "elapsed_time": "2:31:10", "remaining_time": "6:29:52"}
100
  {"current_steps": 1000, "total_steps": 3543, "loss": 0.4189, "lr": 8.159848740526723e-05, "epoch": 0.8465608465608465, "percentage": 28.22, "elapsed_time": "2:32:42", "remaining_time": "6:28:19"}
101
+ {"current_steps": 1010, "total_steps": 3543, "loss": 0.4062, "lr": 8.125365494626706e-05, "epoch": 0.855026455026455, "percentage": 28.51, "elapsed_time": "2:34:20", "remaining_time": "6:27:05"}
102
+ {"current_steps": 1020, "total_steps": 3543, "loss": 0.4064, "lr": 8.090636520295348e-05, "epoch": 0.8634920634920635, "percentage": 28.79, "elapsed_time": "2:35:52", "remaining_time": "6:25:33"}
103
+ {"current_steps": 1030, "total_steps": 3543, "loss": 0.4085, "lr": 8.055664548060131e-05, "epoch": 0.8719576719576719, "percentage": 29.07, "elapsed_time": "2:37:23", "remaining_time": "6:24:01"}
104
+ {"current_steps": 1040, "total_steps": 3543, "loss": 0.4206, "lr": 8.020452327553986e-05, "epoch": 0.8804232804232804, "percentage": 29.35, "elapsed_time": "2:38:55", "remaining_time": "6:22:28"}
105
+ {"current_steps": 1050, "total_steps": 3543, "loss": 0.4139, "lr": 7.9850026272991e-05, "epoch": 0.8888888888888888, "percentage": 29.64, "elapsed_time": "2:40:26", "remaining_time": "6:20:55"}
106
+ {"current_steps": 1060, "total_steps": 3543, "loss": 0.4152, "lr": 7.94931823448924e-05, "epoch": 0.8973544973544973, "percentage": 29.92, "elapsed_time": "2:41:57", "remaining_time": "6:19:22"}
107
+ {"current_steps": 1070, "total_steps": 3543, "loss": 0.3971, "lr": 7.913401954770622e-05, "epoch": 0.9058201058201059, "percentage": 30.2, "elapsed_time": "2:43:28", "remaining_time": "6:17:48"}
108
+ {"current_steps": 1080, "total_steps": 3543, "loss": 0.4147, "lr": 7.877256612021312e-05, "epoch": 0.9142857142857143, "percentage": 30.48, "elapsed_time": "2:44:59", "remaining_time": "6:16:15"}
109
+ {"current_steps": 1090, "total_steps": 3543, "loss": 0.4012, "lr": 7.84088504812921e-05, "epoch": 0.9227513227513228, "percentage": 30.76, "elapsed_time": "2:46:30", "remaining_time": "6:14:42"}
110
+ {"current_steps": 1100, "total_steps": 3543, "loss": 0.3925, "lr": 7.804290122768601e-05, "epoch": 0.9312169312169312, "percentage": 31.05, "elapsed_time": "2:48:01", "remaining_time": "6:13:09"}
111
+ {"current_steps": 1110, "total_steps": 3543, "loss": 0.4102, "lr": 7.767474713175321e-05, "epoch": 0.9396825396825397, "percentage": 31.33, "elapsed_time": "2:49:32", "remaining_time": "6:11:36"}
112
+ {"current_steps": 1120, "total_steps": 3543, "loss": 0.4065, "lr": 7.73044171392054e-05, "epoch": 0.9481481481481482, "percentage": 31.61, "elapsed_time": "2:51:03", "remaining_time": "6:10:04"}
113
+ {"current_steps": 1130, "total_steps": 3543, "loss": 0.3827, "lr": 7.69319403668317e-05, "epoch": 0.9566137566137566, "percentage": 31.89, "elapsed_time": "2:52:34", "remaining_time": "6:08:31"}
114
+ {"current_steps": 1140, "total_steps": 3543, "loss": 0.4088, "lr": 7.655734610020952e-05, "epoch": 0.9650793650793651, "percentage": 32.18, "elapsed_time": "2:54:06", "remaining_time": "6:06:59"}
115
+ {"current_steps": 1150, "total_steps": 3543, "loss": 0.4154, "lr": 7.618066379140186e-05, "epoch": 0.9735449735449735, "percentage": 32.46, "elapsed_time": "2:55:38", "remaining_time": "6:05:28"}
116
+ {"current_steps": 1160, "total_steps": 3543, "loss": 0.3986, "lr": 7.580192305664174e-05, "epoch": 0.982010582010582, "percentage": 32.74, "elapsed_time": "2:57:09", "remaining_time": "6:03:56"}
117
+ {"current_steps": 1170, "total_steps": 3543, "loss": 0.3929, "lr": 7.542115367400376e-05, "epoch": 0.9904761904761905, "percentage": 33.02, "elapsed_time": "2:58:40", "remaining_time": "6:02:23"}
118
+ {"current_steps": 1180, "total_steps": 3543, "loss": 0.3868, "lr": 7.503838558106263e-05, "epoch": 0.9989417989417989, "percentage": 33.31, "elapsed_time": "3:00:11", "remaining_time": "6:00:51"}
119
+ {"current_steps": 1190, "total_steps": 3543, "loss": 0.3725, "lr": 7.465364887253949e-05, "epoch": 1.0074074074074073, "percentage": 33.59, "elapsed_time": "3:01:42", "remaining_time": "5:59:18"}
120
+ {"current_steps": 1200, "total_steps": 3543, "loss": 0.3436, "lr": 7.426697379793572e-05, "epoch": 1.0158730158730158, "percentage": 33.87, "elapsed_time": "3:03:13", "remaining_time": "5:57:45"}
121
+ {"current_steps": 1210, "total_steps": 3543, "loss": 0.3434, "lr": 7.387839075915465e-05, "epoch": 1.0243386243386243, "percentage": 34.15, "elapsed_time": "3:04:45", "remaining_time": "5:56:13"}
122
+ {"current_steps": 1220, "total_steps": 3543, "loss": 0.3333, "lr": 7.348793030811111e-05, "epoch": 1.0328042328042328, "percentage": 34.43, "elapsed_time": "3:06:16", "remaining_time": "5:54:41"}
123
+ {"current_steps": 1230, "total_steps": 3543, "loss": 0.3205, "lr": 7.309562314432952e-05, "epoch": 1.0412698412698413, "percentage": 34.72, "elapsed_time": "3:07:47", "remaining_time": "5:53:08"}
124
+ {"current_steps": 1240, "total_steps": 3543, "loss": 0.3426, "lr": 7.270150011252994e-05, "epoch": 1.0497354497354496, "percentage": 35.0, "elapsed_time": "3:09:18", "remaining_time": "5:51:36"}
125
+ {"current_steps": 1250, "total_steps": 3543, "loss": 0.3197, "lr": 7.230559220020319e-05, "epoch": 1.0582010582010581, "percentage": 35.28, "elapsed_time": "3:10:50", "remaining_time": "5:50:03"}
126
+ {"current_steps": 1260, "total_steps": 3543, "loss": 0.3317, "lr": 7.190793053517424e-05, "epoch": 1.0666666666666667, "percentage": 35.56, "elapsed_time": "3:12:21", "remaining_time": "5:48:31"}
127
+ {"current_steps": 1270, "total_steps": 3543, "loss": 0.3264, "lr": 7.1508546383155e-05, "epoch": 1.0751322751322752, "percentage": 35.85, "elapsed_time": "3:13:52", "remaining_time": "5:46:59"}
128
+ {"current_steps": 1280, "total_steps": 3543, "loss": 0.3294, "lr": 7.110747114528604e-05, "epoch": 1.0835978835978837, "percentage": 36.13, "elapsed_time": "3:15:23", "remaining_time": "5:45:26"}
129
+ {"current_steps": 1290, "total_steps": 3543, "loss": 0.3272, "lr": 7.070473635566768e-05, "epoch": 1.0920634920634922, "percentage": 36.41, "elapsed_time": "3:16:54", "remaining_time": "5:43:54"}
130
+ {"current_steps": 1300, "total_steps": 3543, "loss": 0.3382, "lr": 7.030037367888069e-05, "epoch": 1.1005291005291005, "percentage": 36.69, "elapsed_time": "3:18:25", "remaining_time": "5:42:22"}
131
+ {"current_steps": 1310, "total_steps": 3543, "loss": 0.313, "lr": 6.989441490749662e-05, "epoch": 1.108994708994709, "percentage": 36.97, "elapsed_time": "3:19:57", "remaining_time": "5:40:50"}
132
+ {"current_steps": 1320, "total_steps": 3543, "loss": 0.3261, "lr": 6.948689195957829e-05, "epoch": 1.1174603174603175, "percentage": 37.26, "elapsed_time": "3:21:28", "remaining_time": "5:39:18"}
133
+ {"current_steps": 1330, "total_steps": 3543, "loss": 0.3295, "lr": 6.907783687617017e-05, "epoch": 1.125925925925926, "percentage": 37.54, "elapsed_time": "3:22:59", "remaining_time": "5:37:45"}
134
+ {"current_steps": 1340, "total_steps": 3543, "loss": 0.3208, "lr": 6.866728181877914e-05, "epoch": 1.1343915343915345, "percentage": 37.82, "elapsed_time": "3:24:30", "remaining_time": "5:36:13"}
135
+ {"current_steps": 1350, "total_steps": 3543, "loss": 0.2993, "lr": 6.825525906684593e-05, "epoch": 1.1428571428571428, "percentage": 38.1, "elapsed_time": "3:26:01", "remaining_time": "5:34:41"}
136
+ {"current_steps": 1360, "total_steps": 3543, "loss": 0.3519, "lr": 6.784180101520717e-05, "epoch": 1.1513227513227513, "percentage": 38.39, "elapsed_time": "3:27:32", "remaining_time": "5:33:08"}
137
+ {"current_steps": 1370, "total_steps": 3543, "loss": 0.3468, "lr": 6.74269401715483e-05, "epoch": 1.1597883597883598, "percentage": 38.67, "elapsed_time": "3:29:03", "remaining_time": "5:31:36"}
138
+ {"current_steps": 1380, "total_steps": 3543, "loss": 0.3666, "lr": 6.701070915384776e-05, "epoch": 1.1682539682539683, "percentage": 38.95, "elapsed_time": "3:30:35", "remaining_time": "5:30:04"}
139
+ {"current_steps": 1390, "total_steps": 3543, "loss": 0.3516, "lr": 6.659314068781241e-05, "epoch": 1.1767195767195768, "percentage": 39.23, "elapsed_time": "3:32:06", "remaining_time": "5:28:31"}
140
+ {"current_steps": 1400, "total_steps": 3543, "loss": 0.3444, "lr": 6.617426760430457e-05, "epoch": 1.1851851851851851, "percentage": 39.51, "elapsed_time": "3:33:37", "remaining_time": "5:26:59"}
141
+ {"current_steps": 1410, "total_steps": 3543, "loss": 0.3246, "lr": 6.575412283676063e-05, "epoch": 1.1936507936507936, "percentage": 39.8, "elapsed_time": "3:35:08", "remaining_time": "5:25:27"}
142
+ {"current_steps": 1420, "total_steps": 3543, "loss": 0.3406, "lr": 6.533273941860174e-05, "epoch": 1.2021164021164021, "percentage": 40.08, "elapsed_time": "3:36:39", "remaining_time": "5:23:55"}
143
+ {"current_steps": 1430, "total_steps": 3543, "loss": 0.3383, "lr": 6.491015048063662e-05, "epoch": 1.2105820105820106, "percentage": 40.36, "elapsed_time": "3:38:10", "remaining_time": "5:22:22"}
144
+ {"current_steps": 1440, "total_steps": 3543, "loss": 0.3217, "lr": 6.448638924845662e-05, "epoch": 1.2190476190476192, "percentage": 40.64, "elapsed_time": "3:39:41", "remaining_time": "5:20:50"}
145
+ {"current_steps": 1450, "total_steps": 3543, "loss": 0.3481, "lr": 6.40614890398235e-05, "epoch": 1.2275132275132274, "percentage": 40.93, "elapsed_time": "3:41:12", "remaining_time": "5:19:18"}
146
+ {"current_steps": 1460, "total_steps": 3543, "loss": 0.3313, "lr": 6.36354832620497e-05, "epoch": 1.235978835978836, "percentage": 41.21, "elapsed_time": "3:42:43", "remaining_time": "5:17:46"}
147
+ {"current_steps": 1470, "total_steps": 3543, "loss": 0.3286, "lr": 6.320840540937196e-05, "epoch": 1.2444444444444445, "percentage": 41.49, "elapsed_time": "3:44:15", "remaining_time": "5:16:14"}
148
+ {"current_steps": 1480, "total_steps": 3543, "loss": 0.337, "lr": 6.278028906031757e-05, "epoch": 1.252910052910053, "percentage": 41.77, "elapsed_time": "3:45:46", "remaining_time": "5:14:43"}
149
+ {"current_steps": 1490, "total_steps": 3543, "loss": 0.3373, "lr": 6.235116787506458e-05, "epoch": 1.2613756613756615, "percentage": 42.05, "elapsed_time": "3:47:18", "remaining_time": "5:13:12"}
150
+ {"current_steps": 1500, "total_steps": 3543, "loss": 0.344, "lr": 6.192107559279513e-05, "epoch": 1.2698412698412698, "percentage": 42.34, "elapsed_time": "3:48:50", "remaining_time": "5:11:40"}