RodrigoSalazar-U commited on
Commit
699bad1
·
verified ·
1 Parent(s): 7012682

Training in progress, step 2500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:466fbce9975c9c05303ad2e9f3211bd116287df8f6b5fe724fff725117351d68
3
  size 4785762744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f256054f75ca529de3de3d31d968831168d96bd93b26db8cfb78737f117fa5f
3
  size 4785762744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00654d0986b4c2807a076dcd6fb04da902863d7591267af0d0f07d64685e5591
3
  size 3497859804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01e19a66b263f1d6b622f520ca1c19416aeecac18d947e4eebc62fbd930353fd
3
  size 3497859804
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91357e6edb760a8623172a8598e28f7bde5a301ce8f9e8873076c6ef6d8599e4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5247c071411b90e6abc28dfd3094729155dc46bfcf927ecdb927c420369d449
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.1040574109853711,
5
  "eval_steps": 500,
6
- "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -147,6 +147,41 @@
147
  "learning_rate": 9.561854333075736e-05,
148
  "loss": 0.3029,
149
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
150
  }
151
  ],
152
  "logging_steps": 100,
@@ -166,7 +201,7 @@
166
  "attributes": {}
167
  }
168
  },
169
- "total_flos": 1.0607056890750566e+18,
170
  "train_batch_size": 16,
171
  "trial_name": null,
172
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.380071763731714,
5
  "eval_steps": 500,
6
+ "global_step": 2500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
147
  "learning_rate": 9.561854333075736e-05,
148
  "loss": 0.3029,
149
  "step": 2000
150
+ },
151
+ {
152
+ "epoch": 1.1592602815346398,
153
+ "grad_norm": 1.305432915687561,
154
+ "learning_rate": 9.479575396130191e-05,
155
+ "loss": 0.2974,
156
+ "step": 2100
157
+ },
158
+ {
159
+ "epoch": 1.2144631520839084,
160
+ "grad_norm": 1.2165225744247437,
161
+ "learning_rate": 9.390639526418681e-05,
162
+ "loss": 0.2999,
163
+ "step": 2200
164
+ },
165
+ {
166
+ "epoch": 1.2696660226331768,
167
+ "grad_norm": 1.5560479164123535,
168
+ "learning_rate": 9.295178888276614e-05,
169
+ "loss": 0.2957,
170
+ "step": 2300
171
+ },
172
+ {
173
+ "epoch": 1.3248688931824455,
174
+ "grad_norm": 1.236303448677063,
175
+ "learning_rate": 9.193335342258558e-05,
176
+ "loss": 0.3,
177
+ "step": 2400
178
+ },
179
+ {
180
+ "epoch": 1.380071763731714,
181
+ "grad_norm": 1.3867113590240479,
182
+ "learning_rate": 9.08526023432446e-05,
183
+ "loss": 0.3113,
184
+ "step": 2500
185
  }
186
  ],
187
  "logging_steps": 100,
 
201
  "attributes": {}
202
  }
203
  },
204
+ "total_flos": 1.3266286871642112e+18,
205
  "train_batch_size": 16,
206
  "trial_name": null,
207
  "trial_params": null