RodrigoSalazar-U commited on
Commit
6f9e45e
·
verified ·
1 Parent(s): 380bcb8

Training in progress, step 3000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f256054f75ca529de3de3d31d968831168d96bd93b26db8cfb78737f117fa5f
3
  size 4785762744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:196dba7b25c0a4c68d7a023c577d7e08c52e76d0408d8bc30c27ca039dbe9a92
3
  size 4785762744
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01e19a66b263f1d6b622f520ca1c19416aeecac18d947e4eebc62fbd930353fd
3
  size 3497859804
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68c232c70d72ff63954a64510b19045d431ee3cf56e8201d12f051c97760d891
3
  size 3497859804
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a5247c071411b90e6abc28dfd3094729155dc46bfcf927ecdb927c420369d449
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20c9aaea8c26c5e4232cacfa8dd7d43278b636bf8b016e620006628dcd43298e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.380071763731714,
5
  "eval_steps": 500,
6
- "global_step": 2500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -182,6 +182,41 @@
182
  "learning_rate": 9.08526023432446e-05,
183
  "loss": 0.3113,
184
  "step": 2500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
185
  }
186
  ],
187
  "logging_steps": 100,
@@ -201,7 +236,7 @@
201
  "attributes": {}
202
  }
203
  },
204
- "total_flos": 1.3266286871642112e+18,
205
  "train_batch_size": 16,
206
  "trial_name": null,
207
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.6560861164780567,
5
  "eval_steps": 500,
6
+ "global_step": 3000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
182
  "learning_rate": 9.08526023432446e-05,
183
  "loss": 0.3113,
184
  "step": 2500
185
+ },
186
+ {
187
+ "epoch": 1.4352746342809826,
188
+ "grad_norm": 1.3542137145996094,
189
+ "learning_rate": 8.971114170929969e-05,
190
+ "loss": 0.2965,
191
+ "step": 2600
192
+ },
193
+ {
194
+ "epoch": 1.4904775048302512,
195
+ "grad_norm": 1.0694419145584106,
196
+ "learning_rate": 8.851066780355073e-05,
197
+ "loss": 0.2907,
198
+ "step": 2700
199
+ },
200
+ {
201
+ "epoch": 1.5456803753795199,
202
+ "grad_norm": 1.2589095830917358,
203
+ "learning_rate": 8.72529646062573e-05,
204
+ "loss": 0.2881,
205
+ "step": 2800
206
+ },
207
+ {
208
+ "epoch": 1.6008832459287883,
209
+ "grad_norm": 0.9907445311546326,
210
+ "learning_rate": 8.593990114403092e-05,
211
+ "loss": 0.2833,
212
+ "step": 2900
213
+ },
214
+ {
215
+ "epoch": 1.6560861164780567,
216
+ "grad_norm": 1.1165964603424072,
217
+ "learning_rate": 8.45734287123433e-05,
218
+ "loss": 0.279,
219
+ "step": 3000
220
  }
221
  ],
222
  "logging_steps": 100,
 
236
  "attributes": {}
237
  }
238
  },
239
+ "total_flos": 1.5884360163671409e+18,
240
  "train_batch_size": 16,
241
  "trial_name": null,
242
  "trial_params": null