BayesTensor committed on
Commit
d1d2433
·
verified ·
1 Parent(s): 99bd500

Training in progress, epoch 14, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f182ddc6a42f969c70c3ba45c6b66632e4c2357bc2d736ef52aebb2d32d424d0
3
  size 598442860
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd16e9b6f9345a4d55b0c6b3d9a0fe4562e07fba5825db705d2f8b1d40e04371
3
  size 598442860
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e100b9ab84b2ed7eba0c8e1e9d9d999e12f2ff3b481ee0e28a17333b39dc4c61
3
  size 1196973562
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d657efc862343e4ca0ff3dfe06b1a7a466d3b1dc217bb753b8649e31097031fb
3
  size 1196973562
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21c2425b85b819f329f6809df4ca360e34a2b44b18e94e8e0472ab0b59df0b2a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55eb9a50a24203e1f00ac6c722a2a24e52518f0efb376c58a3d9a8931f29ae83
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:347def11e7102864029b8bcdabdb4164ecba7c15bc54daa499824d15db0ad9cc
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65e5841a697daa9e5cf070050f5e101ef959328015c7c818070e14f85bca96d7
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.6671065935820338,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-1196",
4
- "epoch": 13.0,
5
  "eval_steps": 500,
6
- "global_step": 1196,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -201,6 +201,22 @@
201
  "eval_samples_per_second": 12.589,
202
  "eval_steps_per_second": 3.147,
203
  "step": 1196
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
204
  }
205
  ],
206
  "logging_steps": 100,
@@ -220,7 +236,7 @@
220
  "attributes": {}
221
  }
222
  },
223
- "total_flos": 8210856818034000.0,
224
  "train_batch_size": 4,
225
  "trial_name": null,
226
  "trial_params": null
 
1
  {
2
  "best_metric": 0.6671065935820338,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-1196",
4
+ "epoch": 14.0,
5
  "eval_steps": 500,
6
+ "global_step": 1288,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
201
  "eval_samples_per_second": 12.589,
202
  "eval_steps_per_second": 3.147,
203
  "step": 1196
204
+ },
205
+ {
206
+ "epoch": 13.043478260869565,
207
+ "grad_norm": 5.261804580688477,
208
+ "learning_rate": 1.0628019323671499e-05,
209
+ "loss": 0.4901,
210
+ "step": 1200
211
+ },
212
+ {
213
+ "epoch": 14.0,
214
+ "eval_f1": 0.6347571828121027,
215
+ "eval_loss": 2.9827301502227783,
216
+ "eval_runtime": 7.2649,
217
+ "eval_samples_per_second": 12.664,
218
+ "eval_steps_per_second": 3.166,
219
+ "step": 1288
220
  }
221
  ],
222
  "logging_steps": 100,
 
236
  "attributes": {}
237
  }
238
  },
239
+ "total_flos": 8842461188652000.0,
240
  "train_batch_size": 4,
241
  "trial_name": null,
242
  "trial_params": null