BayesTensor committed on
Commit
b1b3834
·
verified ·
1 Parent(s): 3c94a56

Training in progress, epoch 21, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:170668e0f882239f6d921c391d98d535e2dd0d797e483f542f28113b25e94747
3
  size 598442860
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a75e651b7dedf26c76800365f26f62ec83c75ac7eb4bc15e6dc3f953d658978
3
  size 598442860
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5cb54bebba1f486784e4f8ef5bfd42e3532aa41a4b5240748e5073470faef87
3
  size 1196973562
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4cfe62004e5a561d9d643bca65ac0c62d1d489b276b30033f099d5b42b27b4c
3
  size 1196973562
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58445eff8cfea6167d69710c1c3e8b46f4af1c16da39f8fe17f7ddecfb128b91
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d2633b30d6f8bc95e53ac59f43880033523b63ea88408f92c1df3391a619329
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e5ab1dcb06669a31ebabc3e63609c7c26f69246b855cc653dd9ef7e33657817
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0b2a69adca1463351b69368d25a268701f4b4da518acb587bddfef084570a7d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.6820012787723785,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-1748",
4
- "epoch": 20.0,
5
  "eval_steps": 500,
6
- "global_step": 1840,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -313,6 +313,22 @@
313
  "eval_samples_per_second": 12.561,
314
  "eval_steps_per_second": 3.14,
315
  "step": 1840
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
316
  }
317
  ],
318
  "logging_steps": 100,
@@ -332,7 +348,7 @@
332
  "attributes": {}
333
  }
334
  },
335
- "total_flos": 1.263208741236e+16,
336
  "train_batch_size": 4,
337
  "trial_name": null,
338
  "trial_params": null
 
1
  {
2
  "best_metric": 0.6820012787723785,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-1748",
4
+ "epoch": 21.0,
5
  "eval_steps": 500,
6
+ "global_step": 1932,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
313
  "eval_samples_per_second": 12.561,
314
  "eval_steps_per_second": 3.14,
315
  "step": 1840
316
+ },
317
+ {
318
+ "epoch": 20.652173913043477,
319
+ "grad_norm": 0.002304959110915661,
320
+ "learning_rate": 3.864734299516908e-06,
321
+ "loss": 0.031,
322
+ "step": 1900
323
+ },
324
+ {
325
+ "epoch": 21.0,
326
+ "eval_f1": 0.6777883740084095,
327
+ "eval_loss": 3.6255407333374023,
328
+ "eval_runtime": 7.3281,
329
+ "eval_samples_per_second": 12.554,
330
+ "eval_steps_per_second": 3.139,
331
+ "step": 1932
332
  }
333
  ],
334
  "logging_steps": 100,
 
348
  "attributes": {}
349
  }
350
  },
351
+ "total_flos": 1.3263691782978e+16,
352
  "train_batch_size": 4,
353
  "trial_name": null,
354
  "trial_params": null