BayesTensor committed on
Commit
408be4e
·
verified ·
1 Parent(s): bb5ed48

Training in progress, epoch 23, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44fcdc2cfb219a2c3d6d06bb6b8f65f721af1da85763755c70ac45f1c76d0940
3
  size 598442860
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccaa285f634999614d76916fa26ad8586b367298697a9ba5d5674744d4bc4433
3
  size 598442860
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf7d32cb95a343ca2e2f6541c74e46395757dfb63b9b680af02fa19b05e27bce
3
  size 1196973562
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2897be83473030817c6ff78446c8bb0dfc829bb54d41c6eb71287e1885905e70
3
  size 1196973562
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a446f0425374fa045ac6c683a19a8525794cbf14fa7b3d3378d950e0a4a18370
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23c03a4de3b86963ec287522a2181427c3374e2dc539cb28bf29e0a8cece77ca
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2781561764a9942969e7875697d4ccf980e5e34725eac1719d27c20514c80f73
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:483f4ecfb311e0d8ab1c4c2d39a345ad988e3534065d1820a6f78e949cfb8296
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.685027729264332,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-2024",
4
- "epoch": 22.0,
5
  "eval_steps": 500,
6
- "global_step": 2024,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -345,6 +345,22 @@
345
  "eval_samples_per_second": 12.694,
346
  "eval_steps_per_second": 3.173,
347
  "step": 2024
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
348
  }
349
  ],
350
  "logging_steps": 100,
@@ -364,7 +380,7 @@
364
  "attributes": {}
365
  }
366
  },
367
- "total_flos": 1.3895296153596e+16,
368
  "train_batch_size": 4,
369
  "trial_name": null,
370
  "trial_params": null
 
1
  {
2
  "best_metric": 0.685027729264332,
3
  "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-2024",
4
+ "epoch": 23.0,
5
  "eval_steps": 500,
6
+ "global_step": 2116,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
345
  "eval_samples_per_second": 12.694,
346
  "eval_steps_per_second": 3.173,
347
  "step": 2024
348
+ },
349
+ {
350
+ "epoch": 22.82608695652174,
351
+ "grad_norm": 0.00998605228960514,
352
+ "learning_rate": 1.932367149758454e-06,
353
+ "loss": 0.0,
354
+ "step": 2100
355
+ },
356
+ {
357
+ "epoch": 23.0,
358
+ "eval_f1": 0.6675544814093237,
359
+ "eval_loss": 3.6375534534454346,
360
+ "eval_runtime": 7.3379,
361
+ "eval_samples_per_second": 12.538,
362
+ "eval_steps_per_second": 3.134,
363
+ "step": 2116
364
  }
365
  ],
366
  "logging_steps": 100,
 
380
  "attributes": {}
381
  }
382
  },
383
+ "total_flos": 1.4526900524214e+16,
384
  "train_batch_size": 4,
385
  "trial_name": null,
386
  "trial_params": null