BayesTensor committed on
Commit
7f54da4
·
verified ·
1 Parent(s): 31a1209

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b082d9f7f07aa3218c210cddb092957f01f3072c9ec6bf41b03953a6ec3da23d
3
  size 598442860
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2639907b39e9287fc30fb2f169b8b0719e332db07ffa1b53b1080a4e49447c90
3
  size 598442860
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ed1975b50a000839c6999b4cbd155ecd04a9bab206b47eb28bcff6fbf95376d
3
  size 1196973562
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ea202c16703886b5552b0170b5700a4d0c8dc6a0e9e5f0f8944c5e3dc82b4c0
3
  size 1196973562
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c062f7f375beded48b5337f5a3f3a5cb38807fa3e85dbf3e294c0ab6b627bfc2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9899ccda7f0d8d9511991180b93aab508ce6e8489de708c88ad1188e7e1d90d6
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f17bc159752e862802fb5566308be6d1ff306dc0599471317a224de8cb8930a4
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20da6727f873a83d1abd00f92a4cb1727d12d4e0e9bf6e453f25b70594840b9a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.2623751468860165,
3
- "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-276",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 276,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -48,6 +48,22 @@
48
  "eval_samples_per_second": 12.708,
49
  "eval_steps_per_second": 3.177,
50
  "step": 276
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  }
52
  ],
53
  "logging_steps": 100,
@@ -67,7 +83,7 @@
67
  "attributes": {}
68
  }
69
  },
70
- "total_flos": 1894813111854000.0,
71
  "train_batch_size": 4,
72
  "trial_name": null,
73
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.46725195094760313,
3
+ "best_model_checkpoint": "modernbert-medical-classifier/checkpoint-368",
4
+ "epoch": 4.0,
5
  "eval_steps": 500,
6
+ "global_step": 368,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
48
  "eval_samples_per_second": 12.708,
49
  "eval_steps_per_second": 3.177,
50
  "step": 276
51
+ },
52
+ {
53
+ "epoch": 3.260869565217391,
54
+ "grad_norm": 8.205018997192383,
55
+ "learning_rate": 1.932367149758454e-05,
56
+ "loss": 1.0924,
57
+ "step": 300
58
+ },
59
+ {
60
+ "epoch": 4.0,
61
+ "eval_f1": 0.46725195094760313,
62
+ "eval_loss": 0.9543380737304688,
63
+ "eval_runtime": 7.257,
64
+ "eval_samples_per_second": 12.677,
65
+ "eval_steps_per_second": 3.169,
66
+ "step": 368
67
  }
68
  ],
69
  "logging_steps": 100,
 
83
  "attributes": {}
84
  }
85
  },
86
+ "total_flos": 2526417482472000.0,
87
  "train_batch_size": 4,
88
  "trial_name": null,
89
  "trial_params": null