BayesTensor committed on
Commit
1666697
·
verified ·
1 Parent(s): 8eb1f09

Training in progress, epoch 16, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fda8a3a0cfe96a5a51e15c0690d5e1c48857832e5d77678267e42e6fa3a1817f
3
  size 737722356
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:657ca3021e5b6baff883b9156c24a243272d9ecbbb03b48fafaad921c72c3310
3
  size 737722356
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9df2f5f97e9f862467508980e69acf0eb0956f6b4e75ecc2902800e27e088f7
3
  size 1475564538
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91959ee2247f551a280486183f80d9acc6e81bee811aba741ba2d237950de18b
3
  size 1475564538
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2971d2339194afcfd80aff922bc915204e0778014c7d2e047351d6f30e3bd3fc
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20616955913563c641cbdf6bd0c2164643c9c28e79d9473d76717848b530b4b5
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:091031ae22eb7d8dfa24111bac44553b71f40bb7016aeefd4960b0ea3e4c04a6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0098baefc5d839aa49a31b29141de8bb1790117b396c3d13f4b14674b6b436f2
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.2747629944426283,
3
  "best_model_checkpoint": "debertalarge-medical-classifier/checkpoint-366",
4
- "epoch": 15.0,
5
  "eval_steps": 500,
6
- "global_step": 2745,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -331,6 +331,29 @@
331
  "eval_samples_per_second": 7.047,
332
  "eval_steps_per_second": 3.524,
333
  "step": 2745
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
334
  }
335
  ],
336
  "logging_steps": 100,
@@ -350,7 +373,7 @@
350
  "attributes": {}
351
  }
352
  },
353
- "total_flos": 7315403653350000.0,
354
  "train_batch_size": 2,
355
  "trial_name": null,
356
  "trial_params": null
 
1
  {
2
  "best_metric": 0.2747629944426283,
3
  "best_model_checkpoint": "debertalarge-medical-classifier/checkpoint-366",
4
+ "epoch": 16.0,
5
  "eval_steps": 500,
6
+ "global_step": 2928,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
331
  "eval_samples_per_second": 7.047,
332
  "eval_steps_per_second": 3.524,
333
  "step": 2745
334
+ },
335
+ {
336
+ "epoch": 15.300546448087431,
337
+ "grad_norm": 4.447215557098389,
338
+ "learning_rate": 1.9398907103825135e-05,
339
+ "loss": 1.0086,
340
+ "step": 2800
341
+ },
342
+ {
343
+ "epoch": 15.846994535519126,
344
+ "grad_norm": 3.9617857933044434,
345
+ "learning_rate": 1.830601092896175e-05,
346
+ "loss": 1.0938,
347
+ "step": 2900
348
+ },
349
+ {
350
+ "epoch": 16.0,
351
+ "eval_f1": 0.2747629944426283,
352
+ "eval_loss": 1.1148039102554321,
353
+ "eval_runtime": 13.0531,
354
+ "eval_samples_per_second": 7.048,
355
+ "eval_steps_per_second": 3.524,
356
+ "step": 2928
357
  }
358
  ],
359
  "logging_steps": 100,
 
373
  "attributes": {}
374
  }
375
  },
376
+ "total_flos": 7803097230240000.0,
377
  "train_batch_size": 2,
378
  "trial_name": null,
379
  "trial_params": null