BayesTensor committed on
Commit
277fb62
·
verified ·
1 Parent(s): e7210ed

Training in progress, epoch 17, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:657ca3021e5b6baff883b9156c24a243272d9ecbbb03b48fafaad921c72c3310
3
  size 737722356
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47e2acf1a516b89ef3ac486410bd891b1eb4c2f07ff0811e7bedaf2c93821c60
3
  size 737722356
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91959ee2247f551a280486183f80d9acc6e81bee811aba741ba2d237950de18b
3
  size 1475564538
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6084d5e39532668a29a9a7adfc8f7e6d954178d10523bcc4bb14b505beebe42
3
  size 1475564538
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20616955913563c641cbdf6bd0c2164643c9c28e79d9473d76717848b530b4b5
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:177f4600c463df4ac0fab58eca4d20530489d85799600cbe5c332b74b2834cd3
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0098baefc5d839aa49a31b29141de8bb1790117b396c3d13f4b14674b6b436f2
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52d9926229eece8ee772f15833f4e38d9c72b87fe1d5554bff5cd38f9587a548
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.2747629944426283,
3
  "best_model_checkpoint": "debertalarge-medical-classifier/checkpoint-366",
4
- "epoch": 16.0,
5
  "eval_steps": 500,
6
- "global_step": 2928,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -354,6 +354,29 @@
354
  "eval_samples_per_second": 7.048,
355
  "eval_steps_per_second": 3.524,
356
  "step": 2928
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
357
  }
358
  ],
359
  "logging_steps": 100,
@@ -373,7 +396,7 @@
373
  "attributes": {}
374
  }
375
  },
376
- "total_flos": 7803097230240000.0,
377
  "train_batch_size": 2,
378
  "trial_name": null,
379
  "trial_params": null
 
1
  {
2
  "best_metric": 0.2747629944426283,
3
  "best_model_checkpoint": "debertalarge-medical-classifier/checkpoint-366",
4
+ "epoch": 17.0,
5
  "eval_steps": 500,
6
+ "global_step": 3111,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
354
  "eval_samples_per_second": 7.048,
355
  "eval_steps_per_second": 3.524,
356
  "step": 2928
357
+ },
358
+ {
359
+ "epoch": 16.39344262295082,
360
+ "grad_norm": 4.644863605499268,
361
+ "learning_rate": 1.721311475409836e-05,
362
+ "loss": 1.021,
363
+ "step": 3000
364
+ },
365
+ {
366
+ "epoch": 16.939890710382514,
367
+ "grad_norm": 4.022730827331543,
368
+ "learning_rate": 1.6120218579234975e-05,
369
+ "loss": 1.0961,
370
+ "step": 3100
371
+ },
372
+ {
373
+ "epoch": 17.0,
374
+ "eval_f1": 0.2747629944426283,
375
+ "eval_loss": 1.0970044136047363,
376
+ "eval_runtime": 13.0521,
377
+ "eval_samples_per_second": 7.049,
378
+ "eval_steps_per_second": 3.524,
379
+ "step": 3111
380
  }
381
  ],
382
  "logging_steps": 100,
 
396
  "attributes": {}
397
  }
398
  },
399
+ "total_flos": 8290790807130000.0,
400
  "train_batch_size": 2,
401
  "trial_name": null,
402
  "trial_params": null