cruiser commited on
Commit
c152c03
·
1 Parent(s): 8e7a1fb

Training in progress, epoch 6

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e1c223396647ec6cd656de23825a29d0b48e7604b035244b865ef38f29e3860
3
  size 535707205
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c0c1d1a95437c66f3b33782453ba953526f8464f92697184d90ab42e75da749
3
  size 535707205
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baa6af60d43b89da681db440da8a020b36a0b01e397bfdbfa5cadddbecad87e9
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01d5637896d55577cf0684e7637e84e8f4c33d9073c7e06191b4e34550d125b3
3
  size 267858605
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b791a681be555893dfbd95c23212b7e4bb4caeadabeaa1d70cda36c90dd2d59
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d1ef6c19d1da5881da2b52af355c48c53b4c2bfee4f7173b57bcdd9c9f982a1
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46401517fc71e91b2dd9b90629550fd134d44611879929c50967203772c36029
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54966d1ee4bd994df4b5052604ad6e750e8df78e56abd97418b5274aebd354c
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 1.614416241645813,
3
  "best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-6872",
4
- "epoch": 5.0,
5
- "global_step": 8590,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -158,11 +158,39 @@
158
  "eval_samples_per_second": 436.48,
159
  "eval_steps_per_second": 27.295,
160
  "step": 8590
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
161
  }
162
  ],
163
  "max_steps": 34360,
164
  "num_train_epochs": 20,
165
- "total_flos": 3910587551729100.0,
166
  "trial_name": null,
167
  "trial_params": null
168
  }
 
1
  {
2
  "best_metric": 1.614416241645813,
3
  "best_model_checkpoint": "distilbert_weight_decay_final_metrics/checkpoint-6872",
4
+ "epoch": 6.0,
5
+ "global_step": 10308,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
158
  "eval_samples_per_second": 436.48,
159
  "eval_steps_per_second": 27.295,
160
  "step": 8590
161
+ },
162
+ {
163
+ "epoch": 5.24,
164
+ "learning_rate": 1.4761350407450526e-05,
165
+ "loss": 0.0338,
166
+ "step": 9000
167
+ },
168
+ {
169
+ "epoch": 5.53,
170
+ "learning_rate": 1.4470314318975553e-05,
171
+ "loss": 0.0272,
172
+ "step": 9500
173
+ },
174
+ {
175
+ "epoch": 5.82,
176
+ "learning_rate": 1.4179278230500584e-05,
177
+ "loss": 0.0269,
178
+ "step": 10000
179
+ },
180
+ {
181
+ "epoch": 6.0,
182
+ "eval_accuracy": 0.7795698924731183,
183
+ "eval_f1": 0.7833736396261405,
184
+ "eval_loss": 1.8119807243347168,
185
+ "eval_runtime": 8.1074,
186
+ "eval_samples_per_second": 435.896,
187
+ "eval_steps_per_second": 27.259,
188
+ "step": 10308
189
  }
190
  ],
191
  "max_steps": 34360,
192
  "num_train_epochs": 20,
193
+ "total_flos": 4692705062074920.0,
194
  "trial_name": null,
195
  "trial_params": null
196
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baa6af60d43b89da681db440da8a020b36a0b01e397bfdbfa5cadddbecad87e9
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01d5637896d55577cf0684e7637e84e8f4c33d9073c7e06191b4e34550d125b3
3
  size 267858605
runs/May01_06-16-39_af1ffd0a72ec/events.out.tfevents.1682921804.af1ffd0a72ec.975.12 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70d0db1c3c0e3d580bd1448f2ac155ec3e8c5720747e83b0d871beb017d6700b
3
- size 8701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e68e8f757384349da25c9e530dcd72b5bc2f95b73c7e34539718bd1ad185d81
3
+ size 9541