daydrill committed on
Commit
04fee03
1 Parent(s): 20f1907

Training in progress, step 4500

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0dbdc000392478004ae6d96779bf4278d1ef18251780930b9f3c799384f5bbf7
3
  size 880446181
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:296884f8588ae11c789462b9ab6e20c460d4c0f1b7b2d6b3806519e2be1cb1fa
3
  size 880446181
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:542d1e98b1496a58397fda14504ca6f3da4a82106acb16e6eafe2d17041fd830
3
  size 440235825
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce844822fcb696b8539ca3538ccdea01a77975cab4e2ec3196980e2dbe1c1ad4
3
  size 440235825
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a051295dd5bb8f79e33c3a2c94c1992b07d17d0b91ccf5450842b8cded54f3c
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66ec5ba0ff534ae4b578054646a37353be9d69d556d75ac7a2f52dbaffa0899a
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d93f82e70bcd6a3d62cba6e3e991ff9feff4305521c6596bf00d78e8721b10d1
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bd11ac4acb363f0f2dbf1363ac5864a6658c25a0462f1e1f627317732521b0c
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.41657987919183503,
5
- "global_step": 4000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -134,11 +134,27 @@
134
  "eval_samples_per_second": 91.858,
135
  "eval_steps_per_second": 11.485,
136
  "step": 4000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
137
  }
138
  ],
139
  "max_steps": 28806,
140
  "num_train_epochs": 3,
141
- "total_flos": 8361496215552000.0,
142
  "trial_name": null,
143
  "trial_params": null
144
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.4686523640908144,
5
+ "global_step": 4500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
134
  "eval_samples_per_second": 91.858,
135
  "eval_steps_per_second": 11.485,
136
  "step": 4000
137
+ },
138
+ {
139
+ "epoch": 0.47,
140
+ "learning_rate": 2.5313476359091858e-05,
141
+ "loss": 0.8031,
142
+ "step": 4500
143
+ },
144
+ {
145
+ "epoch": 0.47,
146
+ "eval_exact_match": 62.44131455399061,
147
+ "eval_f1": 66.50570614180938,
148
+ "eval_loss": 0.6731235980987549,
149
+ "eval_runtime": 154.5393,
150
+ "eval_samples_per_second": 91.918,
151
+ "eval_steps_per_second": 11.492,
152
+ "step": 4500
153
  }
154
  ],
155
  "max_steps": 28806,
156
  "num_train_epochs": 3,
157
+ "total_flos": 9406683242496000.0,
158
  "trial_name": null,
159
  "trial_params": null
160
  }
nbest_predictions.json CHANGED
The diff for this file is too large to render. See raw diff
 
predictions.json CHANGED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:542d1e98b1496a58397fda14504ca6f3da4a82106acb16e6eafe2d17041fd830
3
  size 440235825
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce844822fcb696b8539ca3538ccdea01a77975cab4e2ec3196980e2dbe1c1ad4
3
  size 440235825