Training in progress, step 30000

Files changed (9) hide show

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:96afa5b935c4ba0d2f5a64c6c549d5cce4e378b683d7e5c0c4ec6ee8a7caa7b1
 size 943333453

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f3b5dbaaab2ff80c51aab2baf4b9611bddb09fa3492187cd0c4986ca1141032
 size 943333453

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bab3cb9aef35a7f62022e8366c00ec1553f006427b61616b2d9605a2064469f1
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:96429bbd5357a90f82f7fd61e1d44d34485eab7d138167bde3c41c27c7bd86a2
 size 471708325

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8ce17dd362010b9febb4c382825dfdcaf98b66d0f2a90b38a39446ca8e56c66a
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:78b2b81bf435885ea6240f0db616b814b3385f70f79a69209da25c250c62b15a
 size 14503

last-checkpoint/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c7d6ae114f124f82b43c783fc16b8f427729c24044a8a223ba79e1f91d66047
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed10c31fea80c2ece39edbebb48082a88208ed521f76de5c0a075b1acc6dcb0d
 size 559

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c019e460b0a3b004dbe486f597f54f4d81a353de840b5f0d23f56053d32e0dd3
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:2476364d95c8b4b965537ee7922cb55dcd03a38898d51c99d2f0db9b4afb3995
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8144383633046651,
-  "global_step": 25000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -86,11 +86,27 @@
       "eval_samples_per_second": 7.498,
       "eval_steps_per_second": 3.749,
       "step": 25000
     }
   ],
   "max_steps": 92088,
   "num_train_epochs": 3,
-  "total_flos": 5.51617572864e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.9773260359655981,
+  "global_step": 30000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 7.498,
       "eval_steps_per_second": 3.749,
       "step": 25000
+    },
+    {
+      "epoch": 0.98,
+      "learning_rate": 2.0232277821214492e-05,
+      "loss": 0.8913,
+      "step": 30000
+    },
+    {
+      "epoch": 0.98,
+      "eval_exact_match": 81.92488262910798,
+      "eval_f1": 85.96065424027016,
+      "eval_loss": 0.7569286227226257,
+      "eval_runtime": 1529.0019,
+      "eval_samples_per_second": 7.53,
+      "eval_steps_per_second": 3.765,
+      "step": 30000
     }
   ],
   "max_steps": 92088,
   "num_train_epochs": 3,
+  "total_flos": 6.619410874368e+16,
   "trial_name": null,
   "trial_params": null
 }

nbest_predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

predictions.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bab3cb9aef35a7f62022e8366c00ec1553f006427b61616b2d9605a2064469f1
 size 471708325

 version https://git-lfs.github.com/spec/v1
+oid sha256:96429bbd5357a90f82f7fd61e1d44d34485eab7d138167bde3c41c27c7bd86a2
 size 471708325