Training in progress, step 524

Browse files

Files changed (7) hide show

adapter_model.bin +1 -1
last-checkpoint/adapter_model.bin +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +63 -3
runs/Jul30_21-45-15_04d48b04b124/events.out.tfevents.1690753519.04d48b04b124.12710.0 +2 -2

adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cb3c4343d5b79891e68e969b5db2e8b5a3bba2fc92883108865dd3097a7d1357
 size 3163457

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb3e39c69cf87ac8f88f27ce6f33ebc40816ea621b5669a014b039c0efc7f541
 size 3163457

last-checkpoint/adapter_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cb3c4343d5b79891e68e969b5db2e8b5a3bba2fc92883108865dd3097a7d1357
 size 3163457

 version https://git-lfs.github.com/spec/v1
+oid sha256:cb3e39c69cf87ac8f88f27ce6f33ebc40816ea621b5669a014b039c0efc7f541
 size 3163457

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e8901fba30f9688d20aa8e15379a7066e298045a8bb0b9de8851afdbe035d623
 size 6319689

 version https://git-lfs.github.com/spec/v1
+oid sha256:d687ffed6510ec1c76cffe4448a4eb5c5312677e63e6ba40479737f7ad1b8a7f
 size 6319689

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c5063f67e2c88884cab54e05296e5e83ac9a3c954c9e23cfb2d9a21a6c8d8e10
 size 14639

 version https://git-lfs.github.com/spec/v1
+oid sha256:6227a8020263fdf5f88e2d88cee5778418bbde4b0cf3767c692dc92f26c6f75d
 size 14639

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a55327b521b10efdd88cd32140805678860f8977b7eba62e5ac86192f50bb738
 size 627

 version https://git-lfs.github.com/spec/v1
+oid sha256:f0efecc10e44e390de6dc6bd5194bdbd19c81b879ba1d4cdb7a5e0d951d3f168
 size 627

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.1501432664756447,
-  "global_step": 262,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -72,11 +72,71 @@
       "learning_rate": 1.702005730659026e-05,
       "loss": 2.7529,
       "step": 260
     }
   ],
   "max_steps": 1745,
   "num_train_epochs": 1,
-  "total_flos": 487908402266112.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.3002865329512894,
+  "global_step": 524,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 1.702005730659026e-05,
       "loss": 2.7529,
       "step": 260
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 1.6722063037249286e-05,
+      "loss": 2.7147,
+      "step": 286
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 1.642406876790831e-05,
+      "loss": 2.695,
+      "step": 312
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 1.6137535816618913e-05,
+      "loss": 2.7071,
+      "step": 338
+    },
+    {
+      "epoch": 0.21,
+      "learning_rate": 1.583954154727794e-05,
+      "loss": 2.7039,
+      "step": 364
+    },
+    {
+      "epoch": 0.22,
+      "learning_rate": 1.5541547277936964e-05,
+      "loss": 2.7586,
+      "step": 390
+    },
+    {
+      "epoch": 0.24,
+      "learning_rate": 1.5243553008595991e-05,
+      "loss": 2.8132,
+      "step": 416
+    },
+    {
+      "epoch": 0.25,
+      "learning_rate": 1.495702005730659e-05,
+      "loss": 2.7552,
+      "step": 442
+    },
+    {
+      "epoch": 0.27,
+      "learning_rate": 1.4659025787965618e-05,
+      "loss": 2.7388,
+      "step": 468
+    },
+    {
+      "epoch": 0.28,
+      "learning_rate": 1.4361031518624645e-05,
+      "loss": 2.6576,
+      "step": 494
+    },
+    {
+      "epoch": 0.3,
+      "learning_rate": 1.4063037249283669e-05,
+      "loss": 2.6962,
+      "step": 520
     }
   ],
   "max_steps": 1745,
   "num_train_epochs": 1,
+  "total_flos": 975816804532224.0,
   "trial_name": null,
   "trial_params": null
 }

runs/Jul30_21-45-15_04d48b04b124/events.out.tfevents.1690753519.04d48b04b124.12710.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:862ab2bfec1ac04bfcc6c7b6745e05a9197bf0013e1824069f79c8e70bec11ee
-size 5915

 version https://git-lfs.github.com/spec/v1
+oid sha256:08b8b3fba46577efad57cda38fc4207645b4446372c05c26f20f746cc1d5014e
+size 7485