Training in progress, step 3100, checkpoint

Browse files

Files changed (6) hide show

last-checkpoint/model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +69 -3
last-checkpoint/training_args.bin +1 -1

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4322cb52e7375952b1b7c62f67285f280a31e123ef3ec661fb690ab98ec4501d
 size 966995080

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d1c2e4ed987aee90e725ecff305fed01d3e4cec3c313446fbf4acd8456b8756
 size 966995080

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0c8b1e94006a0bd0b5433a91a8d0f2efb9acd8c8debe0a4db87187d4f3df0549
 size 1925064044

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d53577f76fdefe8556c65117e1ab17e94a9394b496e89807249258044e5ec7e
 size 1925064044

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aabc5988751cca3ac2633ffd4f8fdf9b2babdfb7020d9a25c5dd343ea5e806c4
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:b41d2e987cb5c78d26dab771fe721c2da517630b617af0cac6deeb8db36562a9
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7b8eb592d2fee38e792ebd9f77ad72aad42bb0e171607f9852785836391c11e4
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:1ea257fad0fa492e3a9fc46adc164d21d7f8ad016c3f3e68a0c6df4900fed1ab
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": 70.1955074875208,
   "best_model_checkpoint": "./whisper-it/checkpoint-300",
-  "epoch": 5.534351145038168,
   "eval_steps": 100,
-  "global_step": 2900,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -964,6 +964,72 @@
       "eval_steps_per_second": 0.116,
       "eval_wer": 157.52218524681086,
       "step": 2900
     }
   ],
   "logging_steps": 25,
@@ -971,7 +1037,7 @@
   "num_input_tokens_seen": 0,
   "num_train_epochs": 8,
   "save_steps": 100,
-  "total_flos": 2.67706246606848e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": 70.1955074875208,
   "best_model_checkpoint": "./whisper-it/checkpoint-300",
+  "epoch": 5.916030534351145,
   "eval_steps": 100,
+  "global_step": 3100,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.116,
       "eval_wer": 157.52218524681086,
       "step": 2900
+    },
+    {
+      "epoch": 5.58,
+      "learning_rate": 3.0885714285714284e-06,
+      "loss": 0.009,
+      "step": 2925
+    },
+    {
+      "epoch": 5.63,
+      "learning_rate": 3.0171428571428574e-06,
+      "loss": 0.0092,
+      "step": 2950
+    },
+    {
+      "epoch": 5.68,
+      "learning_rate": 2.945714285714286e-06,
+      "loss": 0.0086,
+      "step": 2975
+    },
+    {
+      "epoch": 5.73,
+      "learning_rate": 2.8742857142857146e-06,
+      "loss": 0.0076,
+      "step": 3000
+    },
+    {
+      "epoch": 5.73,
+      "eval_loss": 0.43520399928092957,
+      "eval_runtime": 1605.7035,
+      "eval_samples_per_second": 0.934,
+      "eval_steps_per_second": 0.117,
+      "eval_wer": 154.5410427066001,
+      "step": 3000
+    },
+    {
+      "epoch": 5.77,
+      "learning_rate": 2.802857142857143e-06,
+      "loss": 0.0089,
+      "step": 3025
+    },
+    {
+      "epoch": 5.82,
+      "learning_rate": 2.7314285714285714e-06,
+      "loss": 0.0074,
+      "step": 3050
+    },
+    {
+      "epoch": 5.87,
+      "learning_rate": 2.6600000000000004e-06,
+      "loss": 0.0084,
+      "step": 3075
+    },
+    {
+      "epoch": 5.92,
+      "learning_rate": 2.5885714285714285e-06,
+      "loss": 0.0089,
+      "step": 3100
+    },
+    {
+      "epoch": 5.92,
+      "eval_loss": 0.4393894076347351,
+      "eval_runtime": 1680.0289,
+      "eval_samples_per_second": 0.893,
+      "eval_steps_per_second": 0.112,
+      "eval_wer": 184.29007210205214,
+      "step": 3100
     }
   ],
   "logging_steps": 25,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 8,
   "save_steps": 100,
+  "total_flos": 2.86175712227328e+19,
   "trial_name": null,
   "trial_params": null
 }

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e2c92dac35d16dc814e0a1581e1901c1f2948813ba744cab88f1ca1434e0d291
 size 4856

 version https://git-lfs.github.com/spec/v1
+oid sha256:41aeb0de3cf3c068ad356f23e2a4d52e468d71a8f1523974035aff9cc867de12
 size 4856