Training in progress, step 900, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0798aea0ea2601e4960663935fa97da490cf86178204f31bf0ed2460a4c1275a
 size 109069176

 version https://git-lfs.github.com/spec/v1
+oid sha256:8cbcd9310e10d5fe993b5cf333d88aae96e554801b55f9a8223e27e60cbd5ee7
 size 109069176

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b20acc8c2819b5238fc1968b8d432b732f623548f82ab694b4ebbabb55974942
 size 218182650

 version https://git-lfs.github.com/spec/v1
+oid sha256:27dd51826701f4f4caf7650fd69a5e61f897e08b55abc61a1a1af22c824d7a70
 size 218182650

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:799585410cb48cfae2f789d2ae91c06eb6aa0b91dbbd43b4a7d3a3b3448266dc
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:fdf88252bee8ee3fad27d73acc6775e5c54e36b432cba2ce38bd28d90a91cedc
 size 15920

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:73a76caeeb6399337d47bab4ebb168d6f60ae74361a415444a8e490366d03706
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:41e967c2ecc8fedac9e0009a302b7be7b77330e19189247194492952af17ea64
 size 15920

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:06ebbd589aa551ebe217b92a81b1199984cb4118d028495561fb7b19c201549f
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:66a8969a338902975b0c4c705afc719c7c7b10b35ea13c9c67faffb439307f43
 size 15920

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:84c1c6c5271cfaf6419b5a12231eb5d7600d7b42ef8c3bd0ff7dde7c75cefbaf
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:8196d74df85addf8f6045699aed4bb233236ff60e0fc4a401041aedc4272b347
 size 15920

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:220694a8a21316fb5495170fa14c9ab96f29551ca78215f11476de1f24e9c350
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:03a4c643870f71e5714f51cca20015821a04ab9ad622a0412916ee78037f3515
 size 15920

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fad915d890a280310c92a5d19f0fde015486a9c1d34abcbeaa4bf2e4e71d1fb5
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:794ce6be94cae7a6fbdda053c500122338e8c247918fbe8eb826684e5bd3ca24
 size 15920

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8dbbfa09bb18061b9f644197b93813100b6fe337d1917f4dc506c498674d7ff8
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:e5ca5a1485292bda09ae1ddd0869d5b7f3aa39d96a8386b1e8f008804f4026e8
 size 15920

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:654da67a15b5302e79b90f93fddb5fa6b1c1256c8d14ba5597acfc2cb0e4c564
 size 15920

 version https://git-lfs.github.com/spec/v1
+oid sha256:df39b202ceea5786d852b9d29b95d90e78cf3ccd25f2d593dfc4b4c2a64d2ca2
 size 15920

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a2f55da614670472de86d5296be3e0d18a3a22605c545bf5c0c35d23ec73b3c8
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:647afc85c56b5d55d82459efd014f4044d90b731c734f1c96dfdd388b51e583f
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.0,
   "eval_steps": 100,
-  "global_step": 800,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -78,6 +78,14 @@
       "eval_samples_per_second": 9.354,
       "eval_steps_per_second": 0.292,
       "step": 800
     }
   ],
   "logging_steps": 500,
@@ -97,7 +105,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 1.1847107222280602e+18,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.25,
   "eval_steps": 100,
+  "global_step": 900,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 9.354,
       "eval_steps_per_second": 0.292,
       "step": 800
+    },
+    {
+      "epoch": 2.25,
+      "eval_loss": 0.012095152400434017,
+      "eval_runtime": 3.4203,
+      "eval_samples_per_second": 9.356,
+      "eval_steps_per_second": 0.292,
+      "step": 900
     }
   ],
   "logging_steps": 500,
       "attributes": {}
     }
   },
+  "total_flos": 1.3327995625065677e+18,
   "train_batch_size": 4,
   "trial_name": null,
   "trial_params": null