ZeroUniqueness committed on
Commit
aa0242f
•
1 Parent(s): 7b65909

Training in progress, step 7400

Browse files
Files changed (25) hide show
  1. adapter_model.bin +1 -1
  2. {checkpoint-7000 → checkpoint-7300/adapter_model}/README.md +0 -0
  3. {checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_config.json +0 -0
  4. {checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_model.bin +1 -1
  5. {checkpoint-7000/adapter_model → checkpoint-7400}/README.md +0 -0
  6. {checkpoint-7000/adapter_model → checkpoint-7400}/adapter_config.json +0 -0
  7. {checkpoint-7000/adapter_model → checkpoint-7400}/adapter_model.bin +1 -1
  8. {checkpoint-7000 → checkpoint-7400}/optimizer.pt +1 -1
  9. {checkpoint-7000 → checkpoint-7400}/rng_state_0.pth +1 -1
  10. {checkpoint-7000 → checkpoint-7400}/rng_state_1.pth +1 -1
  11. {checkpoint-7000 → checkpoint-7400}/rng_state_10.pth +1 -1
  12. {checkpoint-7000 → checkpoint-7400}/rng_state_11.pth +1 -1
  13. {checkpoint-7000 → checkpoint-7400}/rng_state_12.pth +1 -1
  14. {checkpoint-7000 → checkpoint-7400}/rng_state_13.pth +1 -1
  15. {checkpoint-7000 → checkpoint-7400}/rng_state_2.pth +1 -1
  16. {checkpoint-7000 → checkpoint-7400}/rng_state_3.pth +1 -1
  17. {checkpoint-7000 → checkpoint-7400}/rng_state_4.pth +1 -1
  18. {checkpoint-7000 → checkpoint-7400}/rng_state_5.pth +1 -1
  19. {checkpoint-7000 → checkpoint-7400}/rng_state_6.pth +1 -1
  20. {checkpoint-7000 → checkpoint-7400}/rng_state_7.pth +1 -1
  21. {checkpoint-7000 → checkpoint-7400}/rng_state_8.pth +1 -1
  22. {checkpoint-7000 → checkpoint-7400}/rng_state_9.pth +1 -1
  23. {checkpoint-7000 → checkpoint-7400}/scheduler.pt +1 -1
  24. {checkpoint-7000 → checkpoint-7400}/trainer_state.json +99 -3
  25. {checkpoint-7000 → checkpoint-7400}/training_args.bin +0 -0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aae85b4318efc26db922c4214aefd89c824feffab65eaf0292127550a92cb40
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:993d2c02240ed3801ddacece59d263018042d38b315c16b83c4dac141857f97b
3
  size 500897101
{checkpoint-7000 → checkpoint-7300/adapter_model}/README.md RENAMED
File without changes
{checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_config.json RENAMED
File without changes
{checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:829e114ab5a9e821c62f695524a70db8ca49a86641b2859ce77fb48a06a52662
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aae85b4318efc26db922c4214aefd89c824feffab65eaf0292127550a92cb40
3
  size 500897101
{checkpoint-7000/adapter_model → checkpoint-7400}/README.md RENAMED
File without changes
{checkpoint-7000/adapter_model → checkpoint-7400}/adapter_config.json RENAMED
File without changes
{checkpoint-7000/adapter_model → checkpoint-7400}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:829e114ab5a9e821c62f695524a70db8ca49a86641b2859ce77fb48a06a52662
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:993d2c02240ed3801ddacece59d263018042d38b315c16b83c4dac141857f97b
3
  size 500897101
{checkpoint-7000 → checkpoint-7400}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a9f18d0ef7f096d1b7c973f10ec3ff7564492d5356b822823b9290813bd22af
3
  size 1001752701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5ac5841d6300001f54af872136a81e878a172b63fcdf912ced5de86015b3e27
3
  size 1001752701
{checkpoint-7000 → checkpoint-7400}/rng_state_0.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ffb463444805a626686fb368559bb528c8cad11a439e94e0669fbefa155f5a9
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3baf5ebf20ebf0458b7f556b1ed46afc501b40d8898ffabbab842d9757c22ace
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_1.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23a0c530aab0bbf04ce6a7cdc9a43f74cface45e607ab049dd048298af780c63
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcb43bb85439f18b615f2f71cf79f0c2e1281b44d62f3d40ae2b4ab32bfed6b6
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_10.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1729a7aa500d02af4fd9210e649b1e1990a9626a717d3df685f3e8d4bbd8972
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ae80861e273facc235ec70bbe5d5897cd7b8e6e7064d4329ebd0a0ab34e1d83
3
  size 27789
{checkpoint-7000 → checkpoint-7400}/rng_state_11.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19e5b4b85191400cd5e64e2f8237e15f18b8b594925371005270709c6fdead8f
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f6fe88b89271d4a3fa17461b406b6c31a71b39d5723c9bddfec471d0b453f52
3
  size 27789
{checkpoint-7000 → checkpoint-7400}/rng_state_12.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3b402b3eb4de19ff6a9f8883a5fcd04a43806b59a03e4efdc8bf4fb9e09b013
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ed06c69a78e8e7e71cef531884e74a692b1da2ec797510707214943cd99a6fa
3
  size 27789
{checkpoint-7000 → checkpoint-7400}/rng_state_13.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4fc3b0264037c6adeffe7738e3557c467ef0d8ed53839e47a410daf2fe89dca
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec128429973cc3bb99daaa414691d0aeab3f2d28aee2d016ae8f463e87b75303
3
  size 27789
{checkpoint-7000 → checkpoint-7400}/rng_state_2.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:010c3d33f4e3de2781a9f0ba558acdebc4c7141cfd907d61f3e048d2e7d39993
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e45af4ddead7ac0471e44bdb014890d3f531bc098ade5a3ab94e4f5c007daa14
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_3.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21817ffe90861ca50df336908db88de597bc45f8e09a83382b7c14f1fdacb1a7
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0726836b26d946d9ec17bbbfbed9fc3fb492a97e91e7991b6ab928fed4a42e2
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_4.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94aae1471cb561bdfae8fb9883b0a5cf60945ea0575bb647c07aa05ae3d4ac36
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7680747019af759345214a0de04c2e158d916ec42b26667797f489cb55c93074
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_5.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3f9bd490917bf4ae8dd3759559f6bd62286b84a1bf4861c8a1e987719cae69b
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:104035968b4a9d767346eeb077e90657b713ffc767eecaf4489cc350db37de17
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_6.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a072639d1100cd5b5b95d4b5e5ca774464ea41404ceeb55917b006dc3bcd0cf
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:376c584f7b44a727d446458afe9c9fb5c3b8c31c1f0b9e7689635a8cf4335021
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_7.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ee4287283869a9044a5fb4c2a9726e7e1f6ee58c3cb254a6f7d766de60a14a8
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8d4800aad8ec372345e6c696ae6bf61c09269149665d2aa4232991019c99fa5
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_8.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39077828ac43bedfceb19708273b4a740799cc80eb0725b8973a8ef021c0925e
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79c38e0f0a96baa9834ace5a5012a3f25863c8a6354659645637e9614927dcd8
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/rng_state_9.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b29f83ff1993eda2c6298d90ac20110f504235dc369af2574075117cf97cf573
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54c80796b044f5acabd3fa7243d13e4ec5f5acc43be402329b2d31af2e4c25d1
3
  size 27772
{checkpoint-7000 → checkpoint-7400}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78b2e1a7576f141a45b1812083ab858caaac51d2b76c32d2a01e78f578acf12e
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6741d217f31a08d86b6f339348ff73c807bdf74225de0696d612e4cc95a34759
3
  size 627
{checkpoint-7000 → checkpoint-7400}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.7142303218301667,
5
- "global_step": 7000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1718,11 +1718,107 @@
1718
  "eval_samples_per_second": 12.427,
1719
  "eval_steps_per_second": 0.902,
1720
  "step": 7000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1721
  }
1722
  ],
1723
  "max_steps": 7737,
1724
  "num_train_epochs": 3,
1725
- "total_flos": 3.0145536634921157e+19,
1726
  "trial_name": null,
1727
  "trial_params": null
1728
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.869329197363319,
5
+ "global_step": 7400,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1718
  "eval_samples_per_second": 12.427,
1719
  "eval_steps_per_second": 0.902,
1720
  "step": 7000
1721
+ },
1722
+ {
1723
+ "epoch": 2.72,
1724
+ "learning_rate": 4.160763312197513e-06,
1725
+ "loss": 0.7724,
1726
+ "step": 7025
1727
+ },
1728
+ {
1729
+ "epoch": 2.73,
1730
+ "learning_rate": 3.875573860006421e-06,
1731
+ "loss": 0.7696,
1732
+ "step": 7050
1733
+ },
1734
+ {
1735
+ "epoch": 2.74,
1736
+ "learning_rate": 3.6003152929641624e-06,
1737
+ "loss": 0.7625,
1738
+ "step": 7075
1739
+ },
1740
+ {
1741
+ "epoch": 2.75,
1742
+ "learning_rate": 3.335016048808437e-06,
1743
+ "loss": 0.7733,
1744
+ "step": 7100
1745
+ },
1746
+ {
1747
+ "epoch": 2.76,
1748
+ "learning_rate": 3.0797035363512193e-06,
1749
+ "loss": 0.7685,
1750
+ "step": 7125
1751
+ },
1752
+ {
1753
+ "epoch": 2.77,
1754
+ "learning_rate": 2.834404132647128e-06,
1755
+ "loss": 0.769,
1756
+ "step": 7150
1757
+ },
1758
+ {
1759
+ "epoch": 2.78,
1760
+ "learning_rate": 2.5991431802683262e-06,
1761
+ "loss": 0.7647,
1762
+ "step": 7175
1763
+ },
1764
+ {
1765
+ "epoch": 2.79,
1766
+ "learning_rate": 2.3739449846862826e-06,
1767
+ "loss": 0.7634,
1768
+ "step": 7200
1769
+ },
1770
+ {
1771
+ "epoch": 2.8,
1772
+ "learning_rate": 2.158832811760736e-06,
1773
+ "loss": 0.7617,
1774
+ "step": 7225
1775
+ },
1776
+ {
1777
+ "epoch": 2.81,
1778
+ "learning_rate": 1.95382888533604e-06,
1779
+ "loss": 0.768,
1780
+ "step": 7250
1781
+ },
1782
+ {
1783
+ "epoch": 2.82,
1784
+ "learning_rate": 1.7589543849450996e-06,
1785
+ "loss": 0.7712,
1786
+ "step": 7275
1787
+ },
1788
+ {
1789
+ "epoch": 2.83,
1790
+ "learning_rate": 1.5742294436213223e-06,
1791
+ "loss": 0.7703,
1792
+ "step": 7300
1793
+ },
1794
+ {
1795
+ "epoch": 2.84,
1796
+ "learning_rate": 1.3996731458185697e-06,
1797
+ "loss": 0.7618,
1798
+ "step": 7325
1799
+ },
1800
+ {
1801
+ "epoch": 2.85,
1802
+ "learning_rate": 1.2353035254395352e-06,
1803
+ "loss": 0.7767,
1804
+ "step": 7350
1805
+ },
1806
+ {
1807
+ "epoch": 2.86,
1808
+ "learning_rate": 1.0811375639725341e-06,
1809
+ "loss": 0.7659,
1810
+ "step": 7375
1811
+ },
1812
+ {
1813
+ "epoch": 2.87,
1814
+ "learning_rate": 9.371911887371965e-07,
1815
+ "loss": 0.774,
1816
+ "step": 7400
1817
  }
1818
  ],
1819
  "max_steps": 7737,
1820
  "num_train_epochs": 3,
1821
+ "total_flos": 3.1867824817039213e+19,
1822
  "trial_name": null,
1823
  "trial_params": null
1824
  }
{checkpoint-7000 → checkpoint-7400}/training_args.bin RENAMED
File without changes