ZeroUniqueness committed on
Commit
7b2562e
•
1 Parent(s): aa0242f

Training in progress, step 7500

Browse files
Files changed (25) hide show
  1. adapter_model.bin +1 -1
  2. {checkpoint-7100 → checkpoint-7400/adapter_model}/README.md +0 -0
  3. {checkpoint-7100 → checkpoint-7400/adapter_model}/adapter_config.json +0 -0
  4. {checkpoint-7100 → checkpoint-7400/adapter_model}/adapter_model.bin +1 -1
  5. {checkpoint-7100/adapter_model → checkpoint-7500}/README.md +0 -0
  6. {checkpoint-7100/adapter_model → checkpoint-7500}/adapter_config.json +0 -0
  7. {checkpoint-7100/adapter_model → checkpoint-7500}/adapter_model.bin +1 -1
  8. {checkpoint-7100 → checkpoint-7500}/optimizer.pt +1 -1
  9. {checkpoint-7100 → checkpoint-7500}/rng_state_0.pth +1 -1
  10. {checkpoint-7100 → checkpoint-7500}/rng_state_1.pth +1 -1
  11. {checkpoint-7100 → checkpoint-7500}/rng_state_10.pth +1 -1
  12. {checkpoint-7100 → checkpoint-7500}/rng_state_11.pth +1 -1
  13. {checkpoint-7100 → checkpoint-7500}/rng_state_12.pth +1 -1
  14. {checkpoint-7100 → checkpoint-7500}/rng_state_13.pth +1 -1
  15. {checkpoint-7100 → checkpoint-7500}/rng_state_2.pth +1 -1
  16. {checkpoint-7100 → checkpoint-7500}/rng_state_3.pth +1 -1
  17. {checkpoint-7100 → checkpoint-7500}/rng_state_4.pth +1 -1
  18. {checkpoint-7100 → checkpoint-7500}/rng_state_5.pth +1 -1
  19. {checkpoint-7100 → checkpoint-7500}/rng_state_6.pth +1 -1
  20. {checkpoint-7100 → checkpoint-7500}/rng_state_7.pth +1 -1
  21. {checkpoint-7100 → checkpoint-7500}/rng_state_8.pth +1 -1
  22. {checkpoint-7100 → checkpoint-7500}/rng_state_9.pth +1 -1
  23. {checkpoint-7100 → checkpoint-7500}/scheduler.pt +1 -1
  24. {checkpoint-7100 → checkpoint-7500}/trainer_state.json +99 -3
  25. {checkpoint-7100 → checkpoint-7500}/training_args.bin +0 -0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:993d2c02240ed3801ddacece59d263018042d38b315c16b83c4dac141857f97b
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
3
  size 500897101
{checkpoint-7100 → checkpoint-7400/adapter_model}/README.md RENAMED
File without changes
{checkpoint-7100 → checkpoint-7400/adapter_model}/adapter_config.json RENAMED
File without changes
{checkpoint-7100 → checkpoint-7400/adapter_model}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7994cd2bdb16f74437b3f74bb9b30d22b607685dff2fbbddd6503caf3ecfc9c
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:993d2c02240ed3801ddacece59d263018042d38b315c16b83c4dac141857f97b
3
  size 500897101
{checkpoint-7100/adapter_model → checkpoint-7500}/README.md RENAMED
File without changes
{checkpoint-7100/adapter_model → checkpoint-7500}/adapter_config.json RENAMED
File without changes
{checkpoint-7100/adapter_model → checkpoint-7500}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7994cd2bdb16f74437b3f74bb9b30d22b607685dff2fbbddd6503caf3ecfc9c
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
3
  size 500897101
{checkpoint-7100 → checkpoint-7500}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:08bb8b622161de17af40582eb3ed678e87e25a018cf69b2de05646628dfca429
3
  size 1001752701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fbb0b5a10201f46c10a18c381ad9781e7f0c8efb247be7229f7b7a1d0f59669
3
  size 1001752701
{checkpoint-7100 → checkpoint-7500}/rng_state_0.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23c8a5bc289147cb5929165f36a3fc53769326cf76122f4e6c3653db9207d22b
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbda122ed6aeb142e9806e2c60595c0fb0345e050a46424ae7e6121a274bdf8f
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_1.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13d75987ce8c09a29b765dd85cdd96b7a9a16698e6e223be594288e44b77c0ef
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edfe82be00b7fdfa29bc639a42272a413c2f745e99a7dd4e7c019268bffb3c1c
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_10.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9194e62944ef0d0d95beb53e67dd3ad85f824a5c4c4367f1ae922d8f0252511a
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfbeff8b08e4ff89601ec54eda1fbaada8fa06897aded9396ba9e47eb6a98ac9
3
  size 27789
{checkpoint-7100 → checkpoint-7500}/rng_state_11.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8b2f0d2bdab9bb6a53039c3d6d49fe1efd65d83e7c14abc55131fd39c7a8087
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e488c693c827c1c1bc8761677e2e18ebf62ff097e6a8845c75725b08ee364123
3
  size 27789
{checkpoint-7100 → checkpoint-7500}/rng_state_12.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5afbd024ed5e83de312b869416218e006a8c440bcfa8eb583f35096bfb0c4720
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e177e7485bfc4621fd67465543e8b8af515ce3eb17dbc796a813aa9189ca2f
3
  size 27789
{checkpoint-7100 → checkpoint-7500}/rng_state_13.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0cab3d1d84a4ad05749470c8f5dc01e60bfcb95467f434ca95e7e4ea22f5d250
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d25a7d7bcfccc3ae06e04a8dd31e3a14472b8b1c02eeae89ff0b880b6032932
3
  size 27789
{checkpoint-7100 → checkpoint-7500}/rng_state_2.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97044b073aa474e262f429ff1b481848b303cc0cfb213657542fc577a8f0b9fd
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eae779e6cba58f785b1d5fb960336448e1e9e5fc24e9a8e12bca601df697886f
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_3.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:574b4b605f5956d0c7871af3ec3d18dbf8d8e7ed9b553e22b08e100a70e567fa
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1608635b1c766955f0811a53d4bd5951addb57bb03975fa838eda4e0ae41f71d
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_4.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:40164a2ca96b5ba33c934479558b3008f70a14394bc47f822b3d87cfe904a19e
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7941a1be97c26b733e1df942d0fd78e6aadc9a0e9eb0828e07b31662264008a
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_5.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5f952d85ac6565b75dbbb768259288b5b0dd464f3cb12806854d43d36838e07
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e298e6676cd57f41db105eaecc5bd07d4c75370e7d33e163ca2de445996b0d5e
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_6.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86c477a0ba385b263d319ebf01a2681a100d7e5c60aaec444e59be567c2e2eab
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:149cb26a6e8eca2a8f06334ca36fc633cc4ddf79e4509a782ff5cbe8d8e3dc8d
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_7.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dadf17ecf19fb0e7d5796316055a7f6a2ff58b559ee65fb247152209c0f58e0c
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0fdf62330e049e160395841276b2da25c8f736f4fabca874aa5b00ac0bdedf4
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_8.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54df0035f6989468f459c9adfac4aab9e79d3416ce505281cf38f0c89b6df8d0
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a4f0e9da27258f0f79f9d608144e718b994434a9d87531d3afba0531bb1e29f
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/rng_state_9.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:697f5513e941f30e44819a138ad4df97f3c4871e837c83e79cd6dcfa2561da90
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8a8b6af1d78ab083fc6250edfc937e9898abf345d67eb89a8a91af6cbca15e4
3
  size 27772
{checkpoint-7100 → checkpoint-7500}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28d2cff1b78513eaa3664c14381155eeb1b4cabe349547de751fa001fc41f348
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70dbbed2d23faf20ab6dcce74542b56e86868c5259dd618df042286187825260
3
  size 627
{checkpoint-7100 → checkpoint-7500}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.7530050407134548,
5
- "global_step": 7100,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1742,11 +1742,107 @@
1742
  "learning_rate": 3.335016048808437e-06,
1743
  "loss": 0.7733,
1744
  "step": 7100
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1745
  }
1746
  ],
1747
  "max_steps": 7737,
1748
  "num_train_epochs": 3,
1749
- "total_flos": 3.0575605849301975e+19,
1750
  "trial_name": null,
1751
  "trial_params": null
1752
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.908103916246607,
5
+ "global_step": 7500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1742
  "learning_rate": 3.335016048808437e-06,
1743
  "loss": 0.7733,
1744
  "step": 7100
1745
+ },
1746
+ {
1747
+ "epoch": 2.76,
1748
+ "learning_rate": 3.0797035363512193e-06,
1749
+ "loss": 0.7685,
1750
+ "step": 7125
1751
+ },
1752
+ {
1753
+ "epoch": 2.77,
1754
+ "learning_rate": 2.834404132647128e-06,
1755
+ "loss": 0.769,
1756
+ "step": 7150
1757
+ },
1758
+ {
1759
+ "epoch": 2.78,
1760
+ "learning_rate": 2.5991431802683262e-06,
1761
+ "loss": 0.7647,
1762
+ "step": 7175
1763
+ },
1764
+ {
1765
+ "epoch": 2.79,
1766
+ "learning_rate": 2.3739449846862826e-06,
1767
+ "loss": 0.7634,
1768
+ "step": 7200
1769
+ },
1770
+ {
1771
+ "epoch": 2.8,
1772
+ "learning_rate": 2.158832811760736e-06,
1773
+ "loss": 0.7617,
1774
+ "step": 7225
1775
+ },
1776
+ {
1777
+ "epoch": 2.81,
1778
+ "learning_rate": 1.95382888533604e-06,
1779
+ "loss": 0.768,
1780
+ "step": 7250
1781
+ },
1782
+ {
1783
+ "epoch": 2.82,
1784
+ "learning_rate": 1.7589543849450996e-06,
1785
+ "loss": 0.7712,
1786
+ "step": 7275
1787
+ },
1788
+ {
1789
+ "epoch": 2.83,
1790
+ "learning_rate": 1.5742294436213223e-06,
1791
+ "loss": 0.7703,
1792
+ "step": 7300
1793
+ },
1794
+ {
1795
+ "epoch": 2.84,
1796
+ "learning_rate": 1.3996731458185697e-06,
1797
+ "loss": 0.7618,
1798
+ "step": 7325
1799
+ },
1800
+ {
1801
+ "epoch": 2.85,
1802
+ "learning_rate": 1.2353035254395352e-06,
1803
+ "loss": 0.7767,
1804
+ "step": 7350
1805
+ },
1806
+ {
1807
+ "epoch": 2.86,
1808
+ "learning_rate": 1.0811375639725341e-06,
1809
+ "loss": 0.7659,
1810
+ "step": 7375
1811
+ },
1812
+ {
1813
+ "epoch": 2.87,
1814
+ "learning_rate": 9.371911887371965e-07,
1815
+ "loss": 0.774,
1816
+ "step": 7400
1817
+ },
1818
+ {
1819
+ "epoch": 2.88,
1820
+ "learning_rate": 8.034792712388828e-07,
1821
+ "loss": 0.7658,
1822
+ "step": 7425
1823
+ },
1824
+ {
1825
+ "epoch": 2.89,
1826
+ "learning_rate": 6.800156256323243e-07,
1827
+ "loss": 0.7626,
1828
+ "step": 7450
1829
+ },
1830
+ {
1831
+ "epoch": 2.9,
1832
+ "learning_rate": 5.6681300729442e-07,
1833
+ "loss": 0.7744,
1834
+ "step": 7475
1835
+ },
1836
+ {
1837
+ "epoch": 2.91,
1838
+ "learning_rate": 4.6388311150644683e-07,
1839
+ "loss": 0.7768,
1840
+ "step": 7500
1841
  }
1842
  ],
1843
  "max_steps": 7737,
1844
  "num_train_epochs": 3,
1845
+ "total_flos": 3.2299438278321373e+19,
1846
  "trial_name": null,
1847
  "trial_params": null
1848
  }
{checkpoint-7100 → checkpoint-7500}/training_args.bin RENAMED
File without changes