ZeroUniqueness committed on
Commit
44b1d94
•
1 Parent(s): 7b2562e

Training in progress, step 7600

Browse files
Files changed (25) hide show
  1. adapter_model.bin +1 -1
  2. {checkpoint-7200 → checkpoint-7500/adapter_model}/README.md +0 -0
  3. {checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_config.json +0 -0
  4. {checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_model.bin +1 -1
  5. {checkpoint-7200/adapter_model → checkpoint-7600}/README.md +0 -0
  6. {checkpoint-7200/adapter_model → checkpoint-7600}/adapter_config.json +0 -0
  7. {checkpoint-7200/adapter_model → checkpoint-7600}/adapter_model.bin +1 -1
  8. {checkpoint-7200 → checkpoint-7600}/optimizer.pt +1 -1
  9. {checkpoint-7200 → checkpoint-7600}/rng_state_0.pth +1 -1
  10. {checkpoint-7200 → checkpoint-7600}/rng_state_1.pth +1 -1
  11. {checkpoint-7200 → checkpoint-7600}/rng_state_10.pth +1 -1
  12. {checkpoint-7200 → checkpoint-7600}/rng_state_11.pth +1 -1
  13. {checkpoint-7200 → checkpoint-7600}/rng_state_12.pth +1 -1
  14. {checkpoint-7200 → checkpoint-7600}/rng_state_13.pth +1 -1
  15. {checkpoint-7200 → checkpoint-7600}/rng_state_2.pth +1 -1
  16. {checkpoint-7200 → checkpoint-7600}/rng_state_3.pth +1 -1
  17. {checkpoint-7200 → checkpoint-7600}/rng_state_4.pth +1 -1
  18. {checkpoint-7200 → checkpoint-7600}/rng_state_5.pth +1 -1
  19. {checkpoint-7200 → checkpoint-7600}/rng_state_6.pth +1 -1
  20. {checkpoint-7200 → checkpoint-7600}/rng_state_7.pth +1 -1
  21. {checkpoint-7200 → checkpoint-7600}/rng_state_8.pth +1 -1
  22. {checkpoint-7200 → checkpoint-7600}/rng_state_9.pth +1 -1
  23. {checkpoint-7200 → checkpoint-7600}/scheduler.pt +1 -1
  24. {checkpoint-7200 → checkpoint-7600}/trainer_state.json +99 -3
  25. {checkpoint-7200 → checkpoint-7600}/training_args.bin +0 -0
adapter_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5ab034d117a0225da8be2f42841fdd56781cdd412727c42b29659f8fe5e1326
3
  size 500897101
{checkpoint-7200 → checkpoint-7500/adapter_model}/README.md RENAMED
File without changes
{checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_config.json RENAMED
File without changes
{checkpoint-7200 → checkpoint-7500/adapter_model}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4ed435f77b8aaa468d0a026e8247b6e75dcc7152deb57502bce336e2ea4128e
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
3
  size 500897101
{checkpoint-7200/adapter_model → checkpoint-7600}/README.md RENAMED
File without changes
{checkpoint-7200/adapter_model → checkpoint-7600}/adapter_config.json RENAMED
File without changes
{checkpoint-7200/adapter_model → checkpoint-7600}/adapter_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4ed435f77b8aaa468d0a026e8247b6e75dcc7152deb57502bce336e2ea4128e
3
  size 500897101
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5ab034d117a0225da8be2f42841fdd56781cdd412727c42b29659f8fe5e1326
3
  size 500897101
{checkpoint-7200 → checkpoint-7600}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58080885ae3c7e810fac9015f40f367426ce410c7f99ba7b48feda9529653b88
3
  size 1001752701
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fb53c8a12296e035ec70bf89911c9255494b238ffbb8f9c7a06d814a5410c87
3
  size 1001752701
{checkpoint-7200 → checkpoint-7600}/rng_state_0.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e78a8c7990f0b5fabbe6277b9b978a79ef9d902e28f476c9e2d7ad38be8f683c
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d92f7eabe45011214c515bfd61da30217ce7b19e595578b578aa64ad13935f7b
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_1.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7b8c7955910d1e491c12afee87720b150c2f84104325ab9c838c1295ee23834
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8faed179788c5f007e70cd65b68283fb43b650dd4050572bbd5baf4bdcfbd924
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_10.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b248c3f8c2f9ee32893e76f2912253473328a82703a9e9cf774a7ddf60d42191
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61d79bf1140d29880b77d5b59d675f6cde7b6f8b23df1963240456b4cab72a92
3
  size 27789
{checkpoint-7200 → checkpoint-7600}/rng_state_11.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80b4aace0601254c95160262eebbc86921bdf994e5b06ee7d3f592a180f3f4da
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02ce5e6c819958cba78082c54dc07c058f44ad7e3529ad00f10d119ef3398e40
3
  size 27789
{checkpoint-7200 → checkpoint-7600}/rng_state_12.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbfecac90c68b3c7960f23f0a5c624343b34de925fd36e8f1553794649032b92
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:707e4aefa7d3ce06c156b57c6d9066244c741a492606832c0bb2a2ec62ce93f7
3
  size 27789
{checkpoint-7200 → checkpoint-7600}/rng_state_13.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3aaab3904ce6b40c88c9ba5f75918dcc2286b14b28ff6f552b1e33426b307a4
3
  size 27789
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c580d943a9c6477c835e2ef1177fc05e74400a0ecb8d1179ca11160dbf4f9e3f
3
  size 27789
{checkpoint-7200 → checkpoint-7600}/rng_state_2.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7cea57a52a03e3e2ba53900bfa4f24480bd064ae5ee54082744c8d66479e3392
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3851048fcf00e460a46c0d0afa742a3479d7e22eff758002fb06f5fc4aff5360
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_3.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:183c5a8964dcebb4403f961f817d27e57f34a8aca9d588c50a976a55c7fd2dcc
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ad8fccbd226cbad25059f183dbac39878c755c6293504a7508201420371a326
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_4.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72dde9fbb9f6a3d30beec6e7a6a331f1c07cc41bc3e421c95d5fc51337163858
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d169e4e502924fcdcd3c9029b7721729912abdfee723bf2f5b143e0c52278a80
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_5.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:240e0b564b5f72f61c5e9bf130c09d6b7a884041c6817f283c0db8dce9514c6d
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2e8219f1f38af388ccb00570e48d852630fd0033dc8f43c45d502afdc72c9cc
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_6.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3e782243547e75d21ba55dd4adfc01fec8df179ac5853e510085d873d508172
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4dbf4092b04aa8341ff54a7b4956a047bbc2f54e34818e66a07cba1653e5e641
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_7.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a862e45bf9cf553270045d741a8187da4668bf889c171749a617824d14d63917
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cee8814ccaee8c0d5e7262c51637788ae0940c5d3a963ac9add18e67c5a5167
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_8.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e864e9ec63d970372488da3e89af0a1ea00e3da41e08446b93c1ddc621af475d
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b2a094ab4a22bd185f1e49e29bfa15330df8c156a20b2a312cfefc754be4779
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/rng_state_9.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d8cdcdaf9565ca7ffc01e41e6463d0c5d0aaca2ff165ca019aaa7bb751b870e
3
  size 27772
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1954ff78ec289ceaa33bdc7771b54e14618e8faecc5fba2fdda2fdc84a132170
3
  size 27772
{checkpoint-7200 → checkpoint-7600}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d125f3dfa4d0989c607da131ae73674dff5736961f5c5c505915b427cba21012
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7eb86c35d079e8a2b93e9e3d96c274a24bb1cdec7682fa038d76297f663d7cf
3
  size 627
{checkpoint-7200 → checkpoint-7600}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.791779759596743,
5
- "global_step": 7200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1766,11 +1766,107 @@
1766
  "learning_rate": 2.3739449846862826e-06,
1767
  "loss": 0.7634,
1768
  "step": 7200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1769
  }
1770
  ],
1771
  "max_steps": 7737,
1772
  "num_train_epochs": 3,
1773
- "total_flos": 3.100665541573791e+19,
1774
  "trial_name": null,
1775
  "trial_params": null
1776
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.9468786351298952,
5
+ "global_step": 7600,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1766
  "learning_rate": 2.3739449846862826e-06,
1767
  "loss": 0.7634,
1768
  "step": 7200
1769
+ },
1770
+ {
1771
+ "epoch": 2.8,
1772
+ "learning_rate": 2.158832811760736e-06,
1773
+ "loss": 0.7617,
1774
+ "step": 7225
1775
+ },
1776
+ {
1777
+ "epoch": 2.81,
1778
+ "learning_rate": 1.95382888533604e-06,
1779
+ "loss": 0.768,
1780
+ "step": 7250
1781
+ },
1782
+ {
1783
+ "epoch": 2.82,
1784
+ "learning_rate": 1.7589543849450996e-06,
1785
+ "loss": 0.7712,
1786
+ "step": 7275
1787
+ },
1788
+ {
1789
+ "epoch": 2.83,
1790
+ "learning_rate": 1.5742294436213223e-06,
1791
+ "loss": 0.7703,
1792
+ "step": 7300
1793
+ },
1794
+ {
1795
+ "epoch": 2.84,
1796
+ "learning_rate": 1.3996731458185697e-06,
1797
+ "loss": 0.7618,
1798
+ "step": 7325
1799
+ },
1800
+ {
1801
+ "epoch": 2.85,
1802
+ "learning_rate": 1.2353035254395352e-06,
1803
+ "loss": 0.7767,
1804
+ "step": 7350
1805
+ },
1806
+ {
1807
+ "epoch": 2.86,
1808
+ "learning_rate": 1.0811375639725341e-06,
1809
+ "loss": 0.7659,
1810
+ "step": 7375
1811
+ },
1812
+ {
1813
+ "epoch": 2.87,
1814
+ "learning_rate": 9.371911887371965e-07,
1815
+ "loss": 0.774,
1816
+ "step": 7400
1817
+ },
1818
+ {
1819
+ "epoch": 2.88,
1820
+ "learning_rate": 8.034792712388828e-07,
1821
+ "loss": 0.7658,
1822
+ "step": 7425
1823
+ },
1824
+ {
1825
+ "epoch": 2.89,
1826
+ "learning_rate": 6.800156256323243e-07,
1827
+ "loss": 0.7626,
1828
+ "step": 7450
1829
+ },
1830
+ {
1831
+ "epoch": 2.9,
1832
+ "learning_rate": 5.6681300729442e-07,
1833
+ "loss": 0.7744,
1834
+ "step": 7475
1835
+ },
1836
+ {
1837
+ "epoch": 2.91,
1838
+ "learning_rate": 4.6388311150644683e-07,
1839
+ "loss": 0.7768,
1840
+ "step": 7500
1841
+ },
1842
+ {
1843
+ "epoch": 2.92,
1844
+ "learning_rate": 3.712365722457922e-07,
1845
+ "loss": 0.7653,
1846
+ "step": 7525
1847
+ },
1848
+ {
1849
+ "epoch": 2.93,
1850
+ "learning_rate": 2.888829610873112e-07,
1851
+ "loss": 0.7675,
1852
+ "step": 7550
1853
+ },
1854
+ {
1855
+ "epoch": 2.94,
1856
+ "learning_rate": 2.168307862144725e-07,
1857
+ "loss": 0.7727,
1858
+ "step": 7575
1859
+ },
1860
+ {
1861
+ "epoch": 2.95,
1862
+ "learning_rate": 1.5508749154037327e-07,
1863
+ "loss": 0.7712,
1864
+ "step": 7600
1865
  }
1866
  ],
1867
  "max_steps": 7737,
1868
  "num_train_epochs": 3,
1869
+ "total_flos": 3.2730387222263497e+19,
1870
  "trial_name": null,
1871
  "trial_params": null
1872
  }
{checkpoint-7200 → checkpoint-7600}/training_args.bin RENAMED
File without changes