ZeroUniqueness
commited on
Commit
β’
44b1d94
1
Parent(s):
7b2562e
Training in progress, step 7600
Browse files- adapter_model.bin +1 -1
- {checkpoint-7200 β checkpoint-7500/adapter_model}/README.md +0 -0
- {checkpoint-7200 β checkpoint-7500/adapter_model}/adapter_config.json +0 -0
- {checkpoint-7200 β checkpoint-7500/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-7200/adapter_model β checkpoint-7600}/README.md +0 -0
- {checkpoint-7200/adapter_model β checkpoint-7600}/adapter_config.json +0 -0
- {checkpoint-7200/adapter_model β checkpoint-7600}/adapter_model.bin +1 -1
- {checkpoint-7200 β checkpoint-7600}/optimizer.pt +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_0.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_1.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_10.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_11.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_12.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_13.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_2.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_3.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_4.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_5.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_6.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_7.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_8.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/rng_state_9.pth +1 -1
- {checkpoint-7200 β checkpoint-7600}/scheduler.pt +1 -1
- {checkpoint-7200 β checkpoint-7600}/trainer_state.json +99 -3
- {checkpoint-7200 β checkpoint-7600}/training_args.bin +0 -0
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5ab034d117a0225da8be2f42841fdd56781cdd412727c42b29659f8fe5e1326
|
3 |
size 500897101
|
{checkpoint-7200 β checkpoint-7500/adapter_model}/README.md
RENAMED
File without changes
|
{checkpoint-7200 β checkpoint-7500/adapter_model}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-7200 β checkpoint-7500/adapter_model}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:599a7200aa4c479d11103aabf574f030fbcfd8ec950c813b2ed33cb39a745288
|
3 |
size 500897101
|
{checkpoint-7200/adapter_model β checkpoint-7600}/README.md
RENAMED
File without changes
|
{checkpoint-7200/adapter_model β checkpoint-7600}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-7200/adapter_model β checkpoint-7600}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5ab034d117a0225da8be2f42841fdd56781cdd412727c42b29659f8fe5e1326
|
3 |
size 500897101
|
{checkpoint-7200 β checkpoint-7600}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1001752701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fb53c8a12296e035ec70bf89911c9255494b238ffbb8f9c7a06d814a5410c87
|
3 |
size 1001752701
|
{checkpoint-7200 β checkpoint-7600}/rng_state_0.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d92f7eabe45011214c515bfd61da30217ce7b19e595578b578aa64ad13935f7b
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_1.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8faed179788c5f007e70cd65b68283fb43b650dd4050572bbd5baf4bdcfbd924
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_10.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61d79bf1140d29880b77d5b59d675f6cde7b6f8b23df1963240456b4cab72a92
|
3 |
size 27789
|
{checkpoint-7200 β checkpoint-7600}/rng_state_11.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02ce5e6c819958cba78082c54dc07c058f44ad7e3529ad00f10d119ef3398e40
|
3 |
size 27789
|
{checkpoint-7200 β checkpoint-7600}/rng_state_12.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:707e4aefa7d3ce06c156b57c6d9066244c741a492606832c0bb2a2ec62ce93f7
|
3 |
size 27789
|
{checkpoint-7200 β checkpoint-7600}/rng_state_13.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c580d943a9c6477c835e2ef1177fc05e74400a0ecb8d1179ca11160dbf4f9e3f
|
3 |
size 27789
|
{checkpoint-7200 β checkpoint-7600}/rng_state_2.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3851048fcf00e460a46c0d0afa742a3479d7e22eff758002fb06f5fc4aff5360
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_3.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ad8fccbd226cbad25059f183dbac39878c755c6293504a7508201420371a326
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_4.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d169e4e502924fcdcd3c9029b7721729912abdfee723bf2f5b143e0c52278a80
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_5.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2e8219f1f38af388ccb00570e48d852630fd0033dc8f43c45d502afdc72c9cc
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_6.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4dbf4092b04aa8341ff54a7b4956a047bbc2f54e34818e66a07cba1653e5e641
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_7.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cee8814ccaee8c0d5e7262c51637788ae0940c5d3a963ac9add18e67c5a5167
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_8.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b2a094ab4a22bd185f1e49e29bfa15330df8c156a20b2a312cfefc754be4779
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/rng_state_9.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1954ff78ec289ceaa33bdc7771b54e14618e8faecc5fba2fdda2fdc84a132170
|
3 |
size 27772
|
{checkpoint-7200 β checkpoint-7600}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7eb86c35d079e8a2b93e9e3d96c274a24bb1cdec7682fa038d76297f663d7cf
|
3 |
size 627
|
{checkpoint-7200 β checkpoint-7600}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -1766,11 +1766,107 @@
|
|
1766 |
"learning_rate": 2.3739449846862826e-06,
|
1767 |
"loss": 0.7634,
|
1768 |
"step": 7200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1769 |
}
|
1770 |
],
|
1771 |
"max_steps": 7737,
|
1772 |
"num_train_epochs": 3,
|
1773 |
-
"total_flos": 3.
|
1774 |
"trial_name": null,
|
1775 |
"trial_params": null
|
1776 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.9468786351298952,
|
5 |
+
"global_step": 7600,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
1766 |
"learning_rate": 2.3739449846862826e-06,
|
1767 |
"loss": 0.7634,
|
1768 |
"step": 7200
|
1769 |
+
},
|
1770 |
+
{
|
1771 |
+
"epoch": 2.8,
|
1772 |
+
"learning_rate": 2.158832811760736e-06,
|
1773 |
+
"loss": 0.7617,
|
1774 |
+
"step": 7225
|
1775 |
+
},
|
1776 |
+
{
|
1777 |
+
"epoch": 2.81,
|
1778 |
+
"learning_rate": 1.95382888533604e-06,
|
1779 |
+
"loss": 0.768,
|
1780 |
+
"step": 7250
|
1781 |
+
},
|
1782 |
+
{
|
1783 |
+
"epoch": 2.82,
|
1784 |
+
"learning_rate": 1.7589543849450996e-06,
|
1785 |
+
"loss": 0.7712,
|
1786 |
+
"step": 7275
|
1787 |
+
},
|
1788 |
+
{
|
1789 |
+
"epoch": 2.83,
|
1790 |
+
"learning_rate": 1.5742294436213223e-06,
|
1791 |
+
"loss": 0.7703,
|
1792 |
+
"step": 7300
|
1793 |
+
},
|
1794 |
+
{
|
1795 |
+
"epoch": 2.84,
|
1796 |
+
"learning_rate": 1.3996731458185697e-06,
|
1797 |
+
"loss": 0.7618,
|
1798 |
+
"step": 7325
|
1799 |
+
},
|
1800 |
+
{
|
1801 |
+
"epoch": 2.85,
|
1802 |
+
"learning_rate": 1.2353035254395352e-06,
|
1803 |
+
"loss": 0.7767,
|
1804 |
+
"step": 7350
|
1805 |
+
},
|
1806 |
+
{
|
1807 |
+
"epoch": 2.86,
|
1808 |
+
"learning_rate": 1.0811375639725341e-06,
|
1809 |
+
"loss": 0.7659,
|
1810 |
+
"step": 7375
|
1811 |
+
},
|
1812 |
+
{
|
1813 |
+
"epoch": 2.87,
|
1814 |
+
"learning_rate": 9.371911887371965e-07,
|
1815 |
+
"loss": 0.774,
|
1816 |
+
"step": 7400
|
1817 |
+
},
|
1818 |
+
{
|
1819 |
+
"epoch": 2.88,
|
1820 |
+
"learning_rate": 8.034792712388828e-07,
|
1821 |
+
"loss": 0.7658,
|
1822 |
+
"step": 7425
|
1823 |
+
},
|
1824 |
+
{
|
1825 |
+
"epoch": 2.89,
|
1826 |
+
"learning_rate": 6.800156256323243e-07,
|
1827 |
+
"loss": 0.7626,
|
1828 |
+
"step": 7450
|
1829 |
+
},
|
1830 |
+
{
|
1831 |
+
"epoch": 2.9,
|
1832 |
+
"learning_rate": 5.6681300729442e-07,
|
1833 |
+
"loss": 0.7744,
|
1834 |
+
"step": 7475
|
1835 |
+
},
|
1836 |
+
{
|
1837 |
+
"epoch": 2.91,
|
1838 |
+
"learning_rate": 4.6388311150644683e-07,
|
1839 |
+
"loss": 0.7768,
|
1840 |
+
"step": 7500
|
1841 |
+
},
|
1842 |
+
{
|
1843 |
+
"epoch": 2.92,
|
1844 |
+
"learning_rate": 3.712365722457922e-07,
|
1845 |
+
"loss": 0.7653,
|
1846 |
+
"step": 7525
|
1847 |
+
},
|
1848 |
+
{
|
1849 |
+
"epoch": 2.93,
|
1850 |
+
"learning_rate": 2.888829610873112e-07,
|
1851 |
+
"loss": 0.7675,
|
1852 |
+
"step": 7550
|
1853 |
+
},
|
1854 |
+
{
|
1855 |
+
"epoch": 2.94,
|
1856 |
+
"learning_rate": 2.168307862144725e-07,
|
1857 |
+
"loss": 0.7727,
|
1858 |
+
"step": 7575
|
1859 |
+
},
|
1860 |
+
{
|
1861 |
+
"epoch": 2.95,
|
1862 |
+
"learning_rate": 1.5508749154037327e-07,
|
1863 |
+
"loss": 0.7712,
|
1864 |
+
"step": 7600
|
1865 |
}
|
1866 |
],
|
1867 |
"max_steps": 7737,
|
1868 |
"num_train_epochs": 3,
|
1869 |
+
"total_flos": 3.2730387222263497e+19,
|
1870 |
"trial_name": null,
|
1871 |
"trial_params": null
|
1872 |
}
|
{checkpoint-7200 β checkpoint-7600}/training_args.bin
RENAMED
File without changes
|