ZeroUniqueness
committed on
Commit
•
aa0242f
1
Parent(s):
7b65909
Training in progress, step 7400
Browse files
- adapter_model.bin +1 -1
- {checkpoint-7000 → checkpoint-7300/adapter_model}/README.md +0 -0
- {checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_config.json +0 -0
- {checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_model.bin +1 -1
- {checkpoint-7000/adapter_model → checkpoint-7400}/README.md +0 -0
- {checkpoint-7000/adapter_model → checkpoint-7400}/adapter_config.json +0 -0
- {checkpoint-7000/adapter_model → checkpoint-7400}/adapter_model.bin +1 -1
- {checkpoint-7000 → checkpoint-7400}/optimizer.pt +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_0.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_1.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_10.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_11.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_12.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_13.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_2.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_3.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_4.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_5.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_6.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_7.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_8.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/rng_state_9.pth +1 -1
- {checkpoint-7000 → checkpoint-7400}/scheduler.pt +1 -1
- {checkpoint-7000 → checkpoint-7400}/trainer_state.json +99 -3
- {checkpoint-7000 → checkpoint-7400}/training_args.bin +0 -0
adapter_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:993d2c02240ed3801ddacece59d263018042d38b315c16b83c4dac141857f97b
|
3 |
size 500897101
|
{checkpoint-7000 → checkpoint-7300/adapter_model}/README.md
RENAMED
File without changes
|
{checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-7000 → checkpoint-7300/adapter_model}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2aae85b4318efc26db922c4214aefd89c824feffab65eaf0292127550a92cb40
|
3 |
size 500897101
|
{checkpoint-7000/adapter_model → checkpoint-7400}/README.md
RENAMED
File without changes
|
{checkpoint-7000/adapter_model → checkpoint-7400}/adapter_config.json
RENAMED
File without changes
|
{checkpoint-7000/adapter_model → checkpoint-7400}/adapter_model.bin
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 500897101
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:993d2c02240ed3801ddacece59d263018042d38b315c16b83c4dac141857f97b
|
3 |
size 500897101
|
{checkpoint-7000 → checkpoint-7400}/optimizer.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1001752701
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5ac5841d6300001f54af872136a81e878a172b63fcdf912ced5de86015b3e27
|
3 |
size 1001752701
|
{checkpoint-7000 → checkpoint-7400}/rng_state_0.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3baf5ebf20ebf0458b7f556b1ed46afc501b40d8898ffabbab842d9757c22ace
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_1.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fcb43bb85439f18b615f2f71cf79f0c2e1281b44d62f3d40ae2b4ab32bfed6b6
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_10.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ae80861e273facc235ec70bbe5d5897cd7b8e6e7064d4329ebd0a0ab34e1d83
|
3 |
size 27789
|
{checkpoint-7000 → checkpoint-7400}/rng_state_11.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f6fe88b89271d4a3fa17461b406b6c31a71b39d5723c9bddfec471d0b453f52
|
3 |
size 27789
|
{checkpoint-7000 → checkpoint-7400}/rng_state_12.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ed06c69a78e8e7e71cef531884e74a692b1da2ec797510707214943cd99a6fa
|
3 |
size 27789
|
{checkpoint-7000 → checkpoint-7400}/rng_state_13.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27789
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec128429973cc3bb99daaa414691d0aeab3f2d28aee2d016ae8f463e87b75303
|
3 |
size 27789
|
{checkpoint-7000 → checkpoint-7400}/rng_state_2.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e45af4ddead7ac0471e44bdb014890d3f531bc098ade5a3ab94e4f5c007daa14
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_3.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0726836b26d946d9ec17bbbfbed9fc3fb492a97e91e7991b6ab928fed4a42e2
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_4.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7680747019af759345214a0de04c2e158d916ec42b26667797f489cb55c93074
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_5.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:104035968b4a9d767346eeb077e90657b713ffc767eecaf4489cc350db37de17
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_6.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:376c584f7b44a727d446458afe9c9fb5c3b8c31c1f0b9e7689635a8cf4335021
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_7.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8d4800aad8ec372345e6c696ae6bf61c09269149665d2aa4232991019c99fa5
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_8.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79c38e0f0a96baa9834ace5a5012a3f25863c8a6354659645637e9614927dcd8
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/rng_state_9.pth
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27772
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54c80796b044f5acabd3fa7243d13e4ec5f5acc43be402329b2d31af2e4c25d1
|
3 |
size 27772
|
{checkpoint-7000 → checkpoint-7400}/scheduler.pt
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6741d217f31a08d86b6f339348ff73c807bdf74225de0696d612e4cc95a34759
|
3 |
size 627
|
{checkpoint-7000 → checkpoint-7400}/trainer_state.json
RENAMED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -1718,11 +1718,107 @@
|
|
1718 |
"eval_samples_per_second": 12.427,
|
1719 |
"eval_steps_per_second": 0.902,
|
1720 |
"step": 7000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1721 |
}
|
1722 |
],
|
1723 |
"max_steps": 7737,
|
1724 |
"num_train_epochs": 3,
|
1725 |
-
"total_flos": 3.
|
1726 |
"trial_name": null,
|
1727 |
"trial_params": null
|
1728 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.869329197363319,
|
5 |
+
"global_step": 7400,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
1718 |
"eval_samples_per_second": 12.427,
|
1719 |
"eval_steps_per_second": 0.902,
|
1720 |
"step": 7000
|
1721 |
+
},
|
1722 |
+
{
|
1723 |
+
"epoch": 2.72,
|
1724 |
+
"learning_rate": 4.160763312197513e-06,
|
1725 |
+
"loss": 0.7724,
|
1726 |
+
"step": 7025
|
1727 |
+
},
|
1728 |
+
{
|
1729 |
+
"epoch": 2.73,
|
1730 |
+
"learning_rate": 3.875573860006421e-06,
|
1731 |
+
"loss": 0.7696,
|
1732 |
+
"step": 7050
|
1733 |
+
},
|
1734 |
+
{
|
1735 |
+
"epoch": 2.74,
|
1736 |
+
"learning_rate": 3.6003152929641624e-06,
|
1737 |
+
"loss": 0.7625,
|
1738 |
+
"step": 7075
|
1739 |
+
},
|
1740 |
+
{
|
1741 |
+
"epoch": 2.75,
|
1742 |
+
"learning_rate": 3.335016048808437e-06,
|
1743 |
+
"loss": 0.7733,
|
1744 |
+
"step": 7100
|
1745 |
+
},
|
1746 |
+
{
|
1747 |
+
"epoch": 2.76,
|
1748 |
+
"learning_rate": 3.0797035363512193e-06,
|
1749 |
+
"loss": 0.7685,
|
1750 |
+
"step": 7125
|
1751 |
+
},
|
1752 |
+
{
|
1753 |
+
"epoch": 2.77,
|
1754 |
+
"learning_rate": 2.834404132647128e-06,
|
1755 |
+
"loss": 0.769,
|
1756 |
+
"step": 7150
|
1757 |
+
},
|
1758 |
+
{
|
1759 |
+
"epoch": 2.78,
|
1760 |
+
"learning_rate": 2.5991431802683262e-06,
|
1761 |
+
"loss": 0.7647,
|
1762 |
+
"step": 7175
|
1763 |
+
},
|
1764 |
+
{
|
1765 |
+
"epoch": 2.79,
|
1766 |
+
"learning_rate": 2.3739449846862826e-06,
|
1767 |
+
"loss": 0.7634,
|
1768 |
+
"step": 7200
|
1769 |
+
},
|
1770 |
+
{
|
1771 |
+
"epoch": 2.8,
|
1772 |
+
"learning_rate": 2.158832811760736e-06,
|
1773 |
+
"loss": 0.7617,
|
1774 |
+
"step": 7225
|
1775 |
+
},
|
1776 |
+
{
|
1777 |
+
"epoch": 2.81,
|
1778 |
+
"learning_rate": 1.95382888533604e-06,
|
1779 |
+
"loss": 0.768,
|
1780 |
+
"step": 7250
|
1781 |
+
},
|
1782 |
+
{
|
1783 |
+
"epoch": 2.82,
|
1784 |
+
"learning_rate": 1.7589543849450996e-06,
|
1785 |
+
"loss": 0.7712,
|
1786 |
+
"step": 7275
|
1787 |
+
},
|
1788 |
+
{
|
1789 |
+
"epoch": 2.83,
|
1790 |
+
"learning_rate": 1.5742294436213223e-06,
|
1791 |
+
"loss": 0.7703,
|
1792 |
+
"step": 7300
|
1793 |
+
},
|
1794 |
+
{
|
1795 |
+
"epoch": 2.84,
|
1796 |
+
"learning_rate": 1.3996731458185697e-06,
|
1797 |
+
"loss": 0.7618,
|
1798 |
+
"step": 7325
|
1799 |
+
},
|
1800 |
+
{
|
1801 |
+
"epoch": 2.85,
|
1802 |
+
"learning_rate": 1.2353035254395352e-06,
|
1803 |
+
"loss": 0.7767,
|
1804 |
+
"step": 7350
|
1805 |
+
},
|
1806 |
+
{
|
1807 |
+
"epoch": 2.86,
|
1808 |
+
"learning_rate": 1.0811375639725341e-06,
|
1809 |
+
"loss": 0.7659,
|
1810 |
+
"step": 7375
|
1811 |
+
},
|
1812 |
+
{
|
1813 |
+
"epoch": 2.87,
|
1814 |
+
"learning_rate": 9.371911887371965e-07,
|
1815 |
+
"loss": 0.774,
|
1816 |
+
"step": 7400
|
1817 |
}
|
1818 |
],
|
1819 |
"max_steps": 7737,
|
1820 |
"num_train_epochs": 3,
|
1821 |
+
"total_flos": 3.1867824817039213e+19,
|
1822 |
"trial_name": null,
|
1823 |
"trial_params": null
|
1824 |
}
|
{checkpoint-7000 → checkpoint-7400}/training_args.bin
RENAMED
File without changes
|