Add files using large-upload tool
Browse files- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=108M_maxstep=1160/flop_2.00e+17_step_587.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=108M_maxstep=1160/flop_4.00e+17_step_1172.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=149M_maxstep=27280/flop_1.28e+19_step_27300.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=149M_maxstep=27280/flop_6.40e+18_step_13651.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=15M_maxstep=240/flop_1.25e+16_step_254.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=15M_maxstep=240/flop_6.28e+15_step_128.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=36840/flop_1.28e+19_step_18423.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=36840/flop_2.56e+19_step_36844.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=560/flop_2.00e+17_step_288.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=560/flop_4.00e+17_step_575.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=28M_maxstep=2200/flop_1.00e+17_step_1109.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=28M_maxstep=2200/flop_2.00e+17_step_2217.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=11720/flop_1.28e+19_step_11723.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=11720/flop_6.40e+18_step_5862.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=2920/flop_1.60e+18_step_1466.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=2920/flop_3.20e+18_step_2930.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=37M_maxstep=1700/flop_1.00e+17_step_858.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=37M_maxstep=1700/flop_2.00e+17_step_1715.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=455M_maxstep=4460/flop_3.20e+18_step_2235.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=455M_maxstep=4460/flop_6.40e+18_step_4468.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=611M_maxstep=13280/flop_2.56e+19_step_13298.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=611M_maxstep=6640/flop_6.40e+18_step_3325.pt +2 -2
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=9M_maxstep=100/flop_3.12e+15_step_101.pt +3 -0
- dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=9M_maxstep=40/flop_3.12e+15_step_50.pt +3 -0
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=108M_maxstep=1160/flop_2.00e+17_step_587.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc85bd18709907e85e1a9600382819d480f6fa14dc84812daf7a817e9b1c44c8
|
| 3 |
+
size 563343738
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=108M_maxstep=1160/flop_4.00e+17_step_1172.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d82917abd18c7c80648d5b1fd7ddbe327c2a9dfc3a91ebdffb92512d0a07ed2d
|
| 3 |
+
size 563346627
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=149M_maxstep=27280/flop_1.28e+19_step_27300.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de1c3ac43db788f698bafb9a45e7c5939791c3a22d0fd40e76e9ced5148fec45
|
| 3 |
+
size 738704789
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=149M_maxstep=27280/flop_6.40e+18_step_13651.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5d9a19f4ae1e1e5207aa24e653afd99f986ef43e912d92e5530f50db75897f2
|
| 3 |
+
size 738701525
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=15M_maxstep=240/flop_1.25e+16_step_254.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d499c42bbdbd841a8d7efd0335ef9801b0c5b866f2f8fbe002158dc9e308485
|
| 3 |
+
size 107653147
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=15M_maxstep=240/flop_6.28e+15_step_128.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3816be56d761b1f9ca3a4c171e8fde7d0739871db0ed9ea05037c9b91828575b
|
| 3 |
+
size 107651995
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=36840/flop_1.28e+19_step_18423.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba00e0ee219de7cae91ad27571051ef0f3fdff95d1789b0b710d141e89dbb8af
|
| 3 |
+
size 1052003870
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=36840/flop_2.56e+19_step_36844.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d79d6e419894e31ee0d30fdb8107c9f4b4f65d88cda3d7381cf95b81a286ab4
|
| 3 |
+
size 1052007582
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=560/flop_2.00e+17_step_288.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cd2aa82323f66150aeb217afc7df0aa3a7b5fd99a185f7f6124c215c1b0b0f0c
|
| 3 |
+
size 1052003312
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=220M_maxstep=560/flop_4.00e+17_step_575.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea4638f2910b8322c5d7bb0e9aeaa6ee3f1bac38ff35ce6971a7170853d47f3a
|
| 3 |
+
size 1052007024
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=28M_maxstep=2200/flop_1.00e+17_step_1109.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:287f7335145c29a4e2fd4b3d7bdb8d185652618da425b7fa98bc86a76e426add
|
| 3 |
+
size 179380799
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=28M_maxstep=2200/flop_2.00e+17_step_2217.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d6749265606069e20e97b97acb38cbc37a5d6b9ff31cc20f8bd2a5495c5bd184
|
| 3 |
+
size 179382463
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=11720/flop_1.28e+19_step_11723.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4d78454468d3db7c6b68af7e647f50c2624172a21f07677077558e2d87118b3f
|
| 3 |
+
size 1595772900
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=11720/flop_6.40e+18_step_5862.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd393069ab4a01e3c8753e878aae42aec923318f093492658f0c54216c61127c
|
| 3 |
+
size 1595768499
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=2920/flop_1.60e+18_step_1466.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea9242adf84495f729f656d3bd0b1d3bc1d832ed3d0eb972306be51cc3b830f9
|
| 3 |
+
size 1595768499
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=347M_maxstep=2920/flop_3.20e+18_step_2930.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a051c42563dbf8c56f3ee81e55b5f695261ac529f867d541c85751e4b80fd5f
|
| 3 |
+
size 1595772595
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=37M_maxstep=1700/flop_1.00e+17_step_858.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3c1958d39b34d695d66defbb2bfdcd6d71ea2682d52d33085e301dfc8b18511a
|
| 3 |
+
size 225882413
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=37M_maxstep=1700/flop_2.00e+17_step_1715.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40dac0a093d157eda6c92badc3c6fe6bd0b52faee4974f29f286ead689470c5e
|
| 3 |
+
size 225884405
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=455M_maxstep=4460/flop_3.20e+18_step_2235.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:126615132f1999294b077bffde2b7544c700e2c4bed9eb170a66c626a1022c15
|
| 3 |
+
size 2048261653
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=455M_maxstep=4460/flop_6.40e+18_step_4468.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66aabb4b2dd9d7d411e5699b91062566c61ee2130cda726b3dad8d03dcb98439
|
| 3 |
+
size 2048266325
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=611M_maxstep=13280/flop_2.56e+19_step_13298.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02cb069a2d7a388890897800a68305875362b87769647cc871904dfe818fa1ba
|
| 3 |
+
size 2713751085
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=611M_maxstep=6640/flop_6.40e+18_step_3325.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3b4c5935850f10e094046dd823cda49f8a1e2b017c8e47af4cc10cb017e08591
|
| 3 |
+
size 2713746069
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=9M_maxstep=100/flop_3.12e+15_step_101.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa4588f4b31865147f4609ec44ce2309551fa7271e5be6558f895b991642ec96
|
| 3 |
+
size 71569151
|
dataset=rw/hparams=base_warmup=short_decay=chinchilla/params=9M_maxstep=40/flop_3.12e+15_step_50.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bd3b42aa36032da466428aa59ac5d5bdfdbd8faa0b156c97102cf3e4b3a8bf8
|
| 3 |
+
size 71569016
|