Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:645047f57abac43d8d993e1e1a2df86ba20a4a220024a11be907b15cd670b7ab
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:400e131d474439206381972812b72675da9bba3d960a979ccc7666baa56ee485
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ab43114e14a515ec8b39cf3d34a3895439345b5ec79ba001d8e5d998934630d
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab456d5bc6581e818bc7fb09825f70a4f334c3f299da1554d0bc312757294f2e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3adbc8c06b26c53c83d6b74eeb07f89919a253a937c1b8615c674a4323363c3a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3c3a59469eeb3b84ba20fd2e28792f69b07f4aa8bcfc38c50701071c6bbc083
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ecb4bcbad586be843a596caf1d2784caf0e85e9aeccedc6c707224bb8fe8574
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05a79d8be40d25258ce59d2e798163b74cca2de3d15f4f96d0e4a28170ecdffe
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7bf9fe78267a2f8f9cee478b398d8b110c33c1ac7c87640b3c6c76ab1508950
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d649e0a85ec9227bfce8e07196794fa618c54c4cdc8fa56b70d247ddfa344f4f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7762fc81aa5f7b2ca0acbdae55b4dd562d9c6517a374d1d8c3005b3e026f8341
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b6fd39bb09c0dec82505d75eebf6f6e38cbff2c745c4355c042c0466d738c31
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a26c5c646d2e66c363193b1be80c98935a3ccf276cf787bb47924aad571f03a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:527fcb4f38487e9d18849b03ef36721bfa36a317186a3ee58993a7f11d040e4c
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:897d1082a8695bfad407478c5858bb5b1f91de5d048d28ae04926e3cd0f0c992
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8fd8992c962d618cec301eb2820035f4228cb17008ef5ccafaf6ac3130d25d4a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75b01c8f9a379878f44889d4b9e981149e2e4450904e0c45ce52199eaa73b296
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09b58f8d4edcc96de6055cff64cf48739ab2fd787da0270fe3b67a0629be5924
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58c341e65440d50c70219e03c365612aeb2cd07850bb070ab94722af8156100f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a38078d517bd7fdbab4070582531004e62feba2573c6fc16d8bd4d11301bf34d
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:087e876d52012a40d35bcb3b61d8f0d9279ef2f39d14dac88103445dffa7e4c4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f501063bcb37d2dd5826e71a3ea4c794137777eda2adb76a916244a43b1a0ce4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ba26a1c0b8ad8a02cd42db09445743a1954baccf61d691b5291c90de50a787f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42fe49e81419131f9c724f9bf23a63319503db742d7276a2cf1737b19fffba6c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5a0236f9aae8f39e62e66c9c8eecc923fb3dfa1edb2d228ce56436c3b3f4a0b
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1d23a5f7493ae8bb670042c7106ebf316d1e6cca8cbfd5df1091a09fad67153
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2d206385b4389ecff16e0d16fd5e8ef6b26a587ab93b7030c8158e22c737696
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3f7d695158d2843305cd4c7ec645069569036291bee0109bba4e9b27ad06215
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cea78eaae5a87360f8309828f37fdce9e7c86bef69b8e722780179043340b168
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9adf110f25eed3b8875d127fc26cef758658fedb5d82262fff034c738cfd3cb
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87cd3f0492b14dce98c45c2f5a0709f388420d86bf4c4bbae538047cc7a9d1ea
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18cc3c6f821158b00c733edda0569b777517eba8120eabf31eaf892f8a15fabb
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2eba1b1d058ea2ee20db4d4236af5f722731159ce6f5acbb0704d28a107f314f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c80f083d2c93cabaf2dbb24cfca36cf35f90bede70ac9a2a539d591476680ec
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f30ac48e80bcafd3cbfb720200fc8fcfa9f896a56b879bf995673b077005758e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b49f1888f769e76a819b1b3479a5d6c4c14b851d81853ac205a6651c156d61e
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ccdd724a1113abc65ccad67c8826b5dbcac6f8024918bd52c2d1b96ddedd6c0
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1369dbc0f6253539ca9fa8c5ccbd466d9d0e846b94846e20cfd2db9495d314a0
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48a5a47133c2ecd030f5f437a5fec88f517396ee53c5a36e0bf8c501e60304fd
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95781d585a8fb2150414fe6507b98348a490b142d362a4f6f0ff347087c39d9b
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb04daa838b47a374828c4afd6aa6fa301a5864e1cbbc39cce81e70402d4fd9a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14ee582c7d0fe678dbb25502c2d49ab45eccc200998044151f684fdd8ec9a7c3
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09db76002b66968a57d560d5ce83999f365da7fd115262febc198cb00472d0b5
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75ce0b586f894898fbb6bbfe45fe92b62edad52c79f0b3db051970dc7fc21f53
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8e0982bc6bf953e11bce306aa9eb2b086ef21341f3a825ce57db834da2e36dc
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_16/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa0953e6b6b018c12371b2937ada65be6e164711b7de3b1cfed39a286dea177e
|
3 |
+
size 11395
|