Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f38ca76a68848f07da7473f3885e85e24c3dfa5104c63dac0fe5d5c9cca1e7fa
|
3 |
+
size 205955
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6292fb9a98635e5227e35c108b53c33900b448d0104d9d3e3c62a4a3f3f30c
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82123af25587db72ee5beb2bd05580e40788efa75d190bf5e1bd2ae06a241362
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c079f929b63619db4e9c7dc27d76c63305e75cceb893ff5a06016e115125aad
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ea470fc7c92720d58dd9a68ff5ae4c7f48c55d86892e087db090fba71782f93
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ad65430629afed58d0cfa9a8675c7ab37821621e834764b65d1fc7f13f2aae4
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01a01894b302c470b521e8487e07a7897fdaca16cbbdccfe3bffe581a6c6a88f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7921d35e5695e0e13d1db3f623a18a81bbba79d9b7c1f032d36a820375ff76b1
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ea81c9154b08bfc8b00578f0c10012e13b70b9229caad4c2b10430585020264
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfb42fa290f85ae654e3ddd70bfeac36cddf28835e3c2d29e252594e8432329c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ad7c8fe6eda5212866d9d4e29066f25e99bd52ec13baf732bea371683716b2e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5730da20fc07bd579a63685e9c23decf61a941f4b3f4deae93c106ed5454239e
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ea1fc15646fba33fe51216e56f87af10bcddd92a1a84055fe43a48c01a8ee0c
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaf5e7682420201ab3bd03bcaf41fdce223c27110e08dbc13a62e1ce6bd21fab
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec44f0f630dc106254d94da16d51b6ca3e45bcc8241612f55b60383f2d4dcc06
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:618cd8c68938df11cd740f55dce843716603ec267107b6a559d5b36bcc55b09d
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ae4bd3b893e3aba095d2e94f87c1dc7f680646f04abb92e62fc1b31a88665c0
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e5ffdc054d7f7db12970da2b6d5f4c0408d6633dfc07a1e5ba75cb06881c19a
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d826cf4502891c55a7e3432f5fe163048ef20a0415a56fbf7b5cf1480dc88aa3
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50bdf9a6f5c2b9fa20026943506ad42a51047afb65c96971e919ee7ab6685264
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfe1a3c62be6d9537423e7aa934051643ff89b27141a13dce9a31b0e1402b485
|
3 |
+
size 42115
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b776484b654391c28e4b820f5dba07615893a88fa17d5a4e673fc864fd43d6b
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c64a4a177f948bd60322fd9cc13b1de9935deedff0b1d55b296863b0ebdaf74
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95b4ceeedaa3fa9d17855f87b7c35571440cfd63a59f9fa0b11f67383a71d19f
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:348fea5af2d8ca47560ada4cace0037abb297b6517ac6fc0e9145f819a676cf7
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f6fb16afb25d16991c879e56894769f46fde1177e3f497e5089942d6042cf25
|
3 |
+
size 11395
|