Adding more results
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- params/phi/6/rnd_search_t_no_sched/comb_13/init/lm_head/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/lm_head/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_0.pt +3 -0
- params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt +3 -0
params/phi/6/rnd_search_t_no_sched/comb_13/init/lm_head/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/lm_head/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2cfe43065d8bfaa11d02e779b4f0ad1fa883d49250690762272b31171e2cfeb0
|
3 |
+
size 205955
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2650e41c1daa66d600d60fe60c09197ec8b5b426dd17dc4a6662da0fc35282c9
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bb8bb9614e10aedaa390b7e6824da8e343b5140e5db60fb7ee8c2d7abf824ed
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bdab8b91d69e909209ef2ceb856cc18c608f5ebf12e2d405211b8ee1a0b3dfc
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f468206a82a8c03bc97eb9ba0011f7e1e16cec926cd310f23b22f1d0eed59f97
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a7d6380248673be1f992e2194983c580aca5b0307b9be90b66ff87e19937cd0
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:608f3e892b2395ed442a1c37f646cec5028e808a97e920b786daf3edc819df5b
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d054a8f7351feea1e3e6c4267fa8517acb7847d107b57b867d4be14e83f64135
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7703ac67a2e797b918beaeff389a7dbdccff3239725260af3729626bb0f6964d
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b74aa77d8b9c229be0125d53f17e1e683875ff243e5efec40f1fc2785992c6bf
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b5ffcd94c6dd7b37a99da32d7151e18c67b09a1ac7623b0e157306caf7c1a3c
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1246a0920dae2d44f08db377143e09f67d2895121f30eec273f2f6ea67089c5
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d658f80ac5309c0a9606d43e88ca541bdd817c746b615744e39045549bc8823
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b61afbd271d9cec4615f33a8f7fccc2f48ba81d9df293586f10ac19f25b1e55a
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:661137ba385b76e1c9d4842e14e917ab7ab8f4c1d46d3b1b0a7e880e70bc26ce
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0c7917661f5fae0c97627bd911d3b19a3bf185400ba6c196a19501359f5ca29
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de7b970b27cac4831378e2641b9d550edd95cbb4cea47e7093396c4638605e60
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e193a206b23cd3d4a619a95d0281d4e452bdc498cc86fe0e35fb90f5a229d6f
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1804dec6ca2f14277027cd49a25ae3f44d8c5b8cbde30010efb9fa3f7356ccbe
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38c7d9df872a859d2bc292da68e3389c53753bd37c086e10db6235adb79db520
|
3 |
+
size 42115
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b084e89109608e566d4ca26247d62ef719d9ff55ccc7135bdefa43dad92ad4f
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64cf9f73fbb571059bf882078e0aae7cd4b963eb9b0259c8104ead0d974c4a28
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc9d0dd819b1edf0ffae6b46de480971380449b9730bc7a40a9fd4f3bd7a16b5
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acdfbe00f0a5655ef20a9808684eeb5fcd454179649c592f35011e3347449758
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_0.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2
|
3 |
+
size 11395
|
params/phi/6/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:163691d2bf0cb92dbe3b47a798dce50552bda23f7e2b4b8bebf4ca871b938231
|
3 |
+
size 11395
|