diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56d3dec0f3c31bd4252706d04d5fadd7cc4cac4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f38ca76a68848f07da7473f3885e85e24c3dfa5104c63dac0fe5d5c9cca1e7fa +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c4c945d86fb539ba8029bacc9b806c41c387dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a6292fb9a98635e5227e35c108b53c33900b448d0104d9d3e3c62a4a3f3f30c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..020d7ba2bb6e4e384d169e1897e2c9212a6f74e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82123af25587db72ee5beb2bd05580e40788efa75d190bf5e1bd2ae06a241362 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54140bf42fc4b2808867a1b83ca2dc43aca088f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c079f929b63619db4e9c7dc27d76c63305e75cceb893ff5a06016e115125aad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..339149aa06d762812db50155d4dd8b2a914f1b78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea470fc7c92720d58dd9a68ff5ae4c7f48c55d86892e087db090fba71782f93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ffd5bf8de0e3ee1fc64a78c759419d18bbc6820 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad65430629afed58d0cfa9a8675c7ab37821621e834764b65d1fc7f13f2aae4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..754b42f2fe886d25d89712bc070c339479d6ee35 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a01894b302c470b521e8487e07a7897fdaca16cbbdccfe3bffe581a6c6a88f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf07c9649bec0aaec5172dbcf58bed881067c43d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7921d35e5695e0e13d1db3f623a18a81bbba79d9b7c1f032d36a820375ff76b1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1250c91df7eeed04e00f7917867cccc699b66bd7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ea81c9154b08bfc8b00578f0c10012e13b70b9229caad4c2b10430585020264 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e97174af723b37796298150bb1555a8af599e0fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb42fa290f85ae654e3ddd70bfeac36cddf28835e3c2d29e252594e8432329c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c3c5c83ea91b7884c8ee60141c4723334322318 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ad7c8fe6eda5212866d9d4e29066f25e99bd52ec13baf732bea371683716b2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a2b7be7be1bead5bb9f45a9ce991f65b6e47e81 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5730da20fc07bd579a63685e9c23decf61a941f4b3f4deae93c106ed5454239e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a21c5a1a62e8801bdff842fcdf2e59a4f8111d1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ea1fc15646fba33fe51216e56f87af10bcddd92a1a84055fe43a48c01a8ee0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a5886db3d01dc1f211c8783589dc9151d402512 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf5e7682420201ab3bd03bcaf41fdce223c27110e08dbc13a62e1ce6bd21fab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c888130045a0f4b3defd325592ad1083fb3c6e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec44f0f630dc106254d94da16d51b6ca3e45bcc8241612f55b60383f2d4dcc06 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9db9fc1eb9336c7865ef2a8f50aa31bf0e9e18b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618cd8c68938df11cd740f55dce843716603ec267107b6a559d5b36bcc55b09d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..347c1586246e8a6d9dc6c03f8159fd20845aa61a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae4bd3b893e3aba095d2e94f87c1dc7f680646f04abb92e62fc1b31a88665c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b7ae786bd62a384e55136852fc7a0cbba010e0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e5ffdc054d7f7db12970da2b6d5f4c0408d6633dfc07a1e5ba75cb06881c19a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ba17e5ea21c14452239feb58efee0d2ec04878 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d826cf4502891c55a7e3432f5fe163048ef20a0415a56fbf7b5cf1480dc88aa3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e7ee5a623a70af6a4413e2bba9286174b171c18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bdf9a6f5c2b9fa20026943506ad42a51047afb65c96971e919ee7ab6685264 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6a2be8071517235c44843c792cb48bda8829d58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe1a3c62be6d9537423e7aa934051643ff89b27141a13dce9a31b0e1402b485 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a56d5ef841a782b7683b8045ba17846835bd2f4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b776484b654391c28e4b820f5dba07615893a88fa17d5a4e673fc864fd43d6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db418732998bfdae69b922846beb02fa37769678 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c64a4a177f948bd60322fd9cc13b1de9935deedff0b1d55b296863b0ebdaf74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6677a882abfc2cacb46bb76e22737b99e6bdc3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b4ceeedaa3fa9d17855f87b7c35571440cfd63a59f9fa0b11f67383a71d19f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17e3ae0d9f1c4ca6d4d321a67bebc5130b4826ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348fea5af2d8ca47560ada4cace0037abb297b6517ac6fc0e9145f819a676cf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cecf8466e4928f12bbb448dd683b3ea9137912cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6fb16afb25d16991c879e56894769f46fde1177e3f497e5089942d6042cf25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da1707867ecc69f75805d2099f61055dc9f0c563 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d6bd616f556cf8c1377902a9766b60e9277a74bc9be0eba25c35149a48f4cd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff06d537f50a7f8d7829d778a5216a7c1c15afa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59fc54b3e9a2c9b18b2f3989d131ec5c0f6f346bba10606ef504451a3dacbc79 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f7351caf7f2091de91a85f017d085a6ad98584 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c895232c2e08a61188998799904c5e5c012a600186e599b3aa5c194135629e1d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fdb5ef1d34c2cecb967ec0e79453c4d0cafaf67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7005d6e6ce383fc7477aa4a3cac26a7723d8e083e400ace08b4cfa23b7212192 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a9d95717b85c6d5bae55c29aa70acda1aa098b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb9e2754be4f68587b27c67c881618a6734991397b8db6b9ba71e44c04c0dea5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcbd59e60b9a57e3af1977d2eed7b0bfb34bd236 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f603c6ada3b5f727ac0d02f26796672f32e502347c472bc15fda4a092a28e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc4a6d9be567b2db9caf9b4745ba7596301831d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4fbb3b41fb300d97d34b5c69382709a819ade7ec399e24cf306870002e4888a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be354635a53a14007aa73472cfa8ed8c12a6f4bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d012cd6050180946928bbdf064f84ad6c16bb97e2bc2856a3932ba3a7dd9030 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d494839a01f6ee41f108913c36612445aff88d47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c9e541943303826a4ddcc4237cf902e66a877b6da9caf7866084451af85d05a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c03bb9f99732d729c4701bc2c06a2c112d2be89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc8ce8b64e24e1957a0698bbe143ca15f6840b55b6f3280ca62d45c4836c469 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4369b22ee4a23c667411bed880b8724913774a00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2648a3eee758933d4ea2816769b82191b32b75f4951fb3db0fa2abc90ba3cd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd4cc7f8f9864eb68aa601c6f86b0afe3c725902 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a34629f02142532968405062ba9be5611d083779e5ac8f742e1ff8a1e2d98e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20edcc00bc50fa88171eef4a36be8fcd358ca980 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:267376701d70bba2ab542aeccc0f16b7e7e2408e1594270f38161b0e0b8a5504 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e6290c127df889381c9e9f6c7c184b5cf507009 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fed75005086b6c7fb38f1cf17801755529d2527505c83a8dfb60e629f5e0fd1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a2aad1aa4d0dfb3fae8fbfe2e99042fbfc51389 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88dcc579ec6917fe39896a4319eadd6760abebb4d7371a0535b373cc00cbcb0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc974147b7e6cae83f4f1d2cd4fdb48b6c668594 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5b6c46af27775293a57a16e3f178897c43b992e016ffeaf183cc7bbd533727f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed275d76a42042fb3a23511cab06c12be447aee3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69cfd2bf2043ac1f2ab271c72838891793005fe8384041c8dbb13e045bad4f10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e8a6682c543c19ed8d847184e5942dcb051d338 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9199d621865dee5640605b890addbda76738918a80b163d2f2b57e6de0ccb52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcac3c3ef3ca57ccf7fdc5d3d5bb53ec35117ea6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6006326acccfb4d85565da7c1a579508cf09be0126b6c1f39d6a98857554ed7b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7118a3a69bb5ecc184410aefaab637cffea24e4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df494412deb3ab46bd88946530beda9dd03e9c48f730f15ad5c10846e0ec9e1a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..147ce2d07757790a0cbbc451caffa2e8a12ee8af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c90b808750145c42bf6c5e483c41982233c7bc291bee09c9cbd79c3969ec017 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..948b33d4c813e2b01c15d45e0b897161d7b8001d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd5c044cfe593ef7a634d5e037e2d794b1b9a2f1c3cfbe83fff72c69847f7ac7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d7dfd414d4dfce515e1268676a3516587c73587 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f59ec0f997dadeeafedc8e755f442712660d25936dfe90cda2e6218ef808fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..702a3a2b873f172c520d74e595421c84ce2a0510 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eef3856d3e85fcf69c0225a9adad73362302b006d1d0f1c6cb42c4e7ebdfae2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c0b296e7044f65293ed1b31511fee683b775408 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e6e671b848105b330bee4e8a64263335974d74d4a263004b09e83ef87e6c914 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee162b4283052c6794ed9e2da1da97e6a37f2541 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae0101942edd07017f03fd0397e2c7c6262cca98bd149cad8f811426794d69c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56e8dee68edae7ebdedd334048e900bd0e63aa82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abbcdbbf4e100cd96b793612b2b8944de153e15305f0ff597bebd5f01ce24df0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..956fe30350074e77d1fa34372187a6362ecd3857 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd9cb85db5bba8454917d443f0d056f78b5642739f190b56dcac6a82b011c9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c7472f10f8963eb0a5f78c4fc6ab06671458978 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89dc9c580258f2a68d059acec6b70b6a7028c561452454fa6f1ffe7bb27dc66d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f589e7cb602cd5c21b7b03cb612b208bb587080 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13cdeae7e6a48d6ba401e8e695a3ec0c5060b2233382dabd7d66c761c1c10cf1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb913d9e70c7886fb5b0005ee317a13e7c5ec71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90d3105d6b275685b316ceee95cbf93d6cbfae203dc0955dcbc9c77582a92560 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..213f8f5de22b1222be794397c2ff6725d4118a6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61cfa2a63a5ded38d8098e347bd64a743c418e0f7eb1b652ff8ad0db41bdfa84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ccbefd6aeccab989e990f76a3d6f642a113fc11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167efa9d59a0127064374e24ff85ece647b957202189a659631599202d194e4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9c5a4a6ae8161ca91cbde0a2a52e05c9cc85adf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f362e02f78ab47d4baa14a104ee9d54d335c0321c8145f238455128558633c7c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..024b684fdf978960798550fcb76c93febafd9a5d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b13c8b9740ace2825621b356f9c1fa38bc5e7fc419270f19fcc1e6c83fc179fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cc68dec5693fcba49795c99e180144faf4bbb95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:549e8cf776f15fce224eb4e1b1868571c1d23c5962ee7892f96f244cdf153fc1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ec0413dfb9ad69bb206a2c586fe699e61f1c46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79a22e59e0b841136e21b9698b4b4b257cd7a92932daa721ae65b02e04a2278 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1214068f4199d2d9cc4cbc20c6808a9ea4371e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e74a83b2317c81b6497c9639fb05b368dfd1091dc358cb41ad84df411786d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..922529d1e1af7e7c3d37893edf3dbdae55d23f18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b50c9082e7c279907dd060b0793f0dc6e2ee2615e7cf115c7424a54640f2ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b689fa73a062723816e74bf8296adb2d6a89169e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4450c221d8af3ba0b7d12f50d819a7846743e1089ce02d8b95105683f6bd6fac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df531feae7b94742779b3d6ccd20b6a63d54ab5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddfe97ad13728196900bd51f3c7718ea5beb5f318ce03bad0f60c411aafb540a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88e726edaa0120632effb65689aa16d37ece22f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2209fd62e72f5fd96d2c212ec6ad30ee62282a46784d837ba6cbf90ee9dc7a10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37941073b38387d6e699257ccb72653ecbe54b8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbea85d80fadf0cced3634167733ad446293fee17c347cf6bd5e7ef35d4863a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67dbfaf8a1d3664ded685c13c487d914b047c298 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3636155925214076e27888b567baac11185fc1df252b4094d801a92be4913f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21fea92c0733e80251ec986ec7d74da3a42eb47f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f1e18363b3f8025abefa610d34da303a7546f448815f9721a3c5a7ab5377d2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3135d7c31768c18412c30cb7602c34e9e1e208fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a035b7b4252deb5fcd0386aee9f0525de201c33acb2e0a082af8eb7de7878b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71456276a44cd261816623a7062a4b4303a66e88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5521f9d5f47e0dc42f3772882fd531ee46ae827ec8b3c3e5fb97d3a02ae0895 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5e771a6c640ac405b29b62c0b27b2422991d77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1096c94a7f6579c2cc6a818967a60ab729b53ba733069b7d9fcf7535a29654f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6559205d3ab8a65ec0cd11eabd146c080ce7fd54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8f4eaeebe96b98334941294c02187efd15e32c129c424ddda4e3fe46423f5b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45bcd1098b4844e60ce3980fbd172fa805eb4cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ec432a499b87dd53799968ed9d9c5fe9d162d261228908104b883b909823831 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7777cd671e1cc2150dc9185702867d1d1c2cc79e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa9e6f4ff14f37aaa923e085f680b6833ccd1e6db132a1e8e2fe18ba5cb1909 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..893c3ad7caf98d176f65dd0cf57c16fe36320fb8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3c367472f92465ff3f3d27d45f81493c598b646f1ca361e607318db0cb731d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b6587db286d6e4b1b6c9355bd5f8ffda34f722 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d758bdc7c5aca26016e5a08a88fbe8f65986120c22f857b933da3475e91e8c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b7dd1cc143722f7b2e6bd42423972afaf618b8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b0bf14e272085f0de05acef231b9f011424e51fdf25f31415050792c2c575a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e3623bdfa3e0bad5c44a1f547d8edc2e4d0901b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62d68347b1978caad5d96c47fcd1d476531ff6db24f521990355bc97a52b0cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08b7ac09c783d6353d8af42b20c763f7a93ea5cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0905fbee6c45bf6743ec0c8b779bd805e0624df443948bf313c9f914926a6c67 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de77525f4a8951ade813942c2c81c52d1f4fdfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b67f90432bf1e95078aac92f82357cbb8f3ea8b8dcf8aa36f17868b60762fae2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..067cb2503d64620692c6dcb75bd08ba6014938de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740943b7736fbc8cc3929d689c0314323f244ffce76a0f5570b91e00b74dd8bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5d73eb28524db6ab5a8a96a446b2916bb79f239 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51259f1d2709b76db57fa9eeafe634152cccc5377fda5a39232562e1e70c6ba1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9925b5577b4f0acd8ea8b7d1b5a21dd5c04a801e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27544a7d4e0a793ea6a748d6a8bf38ccb4ab67d54c1a2acaca00b5788651b819 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f82bd2c0619c819a805faf330af66d5f1d7b5d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ea6b629b7b5a1d9f329d24de8c0c890a61da3a834a216cf1124c03fef4244f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0b3c713c4804672bc9c04c4dfaac37d139c4b31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9cf0cea770d4c6068b520bdcd41ba1b7466bf66da3b58088b0ab2d7030a3fc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7261c57dfa0dc20eac2628f1b7c6e8d30b1757b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2104b81810febd4588cb7b5ff4e36e64f398b4d36e5092868427249be692cb7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c315f5dc92ac23eb0a319954a44576435bfa779a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ec37e1b53c992318ad83ad137aedc72f66a98ba208aed906c6b78e1cbf5d646 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec339e4c6d984ed7cb390fa34676f55cb3cac28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:412403dc7686c842f8d5c24f8b1de557f409c86bc0744ddd05354251a2a0de0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21306e4c2baa1e0ada7b1b1ce7966e8795feb15c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aaa0713d46bb9b85c7f807878a8b565a518bfd3db32e51c2d02bcb5d44ac28b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03f9f2df829d881364f9559262e3373abcfae6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ee68b65869c42e95e5eb9170c291fda957396212768a87d31ebae849e91242c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9748243e6358be182cbd540d3c0307d37f720e12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fc7bb4c4d71293cc356c7e0ac5ae9be4d83fcc3024ec8ee116826b7399a50bc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9afdf53d4134982116baaaad57a444977591c119 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b4152f5370182d34fcbde864568fd6b4949d5941b59ce79bf310ca1f4a0c1e6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5ea2ae3552ba240ca1b092e84eefae4d28abee6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4da10654dea60e70a4672688b02309fd78569f340a062757d1618c10f8d1c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df008ada321a9d640c5369d3e9dcfc1085847160 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68a089c415d55607e06ff5175a4317a7ce3ae0ccd8b1156fb607881098792f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d593d6274dfff0111f5fb7acd4504c86eabdf94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:553c8009624b156b1fbcd0d74fdcecd1499d2093aa4ea4e5d649096559d8f8de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d565a89f6190ce166741cb981f9ac1db3be8461e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12657a43ca38b97a8c0d23f20277e0c51ec0f6525f3fbe335b9250d8307c7d65 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e50f02c0adad36107372abfaff4891cef50ee8b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e45a2cd314d4de55690c916a67d720d66bc1bf1f63e220a1de593bb97a2368 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..402feed965e1c63142dccf96600963eb783ac0c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436dab097346374e032a6de6b1de9a2eed60eabaf59e838a0d8355de737b47c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62570ea6b22835ea23ff9251f6a9907b84e0ff1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc605473cf7e230a88e602a7905170234b41cdfffbe73bf6b757b108ee27cb6f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fb44f17472905ffa13aef66f81a28c7f924ae91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d19cc1e18e0578903dd1b69402537193bdfc571b394c343d342618067d21948e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c2e0c143754ce1fd25a77bd88abdbc91ff2fd17 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bdeeb2e6e88fcbc2cc3eed1b34fbaafba75be57aeb529a52619a5315065b1b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3b031d1a57c9651fb8e86a2d1b72a38a7f67226 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b83e1e6c2dc1d6cffcde986bbe417507b44a63c7ab7beef6627f062956c3c41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73febfbca17a3ab36f365be99188b4063dcc04d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da29fb23f5d8982dd2adbdd16793c7aefdacc9aa2c95554cadca6197803f8cb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3226d3e9546e97df2e3d372997a859e9831958ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78af279bb22df6a3a3b825b10d3d9079b91f81cf552bf09660443a730116e74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..599b6f851a6400b4bcb2533b2294f64e4e8511ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bb2d7c532ac761333bd85cec20e7553984b521a278161e785076546814f0934 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da40caa91fb2675bff811c5ed8519e57812e003d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb49ab4c4862714ed0638db2290bde0b4fe2f52f85cce2b9cc7f41f4f94c33c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..162cd75ff6893a30ec4cbcccbec97667b9dbab87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4762beb08bf3a7dd7819e76c4a064ef0e52d5f976d359ed2efae1b0a1da406 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..131afbaa1676e00cc11b1160b9cf3079848583a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f51121c354803e5735276f474ff3c2b716c1fdaa0d862d7e6a741e88e6729e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..926c2866b75fc6ae8f80866477a14a74a68ef592 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ba6d0c006ffb551310cedf55425f945624accb974f8d59d66611a341e0b344d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7132a2460fea88ca56abdd03821790ea69e332a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6abb816043bb45bfa01d07f2f3633cd7f828e3cafc76d2174aeca1d3ed9ea23b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ee4371ec3e8c1a3254a088a751a897734fce65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98e2e38092a4a08ed5bf831e8b91742c9860ea6c8ee600c0fec06992b65ea111 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b21640ec4429f343db5098c2af098fd5c6c71c58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0b955242e8fa21a6d2117d10cf6092ab7ddedf0c1a35c7506562e8e4bc18e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c04b91d8bfdb099ae6440b18ba157e88144eaaab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc546795dacc37e922b3840b2bbcd4b270fea9ef8596a04e3c089bbaefffb500 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34229d4ec4528d5ebcc2ae0f907c0b14595ec0c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69c35505175db2bc690f3a328e06a8c70aeb5d8637ac0246955b4f6e1c6693d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5352cb460c1c08b8e4753da7f0252c069b98a4bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ce2398535c69c2ba6dba20239f6f5bb000e4520a114a7e48983e963d543e4b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a66b9e8ebbfebe7744488a48e0277116b6ef7df7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e478384d55463e1426ed43f93aff06e9ad80e97770ff0d55036d49f0a24e34 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..661face8f1609a497c9276b377db16c5e1939003 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd29b784465b3462c1645097ef98000114dbfba29a620fb01496f59655fb9538 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe3f96631791e6cb8c5959ba3e6f55f414b0a5ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e4fae9fbe106f98f5fd15fd85da4494ccba6495f3c6c4a26cb26ce13d9cf0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5ee9a924b8e8a5b98f2ac85d038bce403c451c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852f10e3f1565deb38c9718157c5ef7fe71662d647953cff470c1063320967e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56af8e2c379540ef44916b80b030666cb9764fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3a3b60a31e605293e66352cb9260a00dc4c79e84dc9d6e2368e837a13c1a62b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb9a8b0517b42e5107c35535d861c340b9f4e7ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ab38eb38b634fa3c3f98be310b8e65a7084a0c3c2a11c3e5a86eed53c52e8c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b832e920f010f781c0c7cb1fd5982686bf7186b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eead5aea2110380b8eec8be200180d90a3665998e7a9d44daaecd60665a069e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..683cde8413566b7aa4a2f83a162c48af6dd786d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d59f9af0199e31d543d282a22c5f2684ca9d39d245e9c7e6868632e612d6f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e08ced3798332417f51f35fcc8910cc4a36e34ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b94874c3afd6b38a9934975d3a97c0bccbc26c12cd0b7a712197aa06e366cc3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c50889abbe968d4dd0f03062c2f5293db45c029 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d065ecd368f82bb3f3118d3d6e04a15bbd34e31356334f9630da978c4c0f69 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aaeaeb466f78e25c8e674e8ed1e7aea27f12813 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74bc2db5a16fe5c7d8ed0c42bad288474f040c8ef5019a87651e5d5a3c320cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdc4366c4a0654fbf26f9fdaa4d90fc081dfc6b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbc53a7c9e6d420bbcd7a27e28d7aee4bf0b5455847a77952b6372cfa4af5cd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b52218ccb7e981e39033fdc0989487033f800df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02897b198bd5cc0e335e11f80f020950a472c30f49805d15cc137252932544e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2444e9bb0609927ad0254c7899a754a95316cdf2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6793b5b1876a36c42b2a441226795fa55b82c0612e57cf611c700f880bdd80f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7b01efeeff4a0b2bfd4f504eed10821c29d33c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71beabd3515eaf7d214d0da722bee4a877c4de6d45f66170c94f0962fdb67150 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53fc0ffacade01ddd110bf2d7f45c946e8493f9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1982dffe628c603b9d90a2a4d5797c9ea65cd3dc24393ae424ecfc35fe8025f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36c3acef615783c46b73e9d985417165e25264c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e137b4088181ff1decf4faf8ff0a18d234a48993ec6bc6e5bc7d4f57da81a8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..012d586fa54a74bbf49ce07e8fe841941ca5697e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e4a914827a55bbb9357b8263936cecde7dbc6c9a82855e0ebca3a05fe144c01 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..36da8adc27b99a2cc610f24e8325b944fd73011e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4191213e8ac7bd3667f33be658045db4fe8b0725539501dfdc8a7540d8a7c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42864491582b1bf6f15ffba2f4236f5dfbc029f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc5a0e0f8ecd28364c58b2a9a6888ca0b1f8e8c9eb16e340e5ed1b4ac7f2cfb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb769dfc01cfa01cf151c0522747d32df3353b0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86855f41ee272c2f51db6b8e3253d71da53e817a16614d9ec8b24f130502e7e6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..704c87a41804bc1e019b9690726cf770c5399792 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d96e0b2d38f7528e8dfe77c7947ec5897347e25c1cfac8b6a5b4639236bf882 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c4a9cbab1b5ad5e415eae231fba0b6b3f8c180 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0f457e85f39143986609a5769839d2e6afe8adcd2ddefc51ff03bd0879a0c80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17609392a3eab814dd0ca55659a1ddba5f41568d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f62f2e18bdc5d91351033c60a359677f7813a792a51fe3528030e5a425be2451 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b71b199b73a3e5e348e0309718744f0f2157095 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f58542a0d55df058ba4d3bccdc475f80af872fd791dd1ec0b10257713d6fa3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71af6ba272e9a9063b39c872cdd3b678bae96ff2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad825375ee6752eae6a591c11dc86517eca447eda18247282ef3c453e6d350f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f2a49a66f4f29789d7803e392c8b60b2256f12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:123454bb753ae9b94eecb20e3793a31b303204f39e19ef08d9b618197498b6b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..520be582953f2e1580932e8f64961e0e5f1c558e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2781e12d58781ccd797b4092582f02999dc4998fbb951ada112f6e1475a80a68 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca0383abd5b90ebfbc7ba90390e3a33f02c30935 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b3ea2158b9de9b53b5748459fb1ff068b88ba2debc93728ad49dd0ffaa90a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ec87ab504295f2df8632160885ad6d0008d3aa4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6166c7d68f884984e1080ddfe0929a814b6d9dacf2d6584918bddba62822ecfa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9a31f018f5625e9f932493be766b0f051bc89ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccf3953b8a9946601146a12b60bd6d389ed51fcd6eb2fe396aa49f5f588c119 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..415d35a46ac40f3e8605649bc1e16954d704110b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ba37ac3473359a874c180f980cb9dff23bf3f3eb739520205caffd548a30e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9769bf9e0ff5cb7cbad5c48c9c1ad2eb1069ba8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d3e916f53109b4c91e0e8575b28867f0a86c2f8d005f18d056033cc16681688 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa93ebd672b2a8970c3b0c62133e500573b40e62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40a483bd2e179d87b7ca68254cf4f98285cac4dc95b64089bc8d4b4f997423af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15b38db8f50dcdbde65bc71cc4d42c02250142a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce47d86ccbde0cb6bb7f5ca10e2fd586fa5ea79e2e79d84e16acc618ed4c66d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ee4ecc7d2883b290d30c7d765193f67e608fee5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b44f79025a9e899a0eaf698a9f999607cac7b302f52fa5f4bcd610669cd688 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceea7fdaba1371763f8f6005c5310b27d9d37f9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386d4c2723d3ac552f395335b102baaaafe51b21d9477de24ce9bacf95ba5c00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a143328c02d049375d8ff730375d9f7f95c08a6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8b066ca71b95e3da85ad317d2f170abd14249a11ef551465bd36f1cc829740e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db31b2723d58ef0413c7a32192445334d209bf85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aabc7c8f3949afb120da2d15be9f1b01bb475eefb6c89f05dca4ebce83e2aa11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e69ee84b765c1440d0c346928fa5d4546b4db3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb3b2e9e85ec5929a5a0d6f4107252db3c944461ef5bff6ee201a4f390d74b35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cc556f42b89dc06e6b4c677f690924d9075017e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9c8ec8176557bfb87b8c4a52973198a92345d7dcb1a200b0402e197a30b1d1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..646fe789732b01bb8ef0f939c64ceddaa4a420c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5af534b94ec6320dd19388b4fe1e98c2d55c391b0c57827dd58cb3185a7fabda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e3a7ef91ecadedc381a180baf069d41ccc5cdba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa8f0a116f3adbdb59c0f8c97d453be65b5d2354a8c37286ed2e63fdc4600e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5700cb6f38b0c9613ca2751420b9bbcfa8f96ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5bf98c9a85643b7c22f14455da1e45c91c411b90d99c55f6c6e1535fbe9fb95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd29c59e43b8eff82678d2243689eadb4f0268a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e158e6e1556402f26684a08c09388dcdca32848fc2b5dea2e1a785c397e370a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dd0f257287b4d37330de5f1d0d8e77bca96a826 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f925d6ea6b383dc5ddf8eb66155ffb964473b38e30a20266144ea7bde63dc4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed7c3d44d771acce59c1185fff6d6052768d1ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf540b6d598448d0259debfb53e87a0ecca72280937add83fba8676a3da64f83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..350e001c84b0a1df94a039171ddafe3f2316736a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbb2d8a08df11515f91a712af4f2e8a8fd8daf3d626597c747d7d876f9b8ed5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fefe1407c11cb4541c2d09cd59ee61acefa480b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ff1e46817187ac523916ec3baf5fd4c3e53dab60390314ba1f860985d4f3c61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0f9613c111b4928ed2bbadcbdeb043d9d705fac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87f19ec72140a848d4d8b76d2d893988f69a18e46beb13c615dc192aebfbe357 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6849584475842f72d2d9b8244dd42f9ff585e62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a783050157fa17fdaae2aabec07624f975d23def2bbdc5197a283dd3cb922ecf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5065178ad809b4b5f78c3c9b475a555eac875fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2501cc3c85dd21b807eee26f6e03f69076716d007e61ebf7285f1aa686075c8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67cd6512d7ac3d43ea9078c81f9d4bbf4dbfa279 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f705fbbc9c019d82fb8c34d3ad271a811082ac264deafe4bcf0e0d52014f108c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94a82981451e03143e5050353f957074b039c0db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fbcf77fdb27304503488358219b29ecac791adfeb823341f4fee032a4a8568 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25bd9da4cf35944820eb86039fc7faae25960b0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e64241fe6b45148fc56a905e7bb97f3c0c73953fcc50bcc1ac1ce87a937d60 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7729737f460a5bd29e17c167853548a7f29e83d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e65a4515b1a2e363740dc1600297ec18a4828c63f2b6dd5ea848226c002c5a76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a088e80403bd0748017bd01f34712e6771b9d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32bf4e6c8fc3811dea5f79ad2be782ad9803a61295caa76d10606da4948881c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03d9aaad02bfb99f5fab3dbe913a2dbe45fb2b06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:160e8967be85f39880401e4f606f613e29fcd2c51160dbd98f7b740380a3b8f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..932488453f07745951c1d8a557dd64253c0770e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4943c86ea4b0ee633a4ccf5903c16d93b37d58a9aafe57f5669d682539d2ae42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d46c98ea9663257b720228c62e84935d24fa1788 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3bdfc816a33b711edcd9223b1a8ddefd6b0594f1fe8342e90679215ef052b4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..966f29a355f5a05d1eb3c376ae0f35797aab39b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f272c236af12a69ba709f923b4070305e76838de956f6478d4439988548bbb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6af96c59466a2721f38d22a980acef3b57944583 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ae549ad392a355a535a9f2d852b3ec133d75be3db959c505677f258c9cfe116 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18b8281a73d54203c07e3005c193917a7adae973 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fae9643454e9a14a98efa1ef2bdac7ac6a7a67d9b5bdfddc6bab9641ad54a96 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd09207231e7a3ccc3602b7d2129f49d75d35a03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b61730d2115f4409f6d445ed0838e69d0690fd7e426ae91c0a40a0abd65283 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e9960a3a11716529fa658f6a0024a38d325b25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783a48e3bd2c101320b4e94760b5a343d2035e5cbb8d112279ff164204b73a74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e29bed6201981ab47ff03c731240ecd2563cb5ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c94f9ed5ae3ac63625501d83dcaefafd6d8f1938d51c2793506331b9178a0990 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..742693edaafdfa23871fed350552c7a7b9bd5ae3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7f640ed74f3964c0f02e7c3c83e9f11c2d415c5dc2dabe9185865fc31fc69a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..600b3a60619c526e100342c032d8abc599209adf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6894e1d2efd8e1f3f89482e8930568ccd8cf6dab50fb7db6d085fac00f0da309 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..874ed6315d41101bb9939584286148e237fc31fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f64f17e46fba88932e3127b1ebfcfd587acc53a074e435730112de26cad833 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccfd73db31114b5095af1deb0fa18eeca723a3ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4265fcc25c74ec73f7a3fb373a50a62c47e9f76ced6b42268d7e99e49e2abaa5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb16dd602b201161f069333f4b24bca9907b8ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b32cfafe5df875cd48521305aa1ea1191fc6fd06e4d8decdfc04672f780be08a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc68d89e82b785a1b34c9a3a6efa5778b723256 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c22ca72d58474b178c3542e764f80f5f72820956facaa836d0cef7e75770bae4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e423f70f5a2977dd3c0190207b5ac93e0dadc06e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8719891adb88ae93ad8dd6125d5b4886d3fc1eb53c53cd1bc3d9f0e57a40f065 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..587dfe8132a7a48c4e8a9ffdfd3264b168cfbdfa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5063a26140ca04b96306c7f10dbe54586ff1671a5347635cb81430cab2be47dd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85e2923d5ce0e143b3eee800a90b125ec81c181d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:affc8d453578518c3b18ffaa9eabb3c04e6a2a95a4c3a1da6a73e5104165dd72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dccb752181b036f6a98e5e002b97cda9fddff821 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f2d999e1cbf3138c96036bfcde7cf26caa5528f76f6c7a7bd3f3ef8dec6ada5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0462d9e4a9966c45218a3d489d17eb08ff6c454b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da0e059c03b1e30eef817e7a4118fde1fd865a3465789c819331e9c46c5dee3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76afa12c8ff8340e419966291826cd108781272d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d9e5f24728119ef3c044050ecb086c41d53a210eee52f7f2318d21b5a5fefa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8acca1c31d2390382680bcbd2f6476d844510c13 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0203a8f821d99a5d236d906619a6db631b5ec94c7fe8004e08bfa3a09e3c158 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f5e54071f5bf150495a880a9cdfa3e4d966a4de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:680f9e25ec0eca0b1124d161bcd65f9655fcbc696f85b5b9acdccb013c9807ad +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a405c294b21cd6921dfb779ab3a6215db1ad5225 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a9245fad32a1f3370f56ec8504cf6920d9c977175ab1b57dfd7a48827b8b21 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bf6a4fd475ef291f4d1d72c39c8fd181c73fcf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e1eb272119ea2bac719747218be71d602b2d0825481069b1211ff600a90333 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00494d0d886f5a108e86c483919cfc8e05f6118c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3afec3a5368adb903a9ceddf727bda3d00b4e668db29e2d609f844151bf90f84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d338162f7b36a9d18eaf28377d4234ff0f6bfab5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb48eb1f1630c0262f26b26bb8b39ad62cfe979b98009c920ff1b94cdcc6f3f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdf603bc9e83ca7fe15f7c875df3bfe5545cadaa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c8c1834451e708e09e078983ee921a58014d15321d8ecc332210647a86b9e4c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc4337f9582c90949e40220795f04dc6fdc5434f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fbe0d6ef9b1f7d76a97672484c65aa442b93f360be1a842916a576e55f6137 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc868c0d721fc9c0d2391c1e999385a9dca350e8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a37486b4354df2487440832eb248e9d61d063a8fbebe600b4788260b2d0cf93 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..020550a3e4fc4f46a12c2067cf9ac0900106fd2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04c372e8e6e3aa938c3c681cb6a191941dcac86bf96a6648d544f76741e7e907 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..940ee494a65060678965afff21d75c0b6e3bc117 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767842c930d8c8c614f34150a28913db69061e8797e282e79253cbbbfa43708b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c056d883d7023fe96b3e8b6ef6c7b05b36bc6a64 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ec5ec99d5e592dea977901e69f333cc9347dccf6bccb4ef4c53236bb84ee9c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ee6a05a0a52e9c56683a254a01e80365e1cb4bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6425367501f7473b8ba863abebbe63099e12259cf7b3d4084901395fcd3c55f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..753c51055301043ae86c599254801a3ccbe49ecc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e865eba39bc7da5a5fbe5c027eedf61b44940f83bfa48bc18fb0b23953df92af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eee7c65faf8cec526361d4323abf53cbaf20e63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a87f21834bf4a3c3113418e6d2f2f608b5ef3fbf7cbc6f56e95801e98e416560 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4a8135a15697bcb4f7243586fe6635c9ed0aeb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7d117b8d5fc19855c53febb60fec7e1adb9c6a5c5f078d6d21b474e5411e2d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e415d079e388add071c2775f1c3d9cf43278267 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab286a263ce9144a30deb8377785789e8ef6aec3802c2b6442f5964ecfd657b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9b0cc0ca53f26a8336da4572fffd2c9a37b1882 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d225c6abcfb679d0e988a196c3457fb6523a644e7af26d0e73b6e9faf538397 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22dbb3cabf1b9ed88f195834cd2f6b075e5be3a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc250923a2c967b6f3aab53504d6bcd0e73fcb37eff40adc7a8e8b011fa7419 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce8492db90f7e51404cb05b5864535f2cbba0e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b6723d8b26eac69555f434d64a9610e6006d06ea0619db6842b44649ec30601 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0aaaf07aaa128532b1c5c4ba766244b57b5e6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f3859795f933e20779f189cb6bb23e1cbf5d82fdd6cf386cb72389a3a1193f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..82ebd282f614869907ec515126f880924d7dbb3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8a28a009bcd8bdf8b8ff83624d3591adc979ef3b5604b0a1f0e72bc31b1a711 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c07514234806c11a99e7474360247c8095cb2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:465b7343ed2edea5ba18b42c575a65e4d89b1a727879ccbde43cb2150937de09 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28cd57474ff9e509237b30c5873ae79d0579bfab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e10cd0af4799c0adb9c3e48aad98179094f1e80bc22d61cf7843d3994fa14ba9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9485ab627b802545c515f769104ee8a04c63d0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ebf831bdc6e5ce06541ed1f59ee88e58c50ea583590bdb29eb2cb2f6c20032 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1e682625b0a9baf0b83dd644f2631047dc97483 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6276eb377b9272c73768ec9399627c2e0c4c61ceb946a6f2a2d89ccd6d158b4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70069953a120e62c27e485760d257786809d3715 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35383511678a7d26337edb15c98ef15653ba5b1143c263a616576ad9ad1f241b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad33597cb48d999402aa0192e639dc956c9122b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16e38293cbdad674a6eb2bb9b39d7504c5ceb9179776f5bb7f2407cf8a86bd3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01e5b6195f3186c6c0ff88b4c820d990ec9d9e41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3544c0d669c37a34b9f397a48f6257518ae59331593449c60e2ed219227acc5b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1803ff5a162a4bb099e126593840c380df6399c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5712366aa21afd857058d0231dda21619df2a7e3aabbbbe2bf7b6dee34568aaf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40fa2ef51d37b325aad69e10a0dc2cdfcd3517c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca73abc614b013e31f99d3e151dfbb4feb17f2de92dd8d13f5fb33a5941c220 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65c4072e02e69063bba4143fa5324fc2570c758e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:900211bbb0262726856370c776940aba9e8eb7864ad96a3955f628c10e534b52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ec8fb768819189000cf0ee81d27de5fc4c24b21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:487c0dfdc38540c29a74eaabf626f3d578445616f4b8bf84e11e6348a2610d7b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed31df70a7ad6997acc67181f8b0f67f4e63a6a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b31fa543907ea4160029768b190a55be2ede1341fd030724b58aa2b95f8e41bb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..301b0e8ced260490525887a185b34523e824c711 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28712243fcb4c5163e5ca8e3a74ac705331a54641eb84f833440918c7c306545 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df7a0e843cd25ab4f8f690ada49e7bedb3480c94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b88f8e4b120093698cd22363711283d2e75648e48efeb24016385c115a568c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61010a3a1ea21053ff8cc461d7c53cf301c647a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26617644e376757d3335325a6b15b5cf64e601ffe8e7c6325a310bee5bdd6358 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c576f903f5bc7fa8a0b9921284d770baba93322 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bdb7d4c9fcd801c84ddf7b3476aee914c5f523e28ac220d266ea8646118f50c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da485b6b4e7d53cad9be57715073b6befaa151a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89e3b87c9a84286a07b1de85b1c5b77a70f32e6b3dee8e0281d09abc1256e37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a8a6f4c2dc7cd4e2307ece0b8274d4d30d61d5d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:627efd2553c05fde3e93901ccfa6fd1459ac49a2c5b1af084373d247cc518d4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da7986243ee6c1f56256457405fd0d6b8d77c3d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c79871f59068fd79304ea46ed9c8247a48e23cd7c5f51d7df549cf0c2d328b61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06c92583751a5cff0bbdf56d4bc7d51d5e92252d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7e1833c87d7e08aaf5907f046585f0e3308a386af6657a2bf5f1457b27ae5cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..138d32270eb19b88ce2829e7a898b48e9a5373f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41ac3e9715fbbef5c15ec0a2303a4c3ff31ce8e2b8335e4f441851bab4be2696 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3861f5ac8f7f69e088fb28692dbf0a1b66a73a06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af0dc31d583944737789e0f516cd643ce25577988ceec065d36368b4e4969da0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ce34d25a941ba46c5a02ce121fe4d3c727eb9f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60eb8ba2865a85fe60150c649af1f4643cbbbfcd833a92f4e72a6caedc859541 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a55756db21b8ba571b491fbdc8313b23646d1bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ab3ac19f6c2d5fb9e411aaf6db6676c57e0a8e5ec1e74a904c7dc4c05af788 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b3d1e2bc9021c84b56c2eff7c6feba8918b3e01 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14bb91e3ee71b0d664b6fa400e8b271a1d33503cbe4bbd81a041bdab798dfea0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e07619980978f51fd766d8d64182ad7b95bb137 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bfd42be162f903a312a1a139c8bdfb267cc923f2804e4a119e813febee94ee2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..546399ab936951dfa64013f16e8719a2407d088d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61934c233714da3d4d0dcad82f86a2d681eb80c7c2ce3fae76035110752ad40f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf5a380f2005f62da81c0d35927606dc259b48e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b591f044706eeff8e4510030d3b731c8e23c4da7f3a94c52e29313872f525a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69f4aafea7329499cd1d7bf3fccbf11190cfab40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b179d50a0ea25447d4231ffd2165e65021be8ff433838ffe37dcb1f2dcd70eec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..daa2ef7d084f33ec870ce6ddc1fe82496b6cf19c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa86b2fe986b5fac1c4e37cd6a6f4c3f6f40eb0600f4171817986670e82d1a0e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c839c6551c00a82b5e9f3277a9c82695df6acfb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac07d50ae4eeb788b4aa9d9d2e996121b9455ee6d4a32f229183861f6585c855 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b20acdc3051df357e9199443872b182c100d18c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03fdf4f95d8a40b946efb3b58c288632926fb395b8902ef2e99f310c15f15f04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..529b40a56dd073feb32855b8a3809965f7c8deac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60b9cce4b58cf5c731fe37f31c3a8e3588ca1376351974af063af2eb1320f03 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..337e08b9c82c1eabeb397f362789a625ba6ffa77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a795a0ab911074ad97afdf95eb13132f22e88603afeda0c9cc44141b6fadc49d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..600e7216af80e441d56c0923bc4fab007f32f2fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58913e9b1e52f37205d1a3ff428ccf3c7e02cd531a340535baa2be8ac529288d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9941f2b435c3b493c4936942a5a4507bfd5133a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52ca011a354a04d70ecb8df9a63cdc9865549c7439b5c8a3f241a2030c481ad3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4cca2f65e84735adee7779c531d106b1491c02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c5f39fc371153978fa22e85442829a76c6388bb33f5121607c82299bfe0f32 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed716846ec181f2b5c17ecbeb19b4645100168b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03555ae406381c4dda4d7747c7a28ce1b0556cad87c932d80fcac50de578ffa1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a9b845428212c6373155869debfd817eb524fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3341467dd10bd203e44816dbb20e027c1992ca78018c177781710a27a6b1a87e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c461dcf11146682e3f0c60fa8e35c2e20cf8bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b1ecbb91725e18f40aaca762d31e7cba88a6a27d59600994e5f8b46f9677a5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2645fa37ef544cc87b8f7a897eb29ba4e91664f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7a417346f133d09bb497ec294d48f040885fa37004c5f9fa6acd38cf6548bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e169f2bdafcfc477a7be88e4e0d3d44fb9a2b3e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2d5cd2417525e95f5aa677ecedb31b5b6e6f747c2d1499c1bcf7187c60fd44 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1eda78ca99482328a392bb108a7281a44a5efe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d503fa7975434bf3ec1bf144786ba5d98925f5c904376ed75da3a095f0aaa7a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4cb510ae8135a3b839a6b53eab2ee22ed59a2f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402223daad1f9384744f4446ebd2bfa159c1864f6d9f5612acb2a45927187695 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91802734e2a392de6c494c3a33ff8ea47848a8c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d71773963c47fa6aca768c8de15d2948d6285387bde1b5530c09da526bd53d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6823b85b019e27286ee6587fe1fcc583b7440eb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48b7bd4b48bacb43f254783a94ea9a19d5e48918aed773c7e99aefd2bc64fd9b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89a95d2dc9669ce3eaaa89e2227455be1740fb81 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b812edcb154d3a32b3fafb8c72cfd4d321966e1b225fc62868a81c34c3e370 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0f3929cd5f79ae229d535395fb97bec43b7decd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c40aae94ef3c67ee8c3bc6bbb3fb1f91b44f86578a2413f890b9bbdaef1c03a6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b874f4006e4873dd8ef61e247744fa2837bc14d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:111d33770c381b8011c42b23eab8a59f00d1e67dd96bb6684d512e8f8daeb9aa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b4c557509225de1c714797a6537b4a4147b14e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d30ebbe62850d7a1f0b31cc9fa737e65e0ed16ac00ccda92925f9d419467c832 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9f30aba8807ecb37e8998f7aebed34f4ac6db3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64d62815315affb3847d7e0b3cf57958b277679fd6edf770d18b75d59214c8b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..739d09a07c88d3f2cfa3f432593ddd1c2e8de254 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e37b99666e4094999a69ff3e94326982bcf4e9d8d63270c5c0899d20396f40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..630c7206ac28b3423ac6df30a4278d44cb8ceee6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9939b0ee0ce0e2fd8408e43885e0f946f855a7b2bdcf28e684b54da1105b8804 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08bcb7d12f30b69d2ba3b46af72f68efeed7c375 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb304a544cfe481f137a9c456758d614c54c440bc36d53694851f6460ecb269 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a20eadab8c9f91dc33005f2a598ec7fb4cb6730b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:672a8be8711342cd859ad8f3a6cea5d5a2dd2f1efd4c274793534ed9fb3ef1c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6dcd1f28ef37a34cbddf53710d48a53923575f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2839cc0f1f4a2151469ac98cd0f09ba3035a3663f853ff0cd3e59cf97537412b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..466effd20c264370ab731bf659928f3e7d438430 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ad0c7fdb1b99e85c3ff6457487e4c60822a626f26e3b208bbb6277c44a7cb2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..486ef094c9c5426dd145d8372b7d3e9379d7c6da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73a15c440e1e5aa538a886bde9ba9b1e19568ae4dabfd66e90eb7b56a46aa96c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a717af06286ff74b438dcd7d8190229c45dc6795 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:090acd3a68a69f1dcc06ec3a05d2997af55bbcde793a0b410198575bd6d1c6a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7785a973ce6e0a0ec46d81486b7e3e1df5d49e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15b21997182b5c79282fe25c9e3330e1ee3161dacc6315416cdc14646683028 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73857b7eb4b43fd610d0e8bb44629828e4262047 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e00355644dc61af57a82c62e2cb793408dbaab2810660be60404cd9b62cbddf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a686efe9afff54f09b5eb7cef41e6f3e125af7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99950cb739124ba06f4b1dcd3bd494412c8d856c758315b46e562d18969e138 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..612f66690e5ab61367216df65728e219f5f4d243 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0dc3fdf233f42ac20883cc911731b5f4db6d7be6b29808a2940133baf56f73a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa058d9b6882e04115676c88eb279d503c5450e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d430a56aab5744d209c3def7fb40820233d9638cee6902b62d9dec81bf21f879 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63df4de5141d54b6da76ca10057219e3e34a49a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f465910f7b9cce6a94bcd7d9988d083a9a6637ccdeef3298c74db066f97bd3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c6466ce23de55234e017eafe847616c9a30997b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8d4dbeb86f4b553cb54258304c09fc9209210e5df89608dc9dc4c192beabbc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a284537574a102483fc04f05550c7e108b179ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d94442ca6d59f9daed2124ecd33fb4dd9d1b32194ae31a5bf79beb197972f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6079392b5b34debc2b0440b8ef7e39fbb91d2968 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a868d50520a6092d58a0d345d897ada77a6153822bbbb1062027a9e7ed0ecea2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d38a55539f981ef8d85602efae8d73f5905d3ce8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:438791216f7073094ef52f3f4cadaa5c15c1f597bb47a31ef1d50517ee31fb5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e6f6d3dc883b9d68f2896861ab29be2afb1a43b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e19418f02b6032f3685a19c4a53b71ad325310cc9ba35cbacba96b6d7055fb0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c21b5cb6629e3e82a40f38f870045dc3292135ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4adf7ddec07ac4804d4b34d065f406051c90351a753afc1ed52e495ee2af8e1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..387a814173a45c8b911416970085ed42669de9ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43be06b644f2772baaeb368321a44d889d37cd8496220acc9dd05364e6640220 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23d585453740dc401f07f519db1bc83aaa339173 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af41d984612ed4d1c62331d1223775a868295ee72e7187289a34b755595f2c9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02fd49aabc1ea043d566f7495ef8260c1c1973be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55ad1d06fcad916276ea4e9bcdc4193472d2219aa733e48446c4191c141aea3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c6998628b1a954bd9e6434f4bef4d95748235b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268787c0b28a5dd588ed31c2baf0c1c5e9bba21eccfe308dcc5cc19aed2ac821 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ada4438838cc478a698475e7920646ec7427b30 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee8d4cb161f43645ca4be978ce1812e5b7628ca79d27776547038d81ba7c115 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca27b0db752211a0545dd3a30699995fda0bc54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9c71e2bed5e28440df6d9cc7815a227ba2ee9e1457aced9b31d4f7b4525fd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9141d0543a04bbb9b8fd988eb14e3c51f20a2d3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f151e770e4e5e040cc3da45dba972837a4939cadc0895d1d7bd38c3ac9aba2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..096bcae1c6394c939b739eb1fe8f860620360893 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67985b21e203d4eaa6459c99076ef84bb37b86ebbaea27c5841658913331e80d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3641312eb9bfed5b11c7e775f9fccffdb7aa319b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f416bf61d1a3ced761e27900d71b23e510421e6b839c165c5336e31fc6b893eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd10c8bbd1c38015aab40ddb9d1a5116b1b0ad79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea57ff336406b4197582ba33390e55c1b5bd7b84181acaa73daa932cc2e36ecc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed7a806bccd3e150e42e3391e22ae271dfb62e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:addd6d711631b7059ecf60e9d1acc9bb1c6c26a3f560e7657243105013aa8881 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d466c1d69dbaf9dce374751db663d89139b0cf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81b130a68b1e81e275c898998841298b0d1de38e8d2b46ab949ec69f18f19a27 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc45f29b855575c4b298e6b3308166d10b6db6f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b073b3c5bea07b93d7d63315e4014b32b67bb3c2d40bc4523f93bb16a4b98ed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41222c332b772fb7092deb942c3a21c2f7638a76 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca8f52afc6e2a58e4c652b65718efa19024b6ac7f0fc387d4c80df7332671ddc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f25af2acea179a45830bcf73876d8ca626818d11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8959b1211374cf272109ecae8842716feab9b595aeaba70007fa085b36c923b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87fa4c7d5b7061d16ff1a69f6fe5c7bbcbc3698a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a1a4e6fbfdee05dddc91fafaec94d96ad3b1f0013303cb59e915007c52dbf8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e042f80fa68e5501e0169e01afde0afa0cbf8875 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cd3f2235aae54c1051d88e9c75885f4829a9571a365e84d839859bc8c26838f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d8a51d7ede6f022208f06da74ca12292f2dd4bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7380abea867db0041dec27f17e3239be3c760c53057066b691fc61c2732e6eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..023f5a563aa1eb77dd3329a3f3d27f10c7255816 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d0436ef688b6ae2be1c2752c616def92a1893fe56c232c0f00e51f7aa05656 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e5d422e857e1388f367adf8fce1a8afc8b99630 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc5aa9589d9d32c7d4c2698a8932ceba82175e79d10891aaef8d7c64808bc2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30b6aca0b0c86d8d5d39759a81f83ea5c28e8d85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3226ffb96b8f0a74aac1e21dd9478433c6ad7a7f55e209ce767b04c935937fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9128cb5163170e51e953d2181dec3ce4ebf72fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0108e088b64ea9735a1a4c0700e663693c594a90855c0cec481fce08c819c649 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc2bf805b4695389ca8df9bf69b51ac5282f5b86 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3edbcf6d999317603c0d59cf00bcda3d467d0e82d7ef0488cb830abb2e086881 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acd9668983480c4d41820e2c6116903e4cd26040 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b5954cd0eefcbe0dcb4a848b332c5c4110b2d854e611ebf6b036bed1aa82e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03dab7331391193ab1029d0f946284832bc303de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c43a574982410450a07c4452263b1e505bafd37675acea83c211d8506b938db +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d854649066ab31311881e77ca9d228b843a5de0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6b64ac1465defc5460486939c5958a9450537542a2eae37fa9439f0a1f119c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..527055fd705067326f8a924c9b8b381841d205bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ee01ae258b0639c25b08b5ba7585feddea8968e7f6300e112948fb89d0b5bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c67d6659cbdf9003cfb0568760925dc9e068347 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78281616a9224832d354ef57cc06807d18aef06d675709accd6771ababd22047 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92624cfa0d3a47100465f019af767f3b02804f52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23a060fd10c811458709715ceebc64ec05bcafade1bea5d89c502124e1429ab7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fc8a905f15b9a94be12b4b04466f8667cf60abb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0041742b16776d69d62e7d14d6e48a69ed49e08be83d672f9dd407fd21f7a42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4284f0fc6978658889862354745aac762fe2ce8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ae86d07ecd2889237f141e77b71f60b5d218e244a41f57cd8fbdc4e88e13f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9c4e9afe82970425387d963aa9c60f019db13a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d22f13487812a0b113bfc5b8a66ea9e1df6604517946ae75865eeb949f78003 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..738e97378b6a231353d104c664d98d0f4bbe577e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1436e19820b9e5e155c300baefedfab7bcc8011f510b028d7f4d72aebe4abca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f441aeea06699e9849c2750e373068e387a403f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910187fb5b4b209cd2a7d5386e51755f64a6f9cfa2effb120a37233edfbeb0e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..22d164d936c8ca5cb0ec8e686841ee21bdfeef7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51c68e81f60e902e681ee2a2d7b8972968465473ed0a8bc85ec42c3c142826b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75755f5b8307217bf98f329ea9684b0b36b3944e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c48653508e77855ea0dc72174c147fc43c2488ca3867b3813edb4128e4704a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb5c81594a7d9d7f3d72f2352f85fc5db0407d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38afc3da2453701d2b172d91a9b02415f047e7b7161ce33c85324f9eaff99e52 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9a4f0ada8182dd757ecaa630262a51ec3e50cc7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7603b7a943f2cdf6ebfa135c601e424f30776db012d88eddfcfebc41497406 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..240512e27b20d8310c8a96e731e6cd4b96c6dc8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39de793e27ae18bf2ba168f4015b5261934eb43656c878b5077b3e306d74b9f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c0250273e4d5b040ca0b729928acec2724a9e7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71ce83035e26f9a31757a95a3026dfe0089b78519591a25a63f63c2b5d11e4ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..daf4e9600f60544c2bb3768416e81d5b9d0e19ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728a7a09c1e1ef9d293847134bedfae0ac6ac8b878206f6b4f358c004d7f7e7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2395beda563aadb94c6f7146fbfe539bc46d53a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e88e49ed05f5389a30c352f12a886a264d25167d2c20bc13217ea1b98a093ab7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1462a3b17dee08a427c02e2d6c59402b95dd9f25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:890c897a2a2e7e50130e3a8df035a26dd7fe4cd3df39ff2e9870ac0844ccf03c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b525c59b2a679f5706f8f01920a65c298a5f5e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d74346bc1ab39d6e7bb8b846db2f1215bf0757f6cfbbe2cbceac1ec772d143a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87d6e7120d1d75009a3c3312f71c2229d66c9fca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae8e97d7503f18348b3a0e66466f4987f9812bc90e3312fe11095c4e8f3c2231 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51169d04218b1283b3de1353eda5f87f10e7d001 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f92668c404ba61a007b237a8b6130ae2b97229c18bbff0d2489adcc2cc844a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15356cd24d67df15814ab0135d9aac7ebee2c10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b305cbf6ae77b840d3cd483361c9ea6921b4a045a3ef0abb70b18f614f56371 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed97d0e4723282c3e586d81eb130d539dd8eeed5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39176e5e2cacfc9f227729d4659489954655b1edf3ca568c6bf7f489212873f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a42d47dc3261115f491362cd1276c68d3ddfdaca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80be9ed6577978b528504316037614baebcefc3f0b7aa6cdb20290e0841f535c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8917f110c77f1ffce57a470ec55f76cc440762 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e6c51bf9a3526dc4f811513f8c1828a0639bd5c643d5f02f60d3ec14f1be5f1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d08b737c2cb68c4441c20f0d7ac13b2328c77e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f054a04455476f9c5a0a0c9a1daf36b8d485ead80d8461d7c0972457d4a74c5a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f31ee508e4de1dd8a74b38ce2f16d48a35d871b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f421b4549080ba255624415fc8b8ced14c0361ddc386e6c68e34aab1e60057f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f72c7053eb5553389d90901c0d9079fafa6b33 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23259caaa4cb3d56263ee13577b9f449e86f6322e66ca45406c362ca0733ffce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10ceefee50d8653076912a1c16578fc6bfe81d40 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e36e39ef4ae323af60902394855cc7adc43dc207da15ad27d51f83728199ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..49e24bd33ea3d358731fc54740a3a7fac9a70d3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6264be7619482f054c574b8b4e84122d020041d70c4294c19423a941d93f07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4774d58b34de91e38b74b8ca040fdaf7b08d2813 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6bb3633816318364b76ce0bb6610acb62c690557d12aec91b7e76ca3667ca05 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79f0d8e076eeab07a287dcbb10705a42a4f62546 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14a30318d7b9dc2d9239037354729738a441159a8b488e4fe681c306b073e106 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c047c78fc55f677ad2af350a35220c334c9e7052 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18f1f0c08c5f16c585049b6923fe79f4af3aaa7efe4e8221684a6c5d10ad42b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23ac460e75cd60fe5195254e92835db7850cfd5d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:612e2f5c0a76d786ab2c6398d13b6d1c428329ceb2cf702c02a8287af585fcc9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5940c426c1ecce0aa0f2a1caaa143c1943e7dc54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7fe31821cde5ec625323842a1d3776f4b64d03ec6785341db899950f300e727 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0912e5fefad87260c6f8baa6948c7056058da3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dc10d53d5730109286f079c1d96a5b2891ee0bdd4871d3df2371a37e7efdfc6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..399244a055f4daed7f9dd0d0e189023e1cd28a03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7524604ae9a61c3e8dfdfac12d1ce2a70830a73c5ca2e68f5ab261112813cffd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0bcf874cced6df203e4d82457da279164a976f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b40a0e477a5188136228bf8f20fd6d3e7238346343d28e04411f3229e0b99f9b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8415f07ef7cfc947b42c99c8f7e8b759ab090842 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1406bed21bfdc9a08a767f331aaa9ca9930c52a9769b9081fe6c77c7f2b00a35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b18fe3a10435e90ef756b350c94a58a577373c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c64f026eb03feb769363aa4ab675486d5265dac7a9abda018a6c2aea1246c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bba0f75251b6597fb04cf02ff7a4290b19904843 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c25068ad5591094c319001bc0565d0eaa585c9e12e906dcbd4c3c184bce7db68 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0fe853ef84b060f2970f6b3124977590ebdb27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f66e1fad1d3d2c13cc9c59c9f918af0643b8cca3b17642d8beceda29f064108 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc0a16e197e51a8d9647dbfc1c1792748269fe3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae71966f27137889c5e1b1d10f5bc0d26bf90c0574d9ae93d651f214304ececb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f85282764f3af378ea30b4f9e89672712c9cb6d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7563ccdf844531806bcd2fe43c8a5b563ba46be0232c80a1e51cf6bd9af87acc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a85d94a5b8251a170795577be0e6880f5aa919b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91059b10b97d99b863ef46d5f185da1cb53f40646c83d09ce4a5e84bd7e47216 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07bbb370f7b09606ada430ff30e5602dc887067 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23d017ee37ce8c3d449c617baa08e84b50c78189d670e5726b5244725ccd895d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3507b53358939baaa4216271f1fcd3f50b77b669 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95463ec772e94926027edef1062cd2f822eab4bd6a1dce51b9a2b6df234d6888 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd3766b6bc24e9fa06edd12c88d56df3d2e239b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0605515b4248d549135bfef71514cb93cc52104852761c891a44298dd6b419b9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..838ef986160cef9844034f12b54c34bb8b40e0ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4898592678eb03a4112f223b79a7e22db6c474f2c2ebd6755f72dc72ceaa0f70 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90313955ea6011f0d5b78e1646642236d837cc26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff3b2efb17e26f921f00c1ab996860cc835ee6cd695088356e8ce8867b71ce6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d491cc134a0db382d53bd5a54b07894d535e8a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fb5589934ae0536603ee772d34ad81c548d37aaa05acfa861802011f958b857 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..162dd570cb5a2689f5353c8fb6f09af0d0d370b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:969e16b746db1a9d1fbd4e4e3aa02b534422594e7a77c621f0c12bd886f5669d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..35439026729fcdee6e7b5fda2f51babe1d66db5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed4b95c64abbf05fe4d1d5d43451ef864ff2a638ce939004cc6c9faf043f4f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc9a8e382c95d6e4f57cc4417c81bcbda83bb6c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f8515ed7c5941a72a2d1eb146d1bcaa8d186e67f9557f40f8a2044f8ce58132 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27faa73c260461e26c72a486b5aaf880f2565358 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16cb07a22f74a6e8e096b776543a4a4d70121ea94891320f23d41270dea4cbac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d254ed29f006e6b462d7bee5e8af2c8a1ce286b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e87da9953ad5c6c70b2115830442cc8f5516146ffd0e1c57c075f979e96d033b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eca048f6fdaa568cb5f2ae28956abe5197de7461 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93e7e222ec83aef3e31befae149aab6d1255ff02de2fc065608f537af74c5f2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7299ad3c5ae3508ac73b281b4882bc7a1d83ab1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48bb111f9a190ac221c01f4c45277abadc353d5602eae7b5e569e933d6a0d3f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d30098832c81961d924f8ceec035b6c49c7313c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e113c5bd746541485ef0c1ffd471840ea2efaa4489d89184835b663e569ad6b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..866f0d50f890c6362bb702f22e229a63b8fccf0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a7d64d6a4993ab4d1f27e91e8caef549000ae45a5f7e16ecd062e72fee46066 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8698f8e2df70ed5b5116d3cd13301cd1a792debe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c58699a68ae2493217de8413edcb866fbc5b85be1f450ada9967c36bdfe5bf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e4b7346e09603cdb6c21ab47eaaed346f150cf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c6229714374369d2c5b2643af689a646e65170ac8f51ba96e03ed7e6749809 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48bd5584f658867777ecfdf665cfd9026fe540ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a6aa7c7b1c1d7175e96551ec24170cf7bd54c154ea8decd10b5033f07096df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98358783b0454f895815942afd2c59eb8feb6986 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c89331747f3d8ca6081cc673d5de920455e19dc820648907d76fc88d57850933 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84f5afedd4f0b55d3f8ebc704017769893cd2453 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aebf7a9e8793e48723baf694907c5920710e5474f10a9c92d029d601b27fb87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10591e6a0c443b160bbb6d4bc1a9846f08d44121 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626e9fb75351f760838faf1e961468e869736fc84dbc5901cc5ababca597a802 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..029b95b822b300fb1feff4cd2a4000d08d5fe31c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fe7efcb1eb0599da61b0d645d8aa9b8eb00be88fbb43727be720a97f6641bda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5270d35be9544c0c50e32ecd8112131042689424 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49f49d11911a9563fbc270daf70e926b91b746cb13abb0ed077ee5eca952247 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..985e673501f2df0f7433b462890592c0ace2297d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c67f790b3a0ea751f1cc164a1ba526a9de9bdf96d1b6b88d7c36bcee1c5396a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2622a914f8f789c55d706dacabc8cda61837c8f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2df42c8033238b7e4bb456ac75aa5ce8cccad86fe9baa10bd8d93a4842ecb29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97ed945aa60d026a6d7522efd077e242b758b2d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e30e90ed4f7ab1dc0b414b350e1711348918863665e0aa3da0eb0e2cada62088 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbf1f5b2854cd6bdd1104082953bc8555da830a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:664c82ce22f1dd62758effa4d0260c5963333d611e1d05c9df2e20a0dbc4156a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8ba064f37393e94c9957cd4639ea741267ae0cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59edb0551d55f41d59dbb7e001316b3af697a473dc2c240cf0cd92d33ade791 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eec9fca4d4f8bab89b60c23cda1a0ed23fed2b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efec3575875165f1f08395c17bb4efeb9053bd130b8898cad7896316d12fcd21 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3427812479e8dbcb1475049c95791252ff8676 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea0133a41ecd948355a3b02aca1cd925032412ade1f0e76fd28c02df6939030 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..241a7dd67dffe68d7056e83d5147a7adb78528a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abbd5330ee1a9e220da866bd6f86c5cdd081097f8a1b125c8537cc889335ab61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93f0924f325012cda58c862c29c6a47d22a631ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b1b1934c58da346c831cfa0bd002261e7dec4a274cdf97c0c42fd59a186c10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b85f3c57a25e94bc7d7173fcbd671b3e8d9b9eea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f667cfa366840fcc9ef345a525db33048d50b7c41901514ac25d6a09f16060 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f99d0767a12aa0e219f58df984b27ffb55d018a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8784c9e343828f0d829c5f3ea5b080a5fe5ce1767f17c85cd18ffe923458ebf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11d17705063c00672f2b9c5691b3d6c8e8f80bda --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f296f563ec7bc3f8373093cd2e7414f30fdbfb5270fa362354411cc939872bc9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..adfbf7fc25cdc2abb20c4375234e1258b17904cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a5f066cf3c56cec0bd91fb30ba32368489d022898d89f6b5cb950cc92046c9f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5f3c94e299e90587a3ee015a88c59cb4708249b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc3aabf6723f5ae561053834a78dee48ce0d57f82841e96274def6cc5d2e60f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6c742243fcd0dbfe858ca708901b83c71282fab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b405e403e51f4d9da97244bc3f47ebb1a06dc39b5b5cb9877e5280d1069937b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad0773bb62695278744e58babcfb19b42bd10e24 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd4b60b78ed89b7b248198d4760352cc7094566fb29efd6e8b35f91bff4c52c6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f49c353b18ba0c8ad0b99bfafb21d79957034f64 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dfae671e57deb2dae3b6c9a0664ea6e235d07c4b66319e281098b9a652fbba0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a57227473886a1acde6d34e08308b6c3d821fe9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6502ee26d953ed149aa0cb88fbf64cf2207d7462d94318b62df14182a64dab5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1cd13b19ace0db6f8c289ef6db75c1e5fe36785 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555e7826bf1df5c416e1b72a8233aa275203c6ed51d6be29e354348d4af10890 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e63af86a206316afb3cc319ee952d3afaaf9a22c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963f1d3defe73373f5760dc72c2cb48579a8e458e51581eba9387277d0e343ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25e02084bbc2e691a998a95bb18dee805b60ef6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6c475fa387f8599e1979c9679279077c329d2eb56280f573b254772ea1498a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5e8a785e6c4f5a4b2d2edbb3d991706b5bb65f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b0be62bcbc8302f9d229120a06bc55ed5e06d5ff409808e451ed32c36b6549 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66e248515e888dd761210bc860b684549fd118c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a56c57faaf6dcaf4b6c30572f9d3f1c2cac1e46789da833092912548ed460a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd78881cf67cf4d19542f4274a580504f83efc7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:318ebcdbeeaf57767d5039e0b7c8d1f6827e78d392e879bda2da2c4b9d5040a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..397d5a4bef772afbc8c3648a5e8a263ffc3d9c61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdafbd2e8fa43d28e5109445377dd36dbfbdefdf49e9e70b8c6c302fef7c70f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc65e89e466dfdf295e4875f06f755180e97e391 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2650b396210d1a548c7d440e1ecc432e3540c0fff111d3ad335129b0a7aea8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cb7cb1a661a8dca14df0459ffe0516fb5dd5ee3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4caac69ccd001a0bcd72d5c79e2911139a8b1dcfbeb5f261977ad29787c5560 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae036edcc4c7360b7d96eef9fa7d40aa7eb2a171 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0f57364f3a3353b45050b75214761309c4e0a214638879b5f6088481193bad7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd527b9221b45f113ecd3c2f66d7021a271d97f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545eb5d824c2c2cfb796da5e317608d0245ca2fdbca748ad07887df177c94487 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ee6d464d85a415ad663a870b0282905d287c3fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7113e6ca58a3977aca63886ad781ded3b8a05baa332719f7f0ea69b11a0b511e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6694b0c27ef95775bffc33eb7f8803e5337352c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ec6995c51bea988476b2a8a2478176788b12c79868b992bff58f1e8de3994b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a650e5320f8a97dbcafc484ad476ec46a1d7f9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06818c02e4e9d6f7350550fd22006150bbd775c0bf490fd8810ce07d902754fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd5cf67d66fa3ce130d7ef02a79f7b6ee093ac01 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f61e9c7dccb567b4cc7c1efc0818d427f762f0a3d0823c6342c17938cb2ca80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a390ed866a1bc6dfd5f6664c1c7b8021daabbd60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7feb46e9d9a10b022750c2208cb7eaf4cdbb7cb218357f46ab2ab5215e37882b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e40346c2bb592e0ceca11b89c9b3e2a2a29eaf1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6612a79e1737962e3da368d46959711f3916cf9b11fd72c5fb39a75c852ee49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..533cf4462d945a083b343061e854da551153c72c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f9825b5ad7792503c2e30bdd00c3c6635644c67a3f0e32756bcf0f8fc21e124 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c3c6e4e82b54d57893403ce300a80c1ee5d32c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954305a748b3b93e7cd7e422362021fda81a95c81f38d30384ad3aa6d33a907a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2a83dea916f86ae8288e3811197cecf30e18bbe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa07013cdd6618576692fbd980aa2dd2e19e42c527c6a13f51347771e511baf3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91cb5c44ff6574d8d1bb0a4d119d25a7aaee1333 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:585d9de259169730c48a992b2300673ed5f81d15d594dcd3942eb91635ec6925 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1494f553499c3d59f494590fdd3442967bcd2734 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c278eeb71e6113e1ec1f0791d4463f23172f83e7db389c97dfffb2b151b3a5e4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11f66e6deeb1a04613b9901ba9f5420f1dc89c89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9550ad808afe7e3e38a659b681193e66d80e174164d86a4c6b244943ff2af75c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9ef897b5bc1cbb220a7bbf6b68704ff0b9d940a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c762bb760db7f62597078c2dd9222cbd64286d4ee5849e51d0e0bf5d01588afb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c6385ff1def6a314ec7d809923b59da1e1ff88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f0e545c3affab0b3d03f5f68dc683cf93b692705080567b22421bb803eadee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..098f709d8819e99378ba1dbbd7a3c7941768bd39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39f59ceac71ee4dd7b74f00ad79ca3f3d7be38cae255fc02db65486fe554b6d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e5ac85caf4a941a554dfa9ee522f05557ef18d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:956f4ddb6b4f64d4ecd395bdd62e83273711a8a66e4534271031f8cbc8d94272 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1840a36d2f28f89f605537e465cab538b22fd52e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b47936371000b8049d0fabdff9fd8ee19666c8f4fe89a4de5a73410f2f0c58b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73db20858938a5618cfc81df4f50b496f772b13a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a353ed960539a417d372d014e7bdfa8b1f48243f70c68e370b97aafc9afbc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1000dcf76e13b609173da6716708ec2bd15bdfa2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:563cca566d470b4c88ab7f4458e98f6a00c975059c1b3f382fade0aadb3f6723 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1a9b7b8e3aa7c6383be523dcc08297f598a849d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68a5d251945aa46d1739fd28b97928c6936a1b614a375c79fe0b1af3094e93b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7c91179d8a5bdb55bbaf59acd6bf021c95f989a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1afc5f6a8ef7f11da9172c3a225fd7eeb3d842ff4477bfda62228f235b6f10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d184dff5fcbaee96ca032320f2df8c9319d013c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b72dd69f860ee6cca7bdc99121788af619243c7116a140a1bf8ff941a0ec07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..053b528783836e35927e1356f7b98223dc854e77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4a829eb1ca38619265f647701b23722e88c3cc5e24cf684116b70ed3223e93b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bc65740e080cbdd39cbdb3574a7a558c4e2572d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3bba4267af465dd4b249584342497e1d24adc56b04d897feeb0cc0e7da80d82 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b78d8e1b9eb37454041895a441d916ce19d2a5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1751a4ca840e9526fa8f694e791f055e95c5ee009ff694d5af025f569b2bb1ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..926f735191657db6aa3312ec0102d962bee1709e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:988f7a60d9ec7d9718f0c2898e05ddfbed075785c90d1991be853974d8539992 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d2c9e3dd9fd760e5d76e2893aa7bf97af431ca2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be02bacff74bed35cb817c30e53e7d2e89be9a1ae26819844e83d787c1880dc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a48adbd23413f057cfc03358997237de27c2c427 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:328d674edd7adbc316b8fb8ef60533600ba440499b819b774acfe71798b50e96 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..513b78299c750e4e9431090793a41d5374727184 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191c18e0801cfab6c87a73f42020f7018552bfe3d60f9b6b06bc721491c07123 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed86fb890627000e82e93d9455b14b72b5a3ab2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7e806ba641d0f1c6bc66b6072c302131f078954767a163caa9e47da4a9f0e67 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c1416a0ee71c4ffda2aca43f9f376eb913ae79c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3a2513db12f50bf5821ace6a7fd0f5d8e9e9b5218305979eef7a304d04cd8bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3a96bf994c221df58fe5fa7a670c4902fd2ab1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526340577435d4994398d0027173f239c941ce68b823f61c813a3aab8a1549f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f132ddd8f94750b5c006121c56e451c801efc587 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f28fab4d9f1677a77acc1802742d5c5c3cb3772576fa43c2d7b858302832ac42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a1d8a175f28e23f1b10c50f2a430d0474f62cb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ccf1f48e50da0d02cd65e9f8c1a40c4069b889759cc8d97d1e4da621e3163ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c65a447f2c243cae13be9cb15ca075c83ff6cf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc23cc8b9ad9b35b47c2cc63fc25370f25d454d21a2d9007f9dce88a88f7b29 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ec3d251d6a840d1527546d5def3f868bbef0acd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb6c6bedc25f5be9dd149cfdd869219264b6488abbbee93ba2a1ebd59120107 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e8f2a6cd3014a264d9e92fdb35831d8cae2ac2d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3acd3e1130e3c638bfccc3355dee63652480eb8e6678b47c70d69b917702c46d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a932c4523e78cb6e87bea9b1519e086a1cd05b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab11e9b409aea76d7bc5e2cd49626a0ed9bbd0ceb87f453b5b7c5bab72e54cf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55402242c114921b08637df88976fc2ccfc9884d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e32641d9274076944a3d27fba567ad3e4895dd126279007f759591cfb4d1f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0614f62f06b68f41710b9495b575728bd572a7d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7340a8459668d4bf8e1fb2ba09d70a5a29613ef72679b5593561fa3570198e85 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e57e769f026377b2c3348f64439cd505e6af2f99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28dfe8ce488b5fdc5da24163411cf07a71c166e71e8debdac44c781fabcc9ad7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ffe03295fedd509ea31a323eb3f7c916ea254b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b75c8ac15b8b1d452d37c72aea1253ac6c262aeadc014d9ba0f3eb34728208 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..964579eecddadcabcc0b0db46affbd5731b70b3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44111135fcedde9e44b0ffed8c48d41d95cc24109ddbf73694988a816ce317b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2379ab3ce0bb6d92af9430b8a5cbee83a7825c7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6ce4c80f1e7b6e7ae633f481e89a23cf0016920d7112ee67da9c380c097978 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4ad4df70b2690f940f4211c02250c4988dce9de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c705fb5deeaef2dac8afef76ae037de8e2fa81df71d3e224c8285af91cab9a45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..727aadea9e256772dc47b9f705f4e8139a7505da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccd97b7693aa1013c260214fadfc662a20257afb55628563f4c34168eee8f54c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23f8ffbe13970fae6f29c49836c01ac41a210b52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc04d1a02d668aca0357b72aa0f580f397067c4872f713c8c267956eb341a956 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff4140feae1f099043969624c47c201013c5fb8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e915409eff1b57b7051d849062559194406b47354e8ef3dca75fa309032d25a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c35ae4f457766f35cc484424d8804cc2b5c3725 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cf5713b6f12f57b72c985fd99bb476d97d17e638906ff1557e4212f743211f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d36978434897c90d7e371cd3cfda36cd133f7042 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e08954038a7ccb7622b59b76bb9bdc82d57cf6d18f7e1ed52af636396797afc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d36607cd93acf207eafd2e744dd5c1ea6b874166 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf4b3078748bc029b7d6d694da782654b6c2f00b5d64c60b28a92c1fb573e01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d063c3b3e8e638c2f64977f22225135f462e3e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:430a5fd89582d9d03141fe8d968f09c1a82fe6787a019c6c96908016b620547d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9545a41c4e6f74e1184abfb2e5b409d511914f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8dc82810f6172da60ccdb6129330aaaa4424781b0dea9b30309febdfc040b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f36c09ecd2d75e097efe574ad98abc31525638b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a2944f3978299a1e128a6b9603df341952c950555248877864b1da91852ff1d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..80c904294bfad058887694dca6eec2b95e195830 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84fb769bd809b46facc876cdffbdb482dfabc686a075c6a974c9b8c553ea7fbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9c1338fd64095416e06a596714e9a32a314f268 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89abc29621b67f7daed6a987539858cd5e3c4bf80fd048c9ae350f0fa39d69b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cd7a13631a013f02e9d2311dd4875689bc7000e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec77a1cfe0558661513993e255ca5c8310b23b3c8f71b92f7d5bfe5a1c355b45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c51ceaa9fd2f5eec3a90524e554ff1a5a287cc2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a73ae89f218a27a664a9fdcc3181f29d576c8cd7dd3e7111f532a42d1bd0ea46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efb203ca4bbe875dea3b68b1812602bafa7d870a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:044c9a382d834bab2dfc861570d2bb7d82330feeb8c8fa95d16fb7d4cff6be5d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a12b44b701b4f452e16be5e0db446568df706f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b432005c4e8a3c5b06f36eb8c8849cd4426da6ddfcc07cd9597e6c7ff830f7f5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65bc8497ee599d83acf58c358db89eb404ad621e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa4a0ec187901863283118c87a6456b3125199db09886497342904288f31063e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d17c5c2734b95a610d991bf82475a431e45292cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8421e5e75fdf88c8b27ddc4c8b516079c3645b9e0bd0a7493e06fd5edd1da7e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e71db0174bcc9960d62979de119a5ab91f80abe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ac18999d8794323c13e35521edc1f5ed486feeb24a429e7e0373a985106a59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..673c0c420770c6d504f4f0b3f021af3512f1b81b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665038b00f4e1fbebc2814502aca7e4d3cf30084f43ffcbb069bd73133c1dcd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff0b0710f6305e1c98e3bbe542338a470c62ae60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde4521e8a98ab83d3f081650aaa59f83ca0806c6096ee72576efd6055e05a74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da4c38f8f140a905e4a6567bdab43e035f739f53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b017fc021c33d0bd819b766ae567c0a3286f96f781f0cc6fd14463a81373a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b164d8cce5f1b0c9670c4ef6627a83fe34e72ff7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa5c685c7091875146c28f462d18fae47ee7b0cdeba5f832d94a5c5dc2a4be5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d461a8eb5560392e75bfae1a3242add098c0c6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e20cbda7a745d6fa96d820e9da14276ba0839f6927f741e45699997bcf7d0b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ccd0d0080b0d51eea520f2922d5a0e2d3ad8453 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1224c489281649081a446d10944964b68ffe4f973be0c7046e285c6a926f4c62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5b613619e6b608c5445bb3d842b92292ac80e04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3dd4a7a79a529de7212c2733f054eafe6fee662f7171d64391fda662202a5a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65bcff35faabf0d7d675ea9798217e840a0090b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14823e7887fea71bf1426d2ec9622ada1328abe3be4addb25c0220814b5c991a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..102b0cadb6cca97b7d95d4cf6117466eed35f283 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4108fb4fdb89042621a4be8f84e6040985b916942c4eb023e60829c460ab56b3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfa4ba9ed21ae36fd9695421a3844fd6f6528711 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:052eecf9f88d584f76bf7df3fbae58a3cf34ca202c0482152c1a639bc4005eff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0b3c061a4556ff2458af14c8c4ab423cceeb0fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd02ed14bbc6fb7820bac97412fa4ed1f831aa6b08ad84f228fab87430a4c6e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6610ada850bf7394e1f046d96268f40afe17a5ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d3312885464d234b6d3e672a10a53951aa718d4cc2e0a8a7d8cc44118fbcdd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..433db4e3d49a6199c33f6b9bce412422ac18d621 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:078c38f1b4b3abcb636ba30c30968679d1c5af3d6e4060baf796719fc09f3973 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33d33c466408535e65017a5f64a1bc363279f02e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc5346c83e36a2d32febeab2014838682929f5d1497f999badb104053851410 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ae7cad38a7ce63398af165b1d3a699d992fef4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15fb18946796f3b10819e27f7522ac8075f16173ec98e1251172e92177eef4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a88a2052c16f64d4305394a4ca19bf00304874 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350c096b5bfea77eac04cba86f98d258c8445359bef2703f6c8c871de19950ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31329023d941c3ce18b08f7fd6686edaab12348f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b8c027b045ec21eb300760af9acc2897cb8e42caedbcc82394898adde02285 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd2f336d110a30fbf4837eb3907cbe29e3ea4b84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54fd3f06927961188929ecb18b2c2c3287765318c93f8e92f2f8a43dd1830ae8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..874663c4621f499d8e51e772eb8de6af4d5c9fc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd81ba96598692bfc0eefd268814cf49533000a195aebfcd195a556fec8c3114 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e503a20f6ebb1384b7c115e547fa99d08604c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5c5fc8bdb2385e7c9f4226a8674e1b2833e7aea91a75fb34c236c19478968ef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4487727d57c65c8254438fa124aad07a7d774375 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2afffab154e9893c15bb150ab3ab2af9a2610d86b1b3370debc391b2029b01 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb7eef87afa333b90a6e52ed4cda819693f172be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebcd41e6b14781e0ff93c590ad9d68704d445e1516921ad9a7e8a975297670c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fccaf46048de61fe1a3ceda66c15639aa883f532 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:360f11ccd0e6fb897acfd3df5c6276326d05c83ece97bd8535a0e7258c99c52f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b545f47f7058572e49f544e170e472802046065 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf0eb7f7b4aa8ecbd2f5eb3c86fd5f52282c9eda46ca0cd39a5f3b4f23b866e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8a1ee52b46336d603acdc7f706d2789cf725d06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c1435ddfb1307f8b1b7cbad3a1883a1630a693b51268df70ee599aa36062f45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52c79d9b63ce02b783ab7ac12a119eaeaa059c44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29fcfa5000832cc3df0977fe0a2f45cdf341ecbc4d805aaa3927597f1bfdd0be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..610c6b71b7388a92a6b06ad42bc99bf6ce307635 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a94b91d1efdb4694d758ce862368619f0de9d4dcb0f5ab992fe5b621fd1896ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04c96da26f291aa5b6adf9ae7ade198f4e80792b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e946c6773b489b84a6d4f01c61c0e4a1b8071ef0f8384613e035edc449c094 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc3a19fbf84fe1fdac03df270742c455cf343e15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caddfc8dbc3f3a44a9e9d66947940df61e95242dce04a48636dbdd4a2e38ebd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d42018f62646bc3589215cc3b86a046d5720f2f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5449ee84f1fd18ca4a097ecf5aa6d11ed84993a2156ea65e5233dee3cd620a08 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d61c27eef445a139f95d6e41d73796584da2d472 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bf8c4ece687d64f775e76e2336aec9df3580853f10bca1aff47dfeb4e523099 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a298c9108e0d2e455f061031fdc239241d9c9f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8da20581e2ddaa196dafc3d8327c6fdff2a519da183cb544ec025ee95acf9e7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b97000b75b40a8131fd26c3fed58c753d450975 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778d22c1e7c13da75c42747308e9807cd8fae718bbad05cb2727992cda693ac5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26a147e19d965e73dcb1321a1240a9add7012c03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58bc2e2c83c20d6b4766e6305496a04b95a256d66814a65db96919c65ba4efe9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82b24c0df1627a2b99a09c01f67e77da04d33e55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38d37957804d877e1daa2255f9ff4e3c336f40ca355a80e2f46d2729bfc4ebe2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc319c5b491cbdb37d7a7091e280c51e7d0f312f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b7d28d1679fe8d515cad3891311aae64285f2a6a8b77a26d1092c9cc7e00b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2bab85207823b4ee572ff764294dce86290e09d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7638f20fb7b1e42d158789c3235d1af030adabeafa5e054e63033225f4d6cdae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c52fc397b1ddf35ea26602e3e2ba13cfb2850e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892834e76a81c845ede7c697517c83b7463c9ea46b66eebc5c41e3d6e700bfbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d7d6e1f4b171286cce60878de2d0229585fe3e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc1efc1fd5767981e8d413caa06efed9e43f8f573911e3a59cb52f5e9864783 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88b6469498accfb02bd6fb87b73138ad93b66781 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caaf673c2ac42ba3740ebad7fa8d899580546409c876f59be666a1aa520cec8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7beaf95899fc7433d24e531d835e93c3ebebea98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:059b06f4b96e691b085d9f0984b0502cea608f6d846c3c657d18e0fb30d466d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64616275d698abec9e46a20ad15cd77dce9c089b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18b3f3e482249fef187fe91d0ec20f3dd8b914deb31578596d1e47cd8cac1b6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48c6250bea2bc811720f8089d3b145230a84af71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21075533baa3b81eb0fbf09381c2b731d525931c7c7f6dbc972252031f3dc0bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd037db89c301cbe66e9cf33db9a788e59777151 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d66a8dee8136a28737c5a120a91ef828a3383102de426cf1cbc8a1d9b568fdf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7586644763f8eb2c2d52101697c9ef432fe949f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61bc7a87ced73faae4335f0315756a00403b93e48618f6c2faf4e5da1ce95b90 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..588a612a2eee48c423f325b14db0051c8268d976 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d8f3534bae2f852db004ccd0a097296b2df845e547bf564439d388ccc52772 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1979a07076b4a616a68987b9bce40deb1829ad70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500a126623ac0e101d8eb49d7f619c8af0439bd6837e722ecd624240bfb391db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78be6b2a15d9160ac793da09f7340c0351db7d1f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9a9ae554bb061af89778c5b45b6939afce3faa9805ad97232a61805f015964 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e03ad2da987ecbfb0931571d4b93e71798863ad7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b86286c3d3e9ff18fd9b1ccd6cd2e61fe95fad93206b04643c47d03246cbfb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d1bd1577e749b72e0376143929aa43230255ead --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4bb2fe6cb3e194a05d5004a0f8f781724319d3bb83e07d4b5f03dea751ec5bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53028fae63b9ed5bcfc6b2d68369d4d9997430a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f1868aacc573a91c79568170fe65f177f1ed63dda0fe193f6fc897cbf6706e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8ab9ff1669ca23686457068cb5b395676ac6276 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992e4173376042281954c62853a2fc9cf5e8d27af015f5349e4c9c177b826437 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5729b067b2e92e3ee1d5b817eded2b3c16f6e56e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d1f5b64e0e62e6ac699919113f2994fe594914a9df7e7ab88aae068369e55e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..206a82e0d3420b896144e208d708666d897c8f10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ee255f95fa066bad7d996c7cb43471492f36f89cf7b4d6e552b43ec1403192 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7598cfdc09f495178a2b469a32b9d21bd016a32f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce6ff7ca1d42a64fddda96b89369d0a1bd728c9fbbb5eddcc8977e7803fdb644 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edf93de50e2b5a61fd14f92efbc7d34f11a53e4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369cfeec6a91710247525c59da414ba37c05474f87fea255e7d3b8bb1752c394 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba0bbe74a32df7ba32a2b71eec3f5f97d0c27a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21caadd90877fdef876d8942ef2a7a2b3e5c3d7da02c86ff9f29924e7551e720 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2352c7032162eea4b023e21fa0719dbf2b58681 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bd43c3ffc43a6f11ff52486e0888ce6dd45366715bfb33edcb1abee597eb461 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87bf9158c45742b742835376b39134cc6e7f8fe7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20945c9b7bcba2e56d36664028170d75c98501ad85e3a2b8e71c3fc16beb6075 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbc9e4a6ae10577cd7d77738ab69e47de0258425 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2554e713e70b2568cbf4b2a7fe8a5374b375c12ac1d993dcb1e522360f47475 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83d4b602eb89f53a15e2ca0212417641fb27992c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f390ccbbf341672ad1a26bca9cf427fbdafd612c845c58c140c8d0d3ede96ef5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..656c8035fd96196d70dd89f207b6fa099b1405e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d260712fdad721a6e39086e3c10d45ef856e86b2c068e6c6456aa91ad972cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..140534277364286dadee7059c01b54fe69cd8346 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac7c3bf3c5d7f6c07d4bff8e08aad43370425e4496615423416e7d43dd6669c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c812de3bcf537f24e002418857f19c4b0439b3eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9347613e85537b3751ae23f626d36f660975c6f18069cd0f67498b9b5bca8bab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a02f8203806862cab02d506abe1643d1e75f5e88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7870d2bd941641a1c362fe14d9b33c06d343eed01508b0979b17a92b8247bbcf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4afd5bc132ae1f7013cea74b834369a3688454 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca1dc95fe9a3eca9a937a143ed5f1b5ada8d53ea0168f2dc02b8be8ca42e9ac2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c3fd7530f663b17d64123a71e3ab2d43a6eeb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d779b1a9890f108dcdaec8ce7caf310a4ec943a03ed433c0e7c6e90251d93690 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9b204a53be639d57cad554435a993f4236fb18e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e62d51495c4827cd15b523ad56aba4bbe24a7cb3e231d40ef20a541aec47f556 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86aef10ea00a87eba21de356994e9dca0d0d984b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f3ec4940fa4a92f084b88c0c6754a1e8c9ca8271d74e146c09a2d83f8ddd4e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f47ec587e6bf2f3e3aa82736e713dbd0aef262a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f5c03d4a5562b200d1d22691c5360e248753009e154fcb5024cfb46696c3217 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..418ec9275ffe12cf0df1ce5eaf1db89488566f0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:294ef467ac783ddc17713c8b8c8a33e395a567187955a31ffe86760f75253166 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5956bc542b9da81eb8961ed6db8393c3042abfc8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1595d7962bf887a95d527715e2cea7a00cce3fafcfdb027ce009f20db36206d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ba3dad320dbad3841d2d6ea677fae1089c140df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b568e6105da39a4f801effe252cbb279a5cd36305804249b4de07a03b29722f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b702fbd4fe1c61106cf2a1d77d556520a5d1fdd7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d77336bba3e27f3e5e567e3132bf532b4646f1bf84c8919f3a1ecd8971fc218d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f09b8adcca9e4f46af6aad630689967e37cec39b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0297836fbf47418de435b2890ede936be48db14b592d7169257f9aa2875c42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f2322f73b6c103a290c3a2741d1826cfc3cd7f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e54aa6cf78250c914d2f439f3f0311460b1f637c0f40fd4db2be3a96f365a00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f96446a3acddc6c983e58ce00613977923e0c6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb0626d86c77ea4adf5c026d30d425e5bd5548bb550b24fddfe7cc44465c1b00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4a32a573255a0b07c1107b5a07f9f0a7394a815 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7de858a1ce5d80110ee106b921618ee2f7a6e9e74392eae1f985bc27b6b065d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7911f09da561b5abfbecb056988193f763520369 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14170901fcfba9ff99307f8d10274a42ba0c3e15099db7ce6cf15395078437f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f84c20d05591ff0ad2a083fe79fc8c244f878e5b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc1c186a4d1fa34644e43f450e968427fa7c5163cc375d45ddfd7810f061b05 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49bc65cdcaf7b8ee3da3455354279ac98c9d0c84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9759a6a65b31c1c64e89f52c0934b16decf3f1b2922b6ac6733265a36cf59a12 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9814c3b369eac2f4fc86b40e6f6748c20c20d1eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8d7b0ee6065f695f27d25f4e98f96ed857d91ee7f91069f2053963c67f84da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..301de05a523d4fc8386ef40be4469ebff4c0072d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abae66358cb3b21f5625646abbcda796e7978218694d31dde5d286ad4916a2c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..faccbd004709d93893f43c7177834f015b14f50d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a91b605adbbc60991fc4ecabcd0f7e1796e1ed909781f6930cf9980d6bb54b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d83a12aac532bef400b1a01338f10670259a27b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263a38d802ccd49d30bfddbed8c524932cdede1a6b5284922706b37de8a1e617 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cbddb35f4cee7bde7a2e6b50a3febcbd7e52295 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:219d9d3f6a7480b7a61d0e945e6091e3f3453ce0cf6c7d63f70dae5662485ff7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..222b9c8b1902709d54aec1b76d9e041b3175135d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f68e6046c9c344770c144ad6cd003e1f37565a6f95cd3f5f44d4416a8e87f0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f55bb8cfe3d00a89045aa8f0e401434ce52dfba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:838ac3a2d0b44d62a9765f22e764bd84a921957cf3f32cb98a349d74424ff037 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40869f30399982ea9988271ef8b41de65b0dc6e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4410f7bfc9ca45c2fc3a2fcbd9556b1c3ef7e624a5fc4426a998d5471c5738b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3ef98431625e921202e384cfd2802ba31f1dbdb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205cee2ebdad77f1470c3cda89f97989b429eac023a2e560db459a957bb497d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6429c682211e8014dd9d8ccbc62abec212cf05eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45f823a6591fb63f2fcf262bbe1dd9c61907b998a57464c35d5f03c6c43f70f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79f3300c5b8ebbbbbd91cd42305f33bd655e905a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2c1bc129cc778a0cbbfd48ccb2d8379841eef04a62833368089ef4ad08e266 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97671f5ebc2c5500a22636d7bbaed60d0991819c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd72934426ec48ad51b333c79caaf1f48effaede833faf8fc59fa7037f1da83d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe8ae4a6213a622896c97e8c2a3271a14550216 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a4f44746c8743e6767b1e17d76bba0b4b3589ef2e81bbb6c31e718bfbbf10f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8910daab01d000291b3a21eaffada3869385c44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651205376e23ee4b522e0eb21cf2c586bb9ccb01f328fdbb467e6021f5cfb9c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b04384cdce90c14c51bfd6b51770343613b9b5d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2a9cdd55819cd5d98197e2fdedb39244732dc6c9c04e5818884750877aacab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fd9564a88623457e617c10928ad8a9e9f2a5e5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad1859be97ed7a65d59328845e58658c20e34d01806fec4157c368513a11bf0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dd9d75c342d2bd4e03162eb144baf90ba339f9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f5a407d75266f3abcb5f3612213bec526b76d996cee645c81255e3a2a57520 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b4698c1de86593bd0ec5552cdb76a393b710bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ca19399b3ee3702dac3ea85dcb39a367c13628b3149ca592d4d77eb0ea4fe2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8086d3bd2bb3dac950166c8183c1ebd9a2993e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66cbdb32a400bf87171791fdebdf64ceef77867cea09495b275ac36b0845bb8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..899ea4e4726c51e12a7676c176119a1f0e46685b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:938f30686d29b3f24511253310793cc11f124e7b58b9f3d77d2b1fe1915ed016 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b417ed9c3634121daf694065158f843fac6f660 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963dd1b70ca554f1cf1fbbd2528a10f3d52dc85227f05e67fbfe59878d296630 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1d2f0d399b851106bcdcca15a658406c01efd96 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d035716279d8129e1e9b64a7902a3f0098b2ccda67a36a78104fb5ec02d59144 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..84be6b0cb66d0d93b4b210c87a77bbc5c6b5a9aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378e1204b0eb200ae80da84d83c6fc1c581d3d85bdd9c3695a3a8b508c0ee0c8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75fedf81609feeeb8b55228db317a04c186b703a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:444f88fae9b88cf2902e2ea5deffba32e362ce7ff4ce5da6ed08473737eb0af3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccdb2dc49943d68c33881501c4bf42157ebb6aee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f7e2375645097ffcbcd6d8c9b65963c62e1bc758913303dffd9a2b04be0ae5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..363cea3e1ff8d0569372b47f9d2c07f6dfd2250b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22430a89952a901db0f98313636312bb4647bab1b8a4c5e3e6950f7e9e7affbd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd71edd30cbb8cdf28e28ea6cedfcd82cff092d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:822c713ecacb302b097c7d917b9b1cf061bf79bf5418ee0098a963f37b984e6f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a034727679bcdd2b366624872b051ec83c89716 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34713054d7139bb2584454a47735adf2a8fcb1784be8314ffa7f0ae241c6ac3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fefde54eddf9076331c3df4524c01f60ac49572e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02164181e7e7ce63e0196afbd668e9d61c6439a26afe628a655658f69d5f2dd1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbda25e8d803052c016b70b62a3311edd469e38a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8e73e7fdd4c67a8d0c0f6860dfc0bc99b568216ae9800b262f5733611fd3e6b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33565c94d2596a7fb5798b527cc52714a702ef68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49053a717945ee17bcc8c6854a32c01987f23f0e5b7112dc6eb6d480c31d3a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83d58ba529c79a078e27be89cff967e6cef2469e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5ea0b2cfa8f1def7a749fa839d37e8e75e66a70ca34e4c9d59902879ebcce2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06bc9afcde1f9fb8dd759603d2928d214e3ca12f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9696497f40a8b5e8619c7748efe40cf68229f9bf85476cea8a3aeedf5285d83c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79ed51e42b962a493ea36702a1a54991fb0478ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_6/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f3d949850a33fe4d2887736f6478a93681606286f2333d905f769594fb400a9 +size 11395