diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3687d12f050e0c7a8b3bf367c9484ac8f228f20b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce3b002eaf000c66ae3145b821bdd6a4b7af085210e55826833727d85659bfa +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8c6cc20be6143ec1156285667f3ca6e4344aea0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f6bed76c35690b07f17c167360bf3cd5cfde1da0c617435b8e80d2c0e424c9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b969f046605a4e624d390ab2c6a3042ba650fd3a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b448d5ed6a23c25ec11ad89558970c6f50d2f891f2d66d9de4b8225b0de828d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32288b1ccf8ad9d6985c0a83c5a6d7a851459bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ed81b1a227b1aabfdffabed3206a05784226b1063b3b34bdd9ef63fa958aaa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a789f3f186fb8452683eaddced59723602cb2733 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25c30521a7642d6adda9cda68a781695da1189295a21c875cb4a8c94988ba3a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e4e4f7cf6dfa67269c061527f8f746ee809646b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee212642bbe6f35f8a32871dd6bb3905a4977cf08e4e2ea4bed417202bd8bbf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8800b2de6fe918e99de3999aefa6822a68701a0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0167fdb8df4f24f0190bbf41d93d0579be3862507b25538f3d2d2faa33e39249 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..483fd7ff2f3b083ffa2044ed9f6b09b3d86c70af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:226a8c869aea5a40f52e8b64b8daa762f80fe9929b60e5af8d22acd91fd5a626 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9de78d2e55e1b0e3e132db1cd866a65d3c54928 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab79fe35179faa043842a5958bb97bda8f9fd8a569c87404b88ba584e735a217 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d0ec77234fd09b4e9c84e3bb134b439163db18b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc6337a5cf1c32fa0368dec0a29f3c820c690d002873099caed4343498390fa3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9baaf2f144ebc3fa23248a06c171058a6ce4371 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2b03685a0ea66ecbb02e503b42ae60a913bbf446cb1c68b70a2d25cbca3b85 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7cddffbeefb029f1d29a22384aca145acb69a05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:defb0328ce5bfbf8f4ebc071768d057cf32ceed4b1a54c569d5d7553e18e586f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db251802cda40e2d8f95005ee7bbba2972aebeb4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:272ace44f903b3e3bc6bec1e35a18f831207b6b8f04a424c8224ac5deb36df75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3dc98ced633ef8784d27d6c438727828f5ee26b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc2c69ac87ef4c1033d079c74ca7c6b3f79183aad14d1e6a666d774f89141124 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e3641e54df38251d9f6033ce473fa5902347334 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87224bcc9a640b3c08108e1c96867ce95320ed305700117f671801f750df71be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39d4a14e7cef27a86ca094ceb41759e5c82ac7ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a6cf979f3837069290a8974649930063279b70d183f0de38989b9729252a740 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2260d13bad075ce46580375595936e07c829f0c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1dea5dcba16b872d36670798f19275dfa58f89b69e72f3e7a418eabdd6bdfb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a79769a889f7620a2495e3e4329240e95020483 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41eacb42fe6fd3a6e2e892053af537dd3c7cbc7c9a4a4ed9761e0c126c8a3031 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1061fb422e7ab49d70390dbda2a2edea9c699518 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbfee50cc30356ed11b7316ab29a2087f06e137f8b3248a8dab0e6c2bb3c99fb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51fccef7bb48977e3c286e876e32e9c078b4ceeb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42585a82d4fe7f501ac0b6a94e0fd06ee836b14919e5a8f8906c54c44fa4045b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..203fc32d77cfb513c567099f800812bd4cb7b9b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84995454b212c90523605ec53a3aac0ed86501c371f10d115db9a310804c5d4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37ba0ddb8c177b975916b242d6966106d0f13c58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93c3e2babbe240a14398f91eb5136840227d6c27c7521d5c46b49e62855b9b65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..633031766033f222342726e9ee414e66cb37849b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2470e9337da32e12b84a7e82ffdf4ab61bb65427e652c0d84e15934cc61c939 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4ffafe7c7a68bb4e3b32a2ffcea373290a4c191 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4887967ee8a2aa484ebab22c2c19fbcffeb81be6816f9d29de62b91fdf58a1e3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a7b73e67dd79aaed904b89a6b9f0e81d1cbf81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628414013086f87eabbdac1cf7750f739171546136dd7c899b255da64408f969 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9234cb074f1546cb6f0a1aafccbce09052fd796 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb1e6861e77d624ff1614af4a70209c52aaa1fa67a0b3b84f948e4174258548 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2faf0dc905867a086a1752d147bac0301fbf5a48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd5e59ae1b8f95bf800417b3be0061e3606005c5f5b935830d08274554905308 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7694e1a57d9e6cdf29246e196ebdc8470c94c556 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520cb1ce989a9ef4d37e529b1536a39386c8ce391ed323eaffee22410c68d886 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..550fd13e28da0d796c5cb794940508fa41cf5c01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970fedc66d2333b78ecddab985861efe17258d3c02d733ce9f15aec38b62dc2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f57d9afc34d7d7e99b08d148730c39164ff4b63f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05304d3f8bd4df775317e7207bdcc9fd09df156941cc0a4862fadd2d905dc15a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5b91ecca2d07ce45ea89cff26ee248ba1b23fe7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c43fa36a7679073d9ea0f2291f6c80aa120d194b389fee021366d1487150da3c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37a29bd166c9875f2b4cc7e5b632cf9f5c2681d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a03766e74a01fc83a701cd66358f2a60fcfbe8ef84258fe23b89d9369de810ef +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eb44df20a50036314451138cefefafd84e07cca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f91997a8f7b0d93bd28f95d4c8b6e300117719cc364076c540d8f5cf43f152 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de7b1584145c105d7de38b9d71e7de497a73e7c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed5b79fd137f0900246abbb8070658ca763b1721513769aa46ad62dfa36f0b2d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be939c7f2d54b87bec8def7d927b88b376c7853 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c45571ea194e427322e64cc8593ce466d9744b36a87d3ef6cf9dc2fdcc104a3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5045e3ab73cf2543c593d9ef53ea78acc4428b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a3bd6d2cc0895631f7b0776b7f717d58acc707831db3de64c7ebfc08577bcf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81713e1aeb71980e96cc73ffa5ca897c4560e485 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c971b68086b5da6ec8f26a65d873939af17f1796b6646205d57318e03d175e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..300311076b21084e37caf0ff92df586cc5284c6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66117809d7b51eafe8d7e464b470d3185ca23e5b66b3c695fcdcb1ea300f67b6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7290ee805dc84b68c33c9472c7b8e35b4fa63303 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb8f06cafc763f0de7c72c52b52bb6a645bddcd19357ce2299ea8a4a4f1e9100 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4105115cd8ebc7dbe193d3c5749026cb296affc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0420b9a77857898cda679c44a9be84b61c26d4d0106632db4583c98569ed082 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61916e1742d978c8d84ac0a0bbf1aac90ea54a87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62608329513141dda2cf6096ff3c6a688e56c78fa8b532b97af588a9a7192a9a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04f1319a4b9570f3158d1628007aece44b09c507 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bad812a13c901afea33cd138e0123bc274939d2d459580ffb80680b46e1027d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1414bb2459a4b50cb3abccf568fbd3b0690363 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37bb8dbc1bc50f0e09d0bafdd5fe95aa347e3f204a754fdefc174afa5c883f55 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f35ba1e9f415e8cb27428fd4afb9ec67258306 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8709ae3ce9e58aa0a2bb0783024b0ded182765d906a4fb36857465b1bea22af4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7879ae91d2f6ded3411a5534470722f4d5715667 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b3f0ec2671ca64cff203ae001c5f14d3c35140966bcec986230bd64a03a44d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05ff07c20e97565af572e605047abaa371d4cc2f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ba63cab68cc6657e9d3ad6820a963934ee1461169a879da4657e4aca1f0e40 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..348229f53994e1e18ff691d15ea7ae8a18eee058 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b3acb274c9c2d689d77c9abe74a33544bc78c25206525fc9abf49e232f16e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..befe78bc95570cde04ca8e97f4ee5371b5b09481 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a94406f5c253a9d1ecb536df2ff6fd9958b2b3844e23e0983325891167dbac6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c8579bc4a53a26f4f27079b2460f3549bc3796 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25fc101c0d4dafe69577a59790c8177a1c91d8a9f7cbb5ed30baaf02abae57fb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbdfab30bb43416f8a5b7fd8f70e4e0907008f66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4578e8035c145e2cf92cf29888096f1e8429679da18100fc9923b3436954b972 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8712e1e19666662361e89f6a0f7b46c06d6407d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c2ae91d800e4251bab9d79fa33f3c98e8595a65dd82b8553cad7d64ba8b494 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ac84f5dcc8031c96346df82e8e524400b52e262 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dbb4d6154f5b2275cddcb64acdab87037818b73d9fe684b1ca0d0f100ae2fcb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f525440cc800f2997228877435ec2e4692051735 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12245852d9c257d5d1b638c44ab24f0300928404eb57be645246a11f56a4c842 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4299bdfb8f9fe657efcc589aa96b7301de2530b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f269a1766260a965e8c85da6ed4b3c51e05e285ca000b1e4e477d02feb404906 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28e89324e19df9867ff4377a7eb95a3f3f21e46c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e63b8406dc4879a8748e21d9ba234c5999c9a6ecc90c5602557ed545bf1fa651 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..652dc108d7f4d281d61fd6684e0af3ce5c392d2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:277e83e960c419735baa3f8b2b5f16ab5e63512e0e5edf856c4f264544bb0150 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f09b546327e62980b4a6091d84c44c37c93c4acd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b84597f1c4319b001cccda6126d035206b7ac49591f259c33f3a99c6632156a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4dd261a9ab81759fb0ce9ee66b00867223f83a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9432121fc28d316a21414d5fc3a16822d2b37085df56346dccd320c3bf9184db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f1db3c932ee28d8969bb6d3b9c65d5b264c7f8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cee01dff837c8b7947ecd6c425b7ec01bf85a2716f0fb5db91a3e68fbec8015 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..588c3db69b56fc690499c50cb76fc464f16c2ac9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce88c8d51e40957fc466838566596f01d9b628bc90026f7b9b654515c6abcd7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aeb29838700c350cc181ad8301d8998cd33f8a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0568e905d44d86da8c020f0740ec718bd9becfd730045a5dde78d98f5dc7eecc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6744bccdff30b6ff15023ecf753e4b5b2402d43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a34f50e295cf4d3da7d786c9e5eae479411d731629dd43557c9120712679c8a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69c695e70274525569461f0f6750379aa887408e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fdec5b93a92664941dce2ddef796d0bb70c8076d5dd562d58feea957cecdf7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7113dcb854886eda6d3ef259868c90f686a5676c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55768db12af53f633be9101a07eef006ac272321d4854beb6d8d0c0d2c9cdfe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..742205f63b6aab7806288b2707faf3b363b44568 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c67e8d570bdce4197444ca48c73196efd4cfbd963eb492f6f0c3a92679055a63 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddeac639aca915244b3456fc07f2d3356117fe12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:237fd400cdf127bba94c0b7e646b8e7c9ffb17f7c723e46fedefaceb1cb89a17 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6d66b3fe546c3db74106625e182adf003b89d83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:156eb99e060e4abdbce7a527193649c827dde94492588a1ea68e72309267c60d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79a8fbef1b017fec1efc0e967e25ad078d5a4af4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe74c2a91012aa2fafe8228b7e8c2730c25c22d6ed6a20781895ac64781bfcc3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fd782447f010746460864cf79fd34cd129cd05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c227afa53d53fbb204ff351335c4b6d34cc6f95b797b598b1003faf1d0522604 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7bcef9bc66942a00ca98688df665a37ee10854f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ebbda925a544f5e6ece066f9d3ba3ff6ee27dcf618a0c4f45c258e3accd65d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9b65e68b98d3f16e6af89653eb5dbee8c736d58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782a2c1e421ab3d0d8ef4f697109ef4b6e849b0b24a6523d54f13979cb6cc91a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae05cfc080f3a6b747ab9a5bb94ac62b0a736bf5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:487eb7655c3b7c8d06f6c10efa5a8938a206bf18d5b85517eeaf1413c1f6241b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f897342ceb89dc35af1a432e62294300da443c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d93fd9792b7cca58ea558a683cd457a7cdf69cf70f6c7d287b3287d02e4a79b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e464183a231a3bd07b3cf4b98fd77d84a78f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83f56ea511ed022d452dc9fbddca48149523e75bdb26a198289a16f401e7ef36 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e176dd3ab13204410f1d0bd30866ac108cb5c9c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c06a097f936ec4d4ad58c1971595960d41d3f1138be42e9ea949e5684594f0a5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa645fb37812f41548727b357d730b5273db56e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff6f3112e412060b5637270cb1a6df94f8fac15df5bd953e6244c4494371a9f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c1f03cd0a6c0ae2ecab72649a7829189ffdf24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0505870f34fb3078011611359ce587334e34f3b80371b50b9967aa65782f3a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3c7ef235994c5abbef80d66b709699a7cc9c5fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:753eb5cc4552ecf0f78a3aca4ee66327985da384595a8fba1bd9c427aeb51468 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b2d9ad495d060f5b99109f9f4ab20b93117107 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6adc61d3e353f2f3b04aa6c639fcdc1839008a179362863a6a9bfc1a82cfa54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d52be9a6e4482ffc77e986576744c49ff5cd4d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbdda0f94842cd146d2739711c1633d09187e3aa284cb9eb48d507c686acccbb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c3c4e69766ba561d71ead2b148749aca829f2a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4780cd5201ade1c3ee4cda8c3f75ae48896cd4197ea38f56017bd40346ed4829 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b72f7b90e2c106a2d53232d6574477d80e7c312a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8ed344a3af2aa6d773a0dd9b2619e656ad577340596d2eef9f7db638dabfdd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e65e2690ce45cb7492f9548509ef18aa76598422 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:764d259c14f7693e1356942048658d8538a8cf02c7e2e78bdd2bf0199b5321b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58bfd4a9954ac18abc53e7e8efe22e3118e2ec73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f34fe1af27d09601dbf39f2acf75c7c3f031b8bc3569360c6d351114aeb39f6c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..872fca08f241e6dd9ef4330131f3b008bf943e0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:282ff2b734654b5f5a85b35a505f3867a386020aa593b29cc5ceb5fbc7eee9c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff9db999536406361c70e47d1c595590add775e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b18a6e7b658e45df8f8b81c4280de75fb9aa5fb8055450cbe9fd069b0a1c8ee +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da8cb564c64b1b738f23fa8d1179f543bf610db3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c99c476e5a714c183fe3df32166470f548200c145db5495e0ecdc80eb30331 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e929a74049700b9de5a46f96569e19c6cd7a5ae6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2a0af264847ef41e757a7125133f5b230918dd89d870dc3d4f6201c279294c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d67952d2ef8a444947ef31486515688af4ed0cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb4de0435d68b81277f0ea4bafc9f65344f6f503654d1ad1399a48f6af0b2ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bebb2e7f8a3870af62161c803b02017564ac3b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf56b983679753a2d87906cf88f73bf7065658db3d08a2ec9cecdc3c4722680 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a672c5096ed5069ec2205368c56499974042796e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90bf23074de67bcda167ff73d1633aee00c908fe28bb301f8ad1c605fabc90ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6653a0de1cee28c1b84e6e4e2c3cdfbd76d8070c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aea07faa23be11947c1d12bf7bd884b5fe05705eb2a567bc74fb06ceee24d5c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e981a1c04af0e976de16efcda59de40170f2ac08 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a212e30b845f71549380ef5447eded782ab9f68aed92f5efc6b6a21afc58f560 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3d35ef08268f6295fd5583052e2be040d977415 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ff621a570ab622534d2b1765eea449c77613dadef84fe0c801e38ce3107760 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..136dc66137f24fa210e04337f438f8fe69dc7cb2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3078574f6fd91f8b1aeda8ec5db8250df8e80bef3cd6349ae352ca70139858 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27c578afdd068503b6348a8f402e108cd05b5f5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e62ff13b688fa67e237ca869da0a9b7f38d72e2c009e999abe33231ff47ca3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..554ec99cc8d670c482df5ed5f666c5675ef41011 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc859e669aca3add245098fadcde550c0b3cf964a59930547ff777cdf9ba3ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e05a275db0ed888b008580a21e197ba365ead5ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80c5aaa28e791b69341c56a2136923c72ad45b4a1e3052c9699991797a812c8b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10268a3dc7c19f558683419a0c0ccaf0e576d023 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4279e3ae97ae4064b5ae7e0a26be7d540183375c2f195647ef931f19f510d14c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..927f8e77095dc7b982853981d71657997ffb16b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e921d775fc42bc111d4035daa5fa12ddcf1174d974c2d84b3277900cc039a522 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e277ff533fa73f855f1afe03214ac65535f17ea0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c602a0c345c4a432cc15ace4bc39a3f262a4efb67ebc1cb49ebd49710f3329 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5329767d37082b9706d8c56fcb127f1d171423b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cdf3ffbf654043e2dbbba732119f697eace03783df958a77bce53ca254bd4e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77d5b558b85e5164185cc5a4f67fa150aea02155 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d09915d3b86681fd46f684599627bdf98bb10fd19eb6427b27c684c6d3cb2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aadf54d6da2bab89f1ee781890efff029d65123f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed804f3fdd1bd8f543320be7440eb29d6550647c51f60413953027a74bac745d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b96c5b53a19e4569af7ba6df46b5b173a9cde8e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b73daee05e70a9e00bc71e552d090bb448fe72262fef651214809d6dc62ddbd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..356c908f9a7bff1cb5516fdc889d11e7dd24e525 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46908fa447727ce39cf3c1f40f1b4b2932bb99957836b8b7b40f9a8686dfa6b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a0f64977c331782eaa51136945ecc4c356b9a4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91c48f5cf9fb094c8b05c801301284d741e0ab0260dc4a1fb50b3cea41a40bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4eec9cb4bfd9a46f42fd0c0fd7d2608750e99c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a6c9c994cd74070200817610d50cc783669b59d75b244001b16b80299d572e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5fba2a22707632a5a543f79224655483123fb04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f775a592113201637aeac66038e56e3eaf03e77ba5f8dcf90e1a1242e34f8e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe0b96d08b2a1b05191f4cce4fa413c4c4b7cc2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:481c9f44ad4399d3e5eb04a49e58857bbc3c2fe94448b15a5e39d65b077ae75a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4eb8b7d70018e097aa4440cec704a4e367905a4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf71cc25ce42413aca76c4dfbcaf8775a7b3619389e5ac0512e7e08a12dbdb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c6308db1649c28501fe332e610dd6f1242c96d6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611b5287c0ec6633fabf17dadde4ab09e60fb1c1c1166f9ac3d4a105a5ffd179 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..013aa4bc217fa0dcb59a30cdf8e74afdede47ec0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77923a6a3658151e7fb8676de3a0faf841271a55b02ed8d28ac1775ef02ac5bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..822ffecad1c6a4845b0ec6e3b40cc64a0f30d477 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e289f73810c8bab077f2dd767fd8ebb0f5850f8eb324422ada4678596b4505 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccec3fbf46b71907f0c2d44f10873e518c05ab47 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f8e20af6224a849a3f0ba2b7269c217f54982072456a48781a07e673b293a6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3488719de5516bbde47adde949aa487c60a5f753 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a1e27ac9709bc383a2c0d3ecad25a94aa546c779228496def8037e9eecd717 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f92eed21e99c3b4f241c0eebdb4d27ef66f7ab97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb74c7391273c185b188f098d5b74795ddad302c3816eec06ad43cd73ba6f28 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d4d8d49c0a2ecaf4addbd520935bbed4ec01910 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5263eaa0adae649e61309e0e440e05332833804f6db27097860348e0e3cb664 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93568dfc5fe7249bc93847f5ae5124e8e191e046 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23cf36c08403f64f79801d00ec6de0e7ccecdb122cd33b696352055141130d3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..314393b41a62a62279e5bce9b49cb316ad524b64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4174bd1dca1d41c8608276be9fdc2ee1e4a6fa22a4fbf6f4b444e7f245780b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fac0fab3032c958f83ca257b75e4e488157ead9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34c4dc55e8a4eeb1df1c19f9479fe5b946ea3cb55da551d28f5cbf70938b7037 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa8cea7d0a2ff34ff02684678be25318408b0291 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f13ffbd528ad33bda67499e42479e8026bbb96e409e3ddcdd5fa8a14259fe3d9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8620edde82d1aeb1ae5a8dbbc234f80f4b5bfc4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:787f62d72425b6ee7df29c9c857ba146080a8f931a2b075237668aa1a40c5520 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98888206e1b72e30f33d5f7d3f04b62c64c5bde7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4da523e25eef1ce06193b18ee849d3bfdc6a2a9438f7fc165a45f42645a678d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81cd9d53e7441c8c640f54b285004e8ddc756756 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49c53a33c4727aeb7d221b620fe39cb2f3608f9a589c003dfad9bbba5b7b562 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bfdf0729b809238f3baa3249b4b8511d8dcc355 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0597433f907356318852d6006bfc0b16f646f9f45dac08a97c4b3c9d895f245f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8879ce57e8540d7bc602a35f4133c0831f188d24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7dacc95110f5ec3e4f161b73a9d841d534d0f481e76bb046e4723478ef2e028 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f4f1dd6801ea41be55f679bcea3a2227b67f4ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e6ab61891c6a84cb90390e3e42937d26a4e3f5a2ea6f00acce81829150f490 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24cbb31463be3eeab3f927aa680390b7da102d39 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e11bdc83126e6b9a8170cea08652cf7ff5e766da6bc1c068f6e225b736ea0ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17699fd8c40fe6ee14faee03fa6d18be8b672963 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e8965b807d692c23d2abd5a2aa588c23c5cc994fc456575eb1c7fda81228a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d39237358d079c2e8514d40a0319da7424fb41a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9b49dbdb91cbbff3a2e6201cf4ca55635c986590cf6650968c7bfc1eab23eda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1abaf0d9b031e51e69001cdfe4b005b7a00ed9f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a05aebf1f4a1eb0e330280eaf53e494b7fb08bdb479d2a63d76201d5ca8f60 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56d0dd997df59f94fba7372c245971ec8d944024 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b6da26de1436704e5a068354c27f9ce4165c50e489ebe4a121a75744440d00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..541b217d74c653ef2431f51b38054f041e2610a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bcfd7b41ee071da935b99316c8dbeefe516311cad132fd4f0882d03d45efd02 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee6ea03c5fa053557d4b8d9e3745375fccd98523 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a750add3dfd6ca3ad4afd0a6ab1e57d2a8258024d03c171680acfc65448b95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac9626e89bcba337af80ca8f329f0f42d636fb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d66a0c4dd735e34df0362bb2c7ac177bc54a7043255ba858c25f631507f35e47 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da6031feae01d8a0259a820cc84c4f0551bf4981 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be73d80603bc85ca6bfa72eebe3ece8c03114c56ee59c5a21cc86649a2bee60f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f87a8aac310d3b60882341aadb95de42f6ab4b29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8eb338018365ca10cdbad4b0a773c373143a1b917804ba28aec3a61bc13ba7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ac43a2bdc9d15c6f90530f47be4e003db413be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2926dc6c08cc5ba94442b4efa320a08ddfc7e062d7526a5147408ff49aef9698 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3843296a969513e9d603066f7896505ccea6bc6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf314ee1b39ed68058bd72b6f0d39d2eb410f0e13c0fc7d7c46ae53813e1ef72 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abea2ad25db0a1760e8ec74a6c43ef76bae104c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd539e274209b3ecf62795e00d8977ce4f233bde5dc7b60ee9c1ed38bae2cf72 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c230155fa60865b019f07e969529b05cd6ebfe75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ae1158502ca0525ff89c63a90fd212bb71ff0dd8a80578e53dfd55b234b124 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32b3d5601bc84b4b577fd5111225e33c4506935 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6fbe4727092c5dc694b3a2f98cd7f14238c387770af2da0562385002537929e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ef61e918ad70a5c2f9522ebc975502a6c7b1e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706d3035cb399ec6add0639f4970b68d4a3f46a6449732185e101b8a23b2d75d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5844158569059feaffa3a16abb292cc221ef86ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c6db030a7efb9bb71900f1955de6ae1ac235bd3a8510a2a17ee6fc9be182eb5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c70739dc457e97634cebc3cf91512713ddbdb1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b42a20ac5875f6e55e0d6317e299ee54247e1a98bfd828e777aefa1bb8791015 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bbe6e4bd9f9cbfff0b38252038a25b147cb90b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26d73c3313e708d2a0b75f16b7e359f81ba29ee5c083b86095caca64a0e64e3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..263a6bae7eb64aca66ca61e4ddb51afe37e3db2c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42260848ce9690cfbfe2bcf385e41fa642199f0e44321dcbf95eccc2aa25441d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0003b9bbc694fc024ea2c67005af7decf8f8c642 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a783cca94e096fbf638ce241f088c38247be88c1804677ffc97c07f2bdd4901 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d81f7216de517e91bc731315aa1cdb7ee371c4ef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:417f5c444b1a2305a1f8171c58fc7e8807cbea8c452aee8aebba86fe2e78edec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5445bf9556d9e8e4ea47ba07e37bba343e7fd74b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93016c8e9138b00a50b43159f7667529530b4d5e568099ef6a44115f4f2005c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b666a53e7252df16d0226692b5b0d90f04ed8180 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c3a396c82f461facb9b89133e2bb5a67d7173652d24d43b6d135344562454ce +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c6b860a2ec9ad7fc6850b78b7d4fccfebfdef18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4baddb3fbb54050696831373abc92570eefbf4898ea3e688aa6c86eb08a5046b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..645b9cad4183a0710cbd4b73b048616be6d07596 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a85514b3e3ebc08e0679e8fe215528706c53360b848c9c90047ae5a5adbe515 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c25b0a10de92156faf24df7cdb208f8c35047fd8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e250ecb9492abde0fec716de00c8bef232a8b38bccf2f01477ba32e3f8643a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0106ed846299637887911fbab1a6e1943ae3317b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:746581a2e003300f1f0cf20789a13eb6a92ff8edb7b497de6e8b0ca4b8895f13 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7165a74af0be5e746a59139312d1c7fefa6507b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca732ee4e2d2d9ea3f5b7c2890061bbc9a07df9aa15350f857c18239d2b04e8a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cb6b442cd53e16d15f02436bb00e2f3a6cff5ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2415e1d812f03161287c52c3d62ccd60a147b782c67c1f1e90d83f50e75e77c1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4af3cffa01f79c68d5be771f1c6e162edcaadf5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3274aa8dab24a55e36c71384072b9274a4ed733ae2938c538e6256adef1083e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..721b4801b37febdc70e4d9fa854602140432af01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a3851934e85327f66bd2198e92f8c6c77f27161cd25e2090bab86b57b0d760f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab7729db08880596ef09d7fe6a364dadf93b078d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce37d6786b6be2cbdc7dad2d16206028fbf13ce78d6382021abcb98353756db8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab6687d0185d68c2c72fba71621207d4f93280c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1255f58bc0fdb99b55ba04d285d8173cfee414ebf72cafef5814c0e0fb3464ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be555ef75d5aa4dd1436db4a26ec6cc5300ac64d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5192a0b9b1c6c15a98fab056f08e30c2653f0ed7ae479f77690b7be5289c47a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c439fb5c900f69be10cd7a28a332dded25a5687 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83fbed2f8c5baa603d2a5f2617a8ab4a88b672cd8b34504fe26308a176f42bba +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c1ace3719ce906755fb2801add0eae5b944e82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:674e448e1a116feb11f269866858d7fa5a59c5bf7b6879b9b09db12b6b67efcc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a76f73a3088837a7efb22333b1397e0d83f0d27b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea1c05065bbf227a2a932d8a513185ff1df855b64ed61b53b42ff89538de2213 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d943249573f5ae3e2c045fb487fc2b2694360b76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d29ded3dc99e036643807b65afbca88a617448c11f57251fa05cd9cddc3d171b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07f2152cc012b72bdac44f66f48d5bb158dd12ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec9eb64c1be72e3f02edfc0d2a4b92087ded117e48e8f2e81bdf120846594be2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b6f7a43bfe2499e277eb0aabb709a53e4fbe647 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35f1b15a92c92cd72e8142574f2b33763f53655ac20ecef699e1dc3841d51695 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..230a857f16f26d5827e53398e215426e38935f6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1166eaba701cd3d5d700c785f74d003d8fc23cd90324cba61ff22f8f0e919ad +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e0e95846e8f526f1a6ea4bce46395e896348c28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd42913fb85b84727d121932e36a4bd5526e4c6a532e757c783a146eeaaac0d4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbdf1896840a77152db815b9f8067fc916df9e55 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb8e7d7e70bbd062b1f6ae0adc8b3523af40128f133535b89d7b94b69869d7ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb5b1ab57101f12e3186ab5dffa7a5c1074ad77c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2062e24cfc9d7796df9b0f9a4fabaad414bbc2feff3dfd3450f973b5abb494 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0752f81f977858590b2b0a0bef2b8650635b52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:497f9f906b751e5f1be27c5f47e41b15857440409066d80ce476fad0e6f639de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0b865e75bdb1d1347b494891260a48284afcd5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c68305c104dee1d06631d10b8a29b66395252a9ba13b9801a1a134877bc533d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..946d8bbb7b1f1758c20b8fd54a892016873bdf11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b402219c25064cf1f76916929c92876770f1499a70ee31b6f28aef49b6ad595 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29153e4b8b770b7fc2320c22260b17aa5094f774 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed08d4deff80b007183809e420d5dab172c3361871af4d7b3d15c7ff190390e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7615ac9ffc46ef5151bf6bf8dafaaf567ccf5d68 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a444e3a40ebd8937a69b9a4e85b1d44cd850d417317baac34c0d3970a196b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d554c88c199577db030b0e0828b19b85cde3b876 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a74f8a3792ad747e471a5f1e23c523f61cf215972b7b0bf55f00db9a63dc2dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2697f2632a12c984c6cb4c847f1bd5895ab7d7bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb8734989298cbe18d97ab608e1e48b4c4eb4f6e875bf0db5a530d452a23c0d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d1a6993c4fc53402048aaa7b0e722e15f2848fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:996fe559d93e700c1bcee9ecfb5d0ba8c6e6840c435dd5306050219dc5e9f410 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9abadddb8447961ec85596bd93251b35ece99517 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed3f5508b0b1820ca73ab32eebfb7431899ac94d05005f38b856249b27d997f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32bb7876497b7191e43565198753fd31024057e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50a34016c9eb5380be1c4c770d02eee610744b6fbe6801347188ffd61d3d9e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ff5878bf3ec53603acd1b200eb0c95dab11736 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c2888bba58abe58c75ae95a0568770004e7de2dbbe02b0212a7307af9f0340 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b49a114ecb86a05179d229f2066fa00b0c942541 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7999cc0f2f1f1b30cc05487b3fc8eeda754fd1dd331e12b9b54820edf67144d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65376fc2ec8eac1176ccd91e81d2d2f8cb7fbb76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbd558ab4b79da02812c9b5f752c3da0cfd364079c9de07490dc2c4953799525 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..470b83abe122e88d4ab02e5d0064984fe478edf8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68075703a44fafec1aa5bb8e6866e6814cf6597db53d0ef0a12ac5d6c7f334d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68719ce5cafebf103d420c32bbebfefc3a5e57be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35dea0aa7855d0e163a792455b301d094642b5e965bbefc01692ef5e913a8da0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffde2b45c52bb912907962cb33d1895547160a4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:547f70a7de8f57ea81bf4d4dd748608c0cf799ce5c165b2f77a0eae2170ec742 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cbae8ee463796b7e77d1034aa24cc73f0a8fe4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7d468dfdec2cde721a479d3e1f21da821d7c279016d074a5238e4ba25239d06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7a49ea655cc9ad42e3ee8ad91aff74e367062de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070810d8db765f415c293f06950e957c87fab460f2ca841dfd5bd51de492fe5a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e43e77fcb46c804cc131f0e9b82c05607858df05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efd77c6cf58d3d57fdd042952b1e15aa77c7eb3a717dfe9aceb84605cfcb51d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b854c20b3974aaa0cbe6d56a9eba6fa60dba7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ceb40c51947afc2dd74113470be25c421c0d6fe76b60efff7f6131beea4066f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9779538c3360091b5b1d328bfbc0bc0ec18f6e0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca66c1441e3c63766c7e2bcb88759bfcb4cbb10601f1d30f5995e0b9d42669a +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b73af45cfc5745e858972d6556f0f17ec6993f9b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3299040dd879eade995f3706f4d6901c77a630fe45c84dae72660df82c92fa39 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d10a7bd63e04a5dce44c38c0e984fdbc449ff0b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18cdaee53e83e29d7a865f0a8e34d8e1942253ccd8ed4621d70073bcb36bcedd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc679a005761ef55703afcf64f3506a0330d0be5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0640996de21925f7fd6f647e3575ab6f9e8aaa8dff1c1d18a6110034ea03ed8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7314695f6b541242de19d6db4e45652095272d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f70331b34f78f3197fa25f108d8c30a5100d0968ff62be69fae16b964683558b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf5ad35b0b1ea28fb11e56c91c679da255ebb94a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1831c8d49da28dfc498baa5755d265455e3d8c744d275fa1e810bd9678ca8b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3277069e97e133a99e6bf352fadf38f4c80f0cea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7817b9c76ca76d21e4f2deac43c2d1b87d9f773b59a39b7691624c6d4710ff05 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91c97cfefe6eba69db364e7dc39c40247c0da841 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:334babd262eb69bf8d8eef9b46065a7997379a90e6d43df374f0614b69f3256c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..870187323dddb9e84e455dd67864ed2cb2683778 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80e94cc2698cb37c699ecd1b8ff5dff2020a210731493fdcf690e1ab7373f46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e47c81ef97d98a00cc1ca57be9ebec1c4560c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20f886a50101d818b32c0d953832ba5399f9e0018fca8615ed290fb12bd45d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e308a71cd286397c624503ce0edbcba0ad570c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaafcd31d0d82f59f68f485b0bdf2bb0e4e13ba6657b633ce6ec218a00d93b1a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4cb2f0c96aff15b9c73ecc1e9213f47e2082dca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b8e484597b6cb60b34d26da5ed28960a7d3ed423775927c36a5dde8e179bea3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a3b55d211487f18a63e9b98c5c64217b03c2eb8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f556800ef6ff78ffbd8d1e25c2950fca34ab43098f483d6e3b028a95dab1f47 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17159ff5904037e6a81ed945486d29cfae8d8a48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0cec749c879bdce9e4a0f507ec9abedd0482361349e4e6222e6be3197a57ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..76303e7b3f8060db46c68a57241dad032c5404a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea1ab960dd2000800eb68b4256f2f5b567793bf844990a249eaa133092bdeffa +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a34400e27f52865d2ce152d82387b4e09358c838 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49bada91baa3745c06a7c8b8bbabb238d6c442eb6cd481b10d39b99ba36096e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b59a71cf11557d6d0da869237263bdf74708bfd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45bce82de877402145f0676514ac81ad820a9face53f9a83051ea173eb6d2b6e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24667cb1ab23d49cdd9dbd8c240b0fdcc95d9a72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7cea7de68a0f2ba50db2e5b5e6db95a285bd02f1b1dcfa5e018143c50593e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae25a67ac7ef182b6790291c07c284b27a609de5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f94293747d903bb912132af5daf87e9fbd486ee6d5ba0bdc9d380cfe20942730 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f334900fa5729c7a67b0c72fb7dd6aa848551a42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ebdbdc565d5b7628653c61a8ab457e3dc990d7279b8ce9d7f4a770e9c8a8c8b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a80a5372f072146bd1ef196285481c8ebe2af11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90aaa557e95a27e606fb53c6869d0ebbd74f7d431dfe53ee56b36178fc7c5606 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..163ee5bfa8532ab76c4e31147a8717e9ff2679f8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b6851c9ad3c64de56ece6bc4b64e9729a0f6330c62ce73854f19271be56c3eb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..055e9d8749c9b9c9625065805e9515d0e4509bcb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a5862c72de9a3ac756fb90188a20169edfea58e5c7da02b238e7ed3f246fe0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe68cd5671908505f355dcb7797ce190dd20b827 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70dd615a817d4c8a104f8b951bfa2fceb8002fedb217bc69afe55940b8a4b9a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..659c5e11de74173f2029a4f9fc186a4546ff1760 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651abd17fc501a0b539f4f176155521994d79eae804e1abe080a57a905847468 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..275b5e80ee2128f32871f94ea48a51911d167f6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1794d14994ac220105171978d17521b8fdc1a66c6d714fad3033e5bfd0cde20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8457e334a34d26a5b4bf2538274dc626a609f23 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d3f2deab5e972fcfe19aae95dddcda9282d4efeeefec8de0afca72504a1b96 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7046f0035bc4780122f0922fe8fff07e468dceae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1976b51d7663c48acd76ec5a3dc65c915f71f2b670a243866b6bae9bb1fc88 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..341a9dc64d5aeb62c43d65ac1bc8d990231e8cfc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41fccd4a7e894faaac4feb5b4352bd4bda452de743b19d50cf690512268911ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b1602f7cc9e703e1a6121ec09a2e34225dfc97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5567baf0ce0f239023e5af793cd3643651b1bb791801d9a58795cf4c6841170e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c40f8b9619ea8bf5292947e8d0497a71b88658 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eebb4e82891a5cbf373be1fd154debfd4d020b5b4a9a74067b2af9287a49e7c2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b467d70e61c2dbb04d4fbb16abad61e06d2f747 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56def55737355fe348f146b556e4234c22918f659d817143828d5829f1912292 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b34cea670b0f80e1a090a48d2a22b7989258fb1d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675cbe1a6e654d7511c09467af179490f3f9d91b557bf4b61c1297f340e99b98 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bcc3f7909313b313e1a4336f46d2d154b5e3da4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d46e8c96eef8a9ee77add580755f87a07ae3351867ab9651597abadcc4652ee0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e26202ccdbc4d70387bc6bfa2c9dc02e477a107 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0499803edec3ecd219078bc65ef24753e05fb8ab88b05b9443f2ad3d937af1a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a024de1ccd69e6bdf9fd2af724e6ad44db71a67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5238f48faf3a557c84679840bce318b0b7744c8be5a32f623a1e7bbfa20b1081 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc193534fe8c879a0e73256156689c6136dd9cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f70e419eb1ee42b0b5fff89a02a634ff1039977eca2b08c3d8ead06b4c4465 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ccb76a03fb00223a70a0a221cbd35e12ae0fd21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657dc0b6dc793e665f268fa6ae156e3cce2ecfe42d83a72b0fa1fabcab52fcef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a79e42c255a0adcf601bd83e52fa5845f885a2c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba3cd2cbbd84ec48005af766487751d8fdfd8f25c0e8e71e9039f9595df996c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c152cfe8111ae06d84e2d91a614b969226be50da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9a0731be0c6dc909709bc80a543ae339de476bb61520b324e26cc10861c79e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c91447e11dbd0ed6e4d020769f76d3d584055eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8938959aa6f10c0005752fd296e3e067c6e72dafc95faec33411e6b9d03535d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fb6f37e189d311af793b0679fd7a20716700ee1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:852b28ff84f0fc711bdbfc519f44462581bfe0f513fbb5f62fb4bbda9db2383d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af78ea69d754e76d1ef3b62e4964de8d84696130 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3554db968c5c358e98021bd9dcc150baf4fb9009ceb14e68ce5afbfde156229f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3887527f0301a3ea26ce2f8114f61dee90a0b600 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f5ff24039b1369971e21b7c40142ac5cc5cda851ba298b8d7ca98caa394198 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7a7b55c231b80d2646cda6343580f75087f43b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05ae7b2ef59f5860a267299489335bdd36bf0a65763c6ff1a2744888948f480e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..276d03c3d4d7926ec380f5003d9c364f14710baf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3cad978c9e369f02a02959f086932fe9c32ec4bfdabced6dfd294ef11909fd7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e551c19a19e08accbab01fe1a1077598325eb709 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0c45c541e6258d15a162de93f9e6a465eeac9e0ed5264f446dc7d4b2d52fe3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2b22da4bc15486a18a6e571aac8e252d777480 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89706eaf4a027b894e96d3f15edd5bb653a6a8b4e3e946d5a8e3fa09a16a6a07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a42a01bd5dc42949a015bd26ee0bfc31b4d4b16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff4d9e513d2ca4979c7ba5e33326106d65ce3dabaf20c1e5ac06783e57c2c33 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2a24319ac84cdbb2d5de8837abea23c1c723dcd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:179b88da4a6f780e68276d26b00e17c01996717bebf0a106a7c9af1410e34052 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..910601043ba7f7c9d7bb4bf679bea0ddf2b6bea6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3813f8210c5c2238957b8b99ae5345009ba689bf035ad251f4d1d933d3a49f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1fe4c424bdcd69cbb6d81b543d4fc0b89e56417 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9efafbce7f026e39a8108324e2e6b268fe95019edfac9b71164ed4c43ebf85c0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28685fb8efa8a11c4e3d73ec56653fdf80c1bec8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf195a685be81d048a605f8aea1065b43bb8147382e9885bc102b957c4a31f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e71a007f0d797587bdbe5bfc28f15e3333f7f9c5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f6095abe43acadafbe2c702f57f85cfe050f51ad89ec9d329a6c86c07c420b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..331991c0cf36e15bc1e95954939f8c99b9cf36d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5c930d835e95986acabf3a1dfc9a214b32258ae9ffe8f0cc460496f7d961ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb653bb04c5817c9faf9ec75f5cf5e963606d22 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:911c1d025f8706c45faa74381e58bc8db2022c0e1dae99324c13ba17ff3041ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..29f1f2c38f2ff34838ad4251f31b90d5ed4e48eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e08f44b5c4f6c6f4649ad60f40de668e5ef8cd967926a8555f5bde97b0798d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc5c45fcff6adddedf7905feb2374d929374cdd9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150faaa1260e15a371a651790eec2b2ba2ef2724fdc2812ed39e9cf87f394ae2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..730981bb2056f65531262e39a3be40cb4198af40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75a45f130ba36d883c9936b7f4c7c63faa9de6d84777effabd75bcd7ef63f27 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..039e423fc34e4eca66496bc36aef0748d8a92274 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dba56986fc42d929b9fbd63e2e0540d1aa48753a8c65e0a6ff6fa0e11b24a35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a070776efeee4b1363cee6eb96c5e6d56c49cefd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9c4bdfaeac94b57ff43ffae81c6a992a96a875e652dbf5d5eb53542e68b54c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..835f0d03af11f4fe120ee73eac89f8500866b9e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10234d1ccd0526709d103420eb8057ae87d5be15dfd6e11886df23e43b6c9a14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..982aec03cdd4d7dc06d08a5e0cf67631bde9ad8f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db168e84d2c85ebf5f967e1803493175bc5cf55ab8a59be31ca1f753e4f9595f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f95a8f9b5a5415895e3089337febb8e2dab3a22e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:536381c91a9ed3f257c224064696875ee114ff2b59f47ab7e9f7f13f0459e694 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f40ddd600e787f6548daf815883995851208517 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78f45bc861a9161b69f2c5dd029baa0fce13067d1e09e474d0c6e3f2a2f9221 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcb76f5ddc68b881a456832b0599cd4c8bcb5892 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1a2be9c71ca1e934d48dbc4bf564b73abc3e2f0864a955e6da8d2994ed8404 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83cd6442f6e394521a17dd536bba7f88ad22de2f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2db667a03d4d206421ad7564e5d0da4ed494ea7537060e953f5de7877d966e4c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44f0ce108ea0f84b1a41d079aac4b1e8b3ccacf9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3132c23225c3a6bec21a20d56d0885a23c051feb1feceff8d227b019464dcf7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcf344d1ac75c605ef5a34038ff0dd8ef739784d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd678135c03366a9ea52332375ed49223530cd2513e27e69bb8035fc2839362 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6458345f918fc5531d8e7031352408f1e1d4bc10 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d6dbfea10a3c9e0c7e8068bac479bf990d97fca8364b5bedbac041019e3bdd5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..25e0dc9d34d005497d585c2d79faaa69030df83b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e940ca5ee0085faa897aacd93890f8f722298adcbe5b96c96260c96868b198a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66c8675b12a9486f62e4182fffdfe1ea68aab9b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e041f1168ffdf0f5f354725c422f50c0927bb6c30336b37e822ef7ec8d46fea2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a695b378ce8f8017cabe8b3aedcbbd4e3c0c040 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adaca0e8d1655ed1ad95c47f3a1aa8009b4c8ac497b0f0d2671b7624195daf4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9347ede3205978d5c1469c7908d2b659bf4c9d2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dbcb038347954a321193789ddf0ec85672655a424b44da6d44be701e81d5322 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f491b65a989cdf9662bf62fc08901f9a5cd9f19f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97203907a3dbe5d20e3a2b1e55081ccc92634426cf9a2029603eefb298b980a1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dfee4e646b47a1e86e1cd6dd792339986c7958d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd543b18290223b4c1cd53e9f2091f3dc2277cc25e40fbf07caecd1d1dbf8fa +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..804f24bf22fbfd00f025a4e23352d87370889a19 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebb203005a5f6888bef10a0193d92fad80901edcacd68ec781cea364eb333ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8506b16e962205ee5cf95eeb249f411776ad6c15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae589c6735f4392852353e057360b8cfb0ed4d4aeca7075c7eb28f78b4d31c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44d7b37293f31537f0cfed8dc88c98a3f9755ee2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:295ad65660ef59045beb7a0dcc2fc4205c2431e1231827dc9a9c91e332fc0b52 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02aca72605736f60012e5b117eda5032f7108dac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c2168aea42e263b48b43df7cf87ea16a678a21ac948eebfe4648f7268e1dff3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ebebe81e44d6794e05b157b591ff74884b12456 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b61a80aa293b190254011a7abb580e2e9bcef85361c524f0a22e7f934c0fe81 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..680489d051a807b72d8467a511498a6ae843d390 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d2ea9397af7129f9e635c44a6acaa2a366c9f4bf23ed1a2420c9043cd97efe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..12368e0f48576e233892b7280507ef1fe503ff0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52ddc48c602a8ca89c11af527033d19ff6567c0a2f2ce8c3a9630318efd8f6bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ad6b9d7c094d43146172c9fe88495f39dfe5af9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b1671214f14310613898a892a035cb29037fdbc96704db7a79f7f63e84e5be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad5b1d1d402bb72d19aafdc99783622e65b04c74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dcd0ce642096e22472beb078e7d0cb03be5082a2378d91334e49cffaf25c7c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22649f59e7aeeca4088421140aec332ebb046f15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701336bec9e17b51417caca2a98d82ba53d8a9dd6992d571b2e6e1632e76add7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92cdd1aab41195e7921695cdaeaba655c2f8fa5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c5aa317094c61413402d5540a5801d03681f48b66e087d0a6b1c488e497c445 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a2677a410ce027b06f251315222257a788cb2d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:357005b24c43601207b98ea23eb808bb4face24949c93b3b0a7ecb69772a49a0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c4a5f19d1395652337418a4962e8f43b18bceda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5cf574ed12599a7dc55f6e64f5725e3b580c4d5ef6170516db852cadaef8b2f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28b8032577f4967af5eff54b7b88182372890cff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10bfd4c5b0c13bfbabef42e209b3e97ab05e47761c314d8bcc7b971b88c67f15 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..668390490900120ac6450742b8d8bf9c614c0a07 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350a007d87e92038c20ec2a946435597bf3b0f03b2869e31457b3bd0ed072c01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4daa1cc2c980e9e60a84d9b83ef35a9bdd10210a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61104d3170f0b0391a47a9d9cafe0400a370358361829bb5f1680f792ff4158e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88147926df351f18beb1a549061268c668f72300 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28dcdac2e98949306dc802920d2c293af853aa1fb45fe375b80d0ecd3ab26d3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a92894c5be92937f7fdb94a0b31528e5165d1ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b06759a44fee357b839677e4ad58265b65454ce1f934bf0c0d6fbd8d473a25b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1090f7d328accc1e8aa315c20d0245414926191c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f6a5fb473078fc167df9c2c5c293e854855c358ce7d02e492b23e80d7c6446 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7fc90b1fd08fe683438d3c1da1759c97d15b95f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896777125b03ed129520238b394382f0b8f4d3998b12514f09281b7040122344 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f665f430fe467cef27dfead70cc5f0b06915f5d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284f083da4f121181f52f8c0ce19d6a7d833a08057bb4a93f08e5399a525712f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fef6b1ced5ba54d7ab452c5e662fc0709c621c3e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5770a7f03eaf541bf60f4775030faab1b73682840a12160478f98cf1a342e85a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2be5cb84c2bd62a90236d4a4ff6e00b9da8dd8c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b21be64da660f486ae1b1506ba709b02b123d31edd3a5dc38d9f8b6c4c4cd0b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5864907b85be8af76be1c5349bee3cdaeda833ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d89fcedd99eb48b24f550fe50026a249674f29673ca1a41899195b838ad1dfd8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c1380b074ab5f9bc4a6b4aa7c3edef4a5bbc917 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55fb0ba571418e61ea8109541b7fb459ab3644566103d2cd375d2f138ba66ef9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dc0271471fd10d9df8e7154a6f6a0083a9a4948 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39763addb0c71eb037b092c3d2f26e7bfe3d558f41b7615dac95f402e8030c7c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d13c5b2f1f7e156992d87d3db90d42ab2533a998 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cf47e03d484cd3a7445cc91e82aaf1180ffd2f123bb21530ee7a6bcf03b154c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b924fc2ed02a8bed3e7cab0f828124a5c4794e91 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51420a6ac375479043501b2eaa5af68d3037210f5ddea3cf807158c336718cea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5b9c74c626f43b08540700e21b8f307d13e68bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cde891ce71873c63c6f4daaccf6ea0ce2cba1bbde544e5d7fc867ba113fb39df +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e7b42cee9c7cff0d64a2b46154768a209883a91 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cdfa1786571f1f21f48f1e2bc27b9fb6d29e1e6dc9b52a12ddf835bbde2dc90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1afbb098c5ec8cc600d5d1dc59724c523da7e56 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6aa12744da66aec9eb30cb2f13e2327eddd0cfbbbbcbc0eb24ecb1a90d2ff3a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b78ea517666fde5e383c3615c56c5a5309fafd63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f838af2845511d67eed4ee6950adf82c6bd52b743ec64248f9a9f2fa6c7c9c06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1cd111856d96665710ca31ee7df419ae1c4866 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea6d6b229a9c4e69411066927922b860c21ea5f39f1a5cc397cacc82c9284021 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f2692b5a5ada16f14354e6a5f372c2e01de3cd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc35a6b5eb7ebabcb7effe02e35a051d1ae6abfa5b64e86160e2f60efe682c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eae56e5ff2762444e5c0367ff0343457964b7dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a241848f763dde12e7b61f4b4dee529dcbd16071e0c7cdee2da2a13e9e34d69 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b27b5f124b0f6f6ae756dc56b4d2ea7d182de21d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbd9f57684b7fd305a3b15ab816a7392ca80b66e361f3765ab5e7e5f1562720 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a598f864313df44629501c1be73d959d962069 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04c4984f2d06f264abe9f20fbaee8e86654fdb228515c749aa5500798e80d33f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d656871b8d45766480a7f5b9778e2030b219514 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f6e3a71234e806d09a5a1c37c6d512211b5349c4ab44a2c17144a0572d5691b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e267495bed908e2b15b01dbe35f82882890dbcad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6536f3154202a6c5cef87fb68706ba530854031746d3095fbdb1e07f156d27c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c02ba220219c8d78e272d5af0074ad547951df34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0fb8c065f62c7463b7c2b388e8141012756a0630d6515e3c2b60af795dec0a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8faa994022c1ce33a969930ce2e0147c47da4b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8540dc38dd11d606389f28827536999dedeacd9bc3001c064df9429acd26c748 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd76b5f3c159a5ece71bc6fbfd73998f1ea4337 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa941f3912e27f365fb951dcd5efd49eb8bd73ead39179ba33ea29f3680c907 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e7636fadc4b8d0106e84dad228e6331d40c94a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7da6734f1340f839d37bb3540dbd48e88a9b0cb309d9f709535729f355cfd6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03d0ad69be4d8fc8dfdee78d9dfb645381203818 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25101481b9774f0c5955852b10463845bf803fc85c1c7c155693946f04c17ba2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b18b42e782c86a13ad5a5e6a638ee431336d7160 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b1ec35354a92ce820e9b6855ae17a9d5e03b6f82607c66166ec14c607e7ae1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead93ca2983bf70ebb00b4341f4572a3411307e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c32fd6736a840aec7ea7eeb248e7913e233733cf02179f026ccf2eccb1a8703a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d14c372aa1b889c4e82e292dd62ef0cae82dc6ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69e28ea5e995c2f4bb7bb7e7a7bb77a18b2afbfaa0f5b56464c191a1d7ed5ba2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9e5fa0ef2491cf3d9f44b4f153b71b459f32132 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b23d04012e4ec99a23bb3acad29f8e9ed532bb7d77a96be582d48738444160 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e856813b8e4c34702b4c61fda5df985b4950366b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f6cb0ccf4f52934813cf8e65788c756b17805b6c3aca77b82fc30830a70fd6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aee2341c9324b1ca065fa8053d85b396fd634327 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe8ec41727030098b8a2645b0cf768c3fb888452fc566ffa6f28dcf17d027f26 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f35336799c291b46b83d7e5bae7d096e56b1e1cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e356444619fa79277211c985ce36ef47fe4a95aa5328da11c976f48cb19e805 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6208d6047e23abe0cc363436ae1de6d88eb9d510 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db471930031ebfa3b0f9fab7e3283ec1388c82dac8981b88bfd553282778444 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc079a98e254b45f10f4ff284fed31c23ae45b91 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd19fd3a55b4da1bfc6e5b32bea1caea7ef6a21391255e17046b26fb24f3b36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2f00a2188eccbc151df36f6a0a2ea6476267c4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b211a47f2573d6d6f4e09ca8e16515ef40a5ede6e936f83e81e11c5ce6927829 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8041ebdb388026e49ee2aa29b8da4be3f5b1c74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90d1083871df59fefdca80071f039c8a9c318dac0f5eacdaf287813a135ed82e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7974b894c7d56fa55f01bb14281a4cfdac9eb4fe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edefd915039cc5310b4a0fcf95df655c50ca38999a4c0d716d47a909319fd07f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..531b4c6abd1156b487e1a6b44f5e631220e220e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08fce7686a6e616f49fd35204ce5290b6ee5dda1da655fed32f0361a470bf73a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b118b46acfd05579a23b3f41a912114635e8707 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8482775f0ddd0e86bce847f05a62a1afb2f5777d2b4e9723066a44a0c243feb9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6064aaa60c5ae1a92121f744515e0fc704c9be7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c32fa2a00fbd5f5b3d0c2ec5204ab37044f9b82c01d1f232c6bb87fb713b82 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3d2494b334bc1180b72129091d607c57926731a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7900626edadc94d08c3356cc8767d5e7eab9540a2418f287f0683e290f056bd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7380168281dd18d4a26763edff92e25a31420f08 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88fe14e9387080c5a99568346daa2fc9264baf83ae9e174c8ed9e161a2becab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65b9316b7f894f5470bc75de748029074eead2a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f5e1b218d844a7e8a0351106ed85c7b8c0cb7143931d5c29281be28d67300d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b98bec9889493e9b7fbb70103b02c59c368022be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0c9618c9c849d5aea177e53bc4cf629d705fc6a801676456cbe6d940065a0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb8cb7bfa3b6d5e6ef1332a325d3cca667c214b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4f236f53d1b30579c15be9881861efc7ddbc0673134363d0b28276594bbe23 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..286c7455be7a96588493d0adf0bbbd7adb7d6384 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ddfcd4143bdde9b70b9fecb7cba314a7918d48c7e243af8c698a3c09190101e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..401f7db10b28a122cd7cb44b22fd9e2f2026ee75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86eb51e258a7d17bb599c69f6782da5606a6bf7fe18c3d22135d32e9eb71c94a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..689a8b587e04dbedf507f29011c9b5c29daf5a1a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe1eb57a4da9a635ada8a36782c47672e69b439d5bba6842d498b53696aeeb2f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0211c782ad019a31e1f5969a459bef54de8809b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b541d1c33bbd79a6d152265d7a1438f1332bf60fbabc7170a0a16fb7c7337af4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b885e6a1e498b3d840abaa316d242c06e307cb9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113cbd909c6acd5a8b7ea754aa080f8b3df801503250a6fcea02e8c25b7e2414 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d6a65ed5561c325c08678a544317a67c88d16e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d220ae4c52c02c34e72276efdcc797cc364f56379cb2e73604a8a1597a2648f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..190e00af2439a971333a141f7c83c0d49beb3282 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb84f42513a52167636d38874e46b7a8118370293a48b4d90acc7c2251754e7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f95b23accf63b4ddf626abf5209dd144fa9cae4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83588a4cb060f0be8441ac69cbc5d9abf57a35642a9ce459dd5dc29513906776 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d79bfc50b25f63609081a476c77ea63c2d3e3bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d4c1db83417146d6e2aa42f7ea8fe4db07a4768f4bc85014c2e839b9bf391f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5f3b228817f1b7db683ea77b18ed7acde105d70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d48c8a38d51b9ee047cb84d887232455411442fd7dce44c6433d7a39149b206 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8736edf66c55f1778b10050ba0f40c11281a4003 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb4cb232d4a03ebbff9642ff24cc56286e880652fff8bd9706986943cc6f4d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef745e0d665b1c5036f1735788990d10bc96b0e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:101d04de93b3d9bd13620a9a9a545855ea60f3fe9bff35b437a2ba0ec03ce1c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2173e827281bbb78f5e90d9c85d52aa89796b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6170ff70e51441e34f439e527044ccd7d44d5a603e56d6f2eb5458359f4ace0c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73ef95fc88f8f982aba30d6b748c3610c4de59bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c441860abd5b93c0972677248bec717fcf9befc4bb484e060b26277cc8793870 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f387a0831fdf3ddfc18c99d9adb431185411cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b4fc9cb768dc9e670684684f26d8f150c3e547c61d43ad0c71a68917df385e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3641181dc36de449fbd128523f384f86ab1fbcd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ec82d56cd32f1f50f6610a3917672d664957a7e13bd974f025ae2a01b0398a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..01618337f8b835dac3a0fc65465af4c6fce328f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82c727eeabd02053c9bea1d095b0ef77ce659039bd6e440a1adfa970d43e7ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d95b931456658c1b9261b4b8a9b3c9b6aebcfab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a66e496f3bbdb8ee4f4ba3302a6e0bc67291191174ab7f0451868651351a4030 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ebc054a904361d5cb65ac9ac1a17b7bbec9db8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fec4d6a24dbec7590ed494ae0f2d0f4ba4185d066e0f8da87e362122299a3c6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b0f8cdb74b541ba3c97c1a3c283c1fb55f90be4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4df46f4f2ada8984c49f9c45d5f487ead963323884e8cfb4a44bd438343be3c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c575044a2ddc674806a1c9a85aae799720dba28a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5be8ea4f06ac4c8da842d3c206cc14953a5904e95fad8c0fadb5f7f701a8b260 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a30cc8aa18324407082dcd35053dcf884965104 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849e5ded7c899a9376da7f6ce7edd4bb252fa52544d7d7aaa638aaf136ae0db1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc987b58d9df29897f7f7b9f2da54a89b6c45c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb1a26820f79f1c3c9c6c5b5bb40ef7478e9c69012d44f3d75a97155bf7c1f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..18bc4963a2663252e13f6e165377b00133aa9bcf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5cdc2a4b6e9657fbc62b65688dc737db3704e4898effc215df6992a68c01c67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b70fc1aea06973ef8a5d616a7bc70aaeabb483d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d01afc611e013c2c1b3121d6258b146d9c28879da0b010c6cf01f74275851e7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..718f90f7fa8f83ea5e4c5ab1f2cafe7d39ee43e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369815ec616231def9a148852f6b44a1ad07ed3561fdf307391c220c90266af1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eca79439b89680d57daa8b3521212ad4bd5f4c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e49425efeae36e4e15192d2828f5b16bb3515561dcc63907ba0c2508ccdc0a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5e0ed89e055ef2b6fa74d440a2d42364485389 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54369f5e7a31ca6a371bc0fbfb178b80bd58d1b80c0238ba68b99f0fc14cf4c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be1a838acd48efbbe64c3ee3d200caee113ac7d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7256056ff5a09584f917217351b6c06a5dd1d69ae3d7381f80f2ff37468e22dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6924c1fa3b4ac4d4b3d8d01ef45eb2b395b4215b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca72273eb23310eb2033f160101dd09ee824f98f7236bb13d235d45aa265a693 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c7c402531f01307c3084256a32d111540abcc74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3c1ff3a59b611e113ea6fdff83b57446788553d8b4ac17800ad09f8bd739cd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c2091f9b384531e91cdaf98260a16ab2e2401ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee6090a352c72b66ca2722208e733a055bd5166eae4ef08c22131f264226605e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..18dc915899b72787d7b91cc5a4fff99d966519df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfab2740e22d138308dbb75d96525f4f69c1eacc816a6b7fe781f2f1dadc8cc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abaacca888a0d06d364d7cf6f81275a6168672ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429bd85feb9739e5b8576e0aec69b64b9be3ce5a1d16311816ca9631039f2d3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d67384c445ff204aeb34e5c914218a1ce88ffed9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f710a18256185a10a03fe3a2da18287ed43c379f177f5f97d58dac0502755ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9e6dc62fab7a790e9f896b9e8c7495313913e67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d9aa4d26fff7fc27a511415805eabc92b4496d196d658ae7d102e9307316084 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f01ad6f1280feade5ebe7d080bd23341c2be99aa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8df3563188e109f7ef21e50f5cecaf1a74570aa062bcdb28271f3472fdd460f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ba6b3636356c90d0597517ccab3a1ed0830a2bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee741a557fe14b9c3995c9a1d2adc65a2162af75d032732f2628e3f4ec26e419 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3edcdb105bedf85f76ee6b8b1aa9a0e3ad348a5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0fe9c6b707272b26b94e17959693730ab888abf8df68b1e22952146f7ce5a36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8259d4c17906f0068647ca3f22e7b60d070296d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a255539192d2832f0d842f821ac1e65f465d3b8356c7c6a40e072fe7e4b88a67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be4d65022a4416ffdb4e3a5670cde3206d4e8658 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6d53b66d6bb7a6b88ba74308122beed99a889f00e6814afc27efeacf661919 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71d2561a487cda0def47b1d06be90d0e8356d138 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd73617bd347a934a7fdf7ad286f3e69086876182e60e11ec8bba137163b713b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..573643162574919219ae57fccf0bf10f248c1c1f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccaf410906fdbdd6bca0e0d9ea43b8272e229f07ccc8a9d217ecbb59c63e9adc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1a9140a70866ac93b59927bc141322df02c3124 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c080df56f95a540126c11d87059d82e0143f886c2bf0c42de1e5fd89b090d9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9a14f31400f119c0ff9d3afa42a536549c13cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:339baf5003758897df4362b99ddbf783758eb9196f8cccf091482353fb204c7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fcc56cc2a5a4e37a39c15ef8978da7144f6e386 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c83ebb0b8d06ba3a952bbf36e2e42470e66ddd275d5e039ac1ab98d89872320 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c1d363fb3e148c3c47cbc5cddadc2f8e4d1d6f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12fb328876cb8dd7fc53fcd6addcea14b172cac58061ed07138aff3c41a2ed4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6750f28d37ef5154e045863b54ced8da36e09a8f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9293f1df697dda5d37b70338258cbbd7ca62cfea063f9e614b1a374214cb871f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a30b9550e7dcdaa796e4235d5820a2e28503895 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d7007b55a4509abbbb72b588be0db92479bae8a5ed16879cfa7df8ad9a6495e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a05a48fe3eb62e7f61b5174b8c2e848e0c2b033e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d87b23c00f7e25f8502b5ae894d33ea2176d4590d33824ec4462e8655e473ddb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ad9ca5e39d53b21017024b7eb6a7ec01f559e59 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6baa1275b20477401b9e64aeeaf69fd97429b73881eb9e75773aac6615577a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52cfa023fd633404be1faa23d12c09d5bfbb612e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9200fc23923da261fd9b7e42e5a114fd12d4f0aadd88e38f10f89e599f205842 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d82f73490a105e4c466fd221e1c15cf0ad223a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01cbfca4c7cfb7751b8576aa3095fe093bd67099998e61741493b50d07c4aa99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf6520d01a6d3b258941895c8c076c5701468a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42de465e27412bb2f52c0889fe3349196dc64ed909b698242ee770aad287539b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc5ecd32786b132c961193a9cfc21c11431e08f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63176ab28799e979ffc6b45c7f79f1ef4167a878fd1f7ad2788eef8fa97fb0ad +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72853d5196fc8d95bb34d8b66d5ae856b8fc7301 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2603d9441bb2398f1a7ed3a4f6a71559116d2cb2b4f6f3b0783a72404e834dde +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e560aedda762fdbc66049d659a0dac3565bb8135 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df381719ab06126d87ae2f2b6884599e26f1203db0934895ebd3b388086e5445 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..356d152bb52bd34533e37bd99ee0911e7b46f7d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd06ad34dabb69bac1b9ecc5dbb2baa200be7c5d0b6977f87638acadb810ac5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4995eb792bc63ae178f831f8b539c07459cb5f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c3696f98e0d5acbca2091c858197a200bc39bce866a0fc1ef166d43080e115 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc3dab6f633e9654ba4c89e14f92f1968f570c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3e86342c2edfa93efe71e65f99c319b74bdbe60889b2819f2de3712fd1b91f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..44e3cddaa4761c3ab79ec29e4579d29e9c890351 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f47d06c58b4fdae5f533038c2a77560ab63c7f0e87117808825eaa46fba93a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7545ac21449c1390d48186bc6a55db65cf92fbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf321a4240bee9ca70bc85c67d329c39a3cf79eac6a4097fc570b75d63d05fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b9e850123d83eef2b0074ab90d950f44cfe48a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ed348c8204788ba9a27a5234cac9d5cab10a0d50e3ded414fba5f70c814311d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65ff6476b7e7b3e61d8a1bb39d3969d0605a6046 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda5e2a1f8d35e619e66eed36523920ea18519cdc066602bedcd96340f40bd95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b19277f6d2ef0e8ea26e4ebd5ea8ecd6eaf5869 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ff5c5218134e78932c72f5daa71466ca6e596dcff2bbd8dad15ff459371e01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45a4e5a0ab6f6adefad011bcdaffffb0efaa0b60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40305d56c2f74a9c60d512b8288b0693f6d63f6b7a8df1a603da4a90051bf12d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0697db281ebe05e7de7f84255551ddf2749c0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82d060788d287c8dbb1ffe6612dd00fe87ba166d689f4420b84a01624aca24cd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d6939d53b5e196795f30517350d24a15f4cc5be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6fe5429572198c2d217f990b1e6db941bd83a702f2e350e1b63e72ce4e1b633 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ad414bf429fb60d20a703f83113b5d3e83bec7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff7ec7108e3759a9c4019caae95fd11648956a108ae2e9ef90053f09b33eed03 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..422053dc19faae58462238eba8b1e70fa4485c9a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dcd5a246ff6c87631ecd2f1a63201253ef2e926889f77ad5c8d51065263bffd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..34d9708b1da69a6afbdcf08154b46f22ea17e88a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95bc1eb5781a436795f902905e3a9d3a91286c9a1a4aed00fab44f35033962a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..415a2d901ec5b616e790cb9fc15ad8e119e9ebb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3606e785110d4950eb574550b7e5f9388d4528abc417fc91de390eea652fc602 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd0dcf5b4eb337d39599907f57f119d7fb744c20 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a25ff6adca8e8f1be83c38d193a6ab7e65b81a2352c7d81c29b3f438d3bad2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91084176596c65a1830d24d48b3475fbc52dacde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4001d05012f622bd25a674bb958cfae33d3eaa0f8f04cae6cd121c18b683bc4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a698ab77f7d701355db8b88815639ae1f1478f70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71231b0c81abfcd61a901d15a925b9e59fe5d4b143a3538e55fe7081d9cfa45e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb953ab533de44508ed3b3cad232ba3994a5c930 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e851ec8e2431d137ed0e6c8b86c8f8b62a2f1d07c97b5b7815b2de69de6808 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ef2ec00250cae30e3611a1c95ad7153b455ced2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c009c7673f51987e1b534688b462d1bc00343d9f199ba3a3d916f7c74c3b08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e05b9d88602f07cda84d21fd15ec238d3182994 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b0d687bc0aa9adc920eca0e650064178852c928489e5c8fb470b25506dcbaf5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1810571fa5455de6b4d5eb6338c4182d593670f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b8cfd7eb57efa6ba2a7020faefd25f7a095c115990e3077c685d10e7f8e796 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..052b598bf865ee15017b7054f789f058d968a271 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a8e548ce577b902c5e14f5e66fd838db4d7502fe10f20b3ebd6637f595b92f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae55ff6c30354deaa8801bb9aee7724a3785bac6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac387ee0ea86470c44f4ab64c3a9626dadefb79d0e147e25b5af2364a40a3111 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a18f1c35cc5584635a3e9aad4792f97a6cc2c18 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c3f1a65187c0dda189e5da4a3f6d04c3bd15f6fa6b1946f94cd88484e0a082 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8df4e1d5fdc34212d7a6f557d70f1c0593bc815e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767358c00ffd82d6099c351001732fecf84d8f9cf9e860ff07e36b24d89bdf23 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70d4bd690daffaab79588e6014c63c2c045190a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec50d138c63d30f254dfdb0c3109303b4f128fe011d1937b371ed39c323b75ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..deb85745a669d102892bd0aca6ad2e07e78b9e99 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0592b2258bc4b984ce9d165e4d1bc81ad8af7d3d04f511e3e61287f3d0a0ba4c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ee2244409146a6e296d70324559097d2901c53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9f86da95fe6ccf298102544c62be82aed689c6d7acfe2fe68f2fe452d89da95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed7820bafba99e96a1960e5ad58aeb8fbe027f7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca26dc7a3376a012736caf1e57be683b7b7c481adde5b10e596ca90bb017272f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a574bdd7994c437f668a4909b486f3047ff3e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a844c195cd28f8a5ad1b9c64371a983fdcfe3a3998353ea957964431c5dc4c37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33cfedf3794ad0e5b48eef5dbee411e63e038fd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220f6c1f6aae7b28df415b8dd21397d5bed3215ecf77149aedf667da7d464c6f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04aa72d51fb0e1e7b615befd5d24a85aad4a7b3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7bd0bd64c8f376c1a7ff991e4157ae36c141a10e2b0e998874d1382d252efdc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ec1e9712b587b21d0993041fbc486b58cea1208 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92eb5058b781e5843de67e1cf90051b15d95ba88b01390c1a322f7233539c83e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e55262811dacf7129cd67e8c5be58585e578bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736624d1315d4d4e0d974bb3c50d3ef3f69eb1ed95ebc2b86cfa78a1774247be +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5bbd1a53956c23bdb7c6f476866f1b1310cc1f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26a8bdf756f2cd5e64cb9da27636fd6cd0c43280c21eb8299882045bbf1731d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85d354bc118fc383f72843aa97541c2792c32f97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d1b23e15b74a2763a6708624f59a15bf1307bb5487a67e4000a5978a29d09ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c358e3b26db750c7abcf1b032775332b6568c369 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f1c3c0626e01f24fec9cfb44e36dbc555ea7347ae5d9839fe1c6ebfc1d9d4f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de9c7764b7c7ba86bccd382f46bcbeea5e9c1930 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65503b103029d2342cb4b627c7ca21d4fa9e811a79d4947220e33a1318b24ebd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c4151cd77a6600a5a14935d53f475d2f19eab04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:443e0bc1c22bd42808a3500d3de221bb37fcb2057e05033529e300ae02cc75e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c2090ed61591a278051af97668a63129fd6c96 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b592fd37138805ffc5216b0de7d26f38aebbcdcaf5c65641e8a6463c768bf0ea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb8682fb25485c00e9bbe025b9ce981f26859627 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3940bb580568e8849506b104fcc3284931c571d11355263f4e2ebac4f0f045 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89859aee8ed52f2ca4c6c69900e15c38e51c97fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d778af14879af5e80395f95284411d31a8160c710226d3478d8ec4aa1c9511ef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67d2d6a589cb4c123f869abd4b99f730c83827d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee3d78511cd61bef588382c891f4886bd98ab1efdb8fd886f57c3061d5889d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a86c7d0d72f58607c0fe196b8ad542a637213e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5ece6bb9dc995ae98f745453ffc33d840ea786c1ed9767c48fc6e4724f2ee3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..36006abfd03447d54cc0fbd21a775037cf18def7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7065d3ab7649f493141391b39a4419b138c16a8b280f5afd9a9187e9fe87c034 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7a6b8888bd2a586e39a5079f3061b95f2a18174 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec466d4e1f118eb75918fe5cefb4be4948772900b182231c4c0c5c4a34e3a696 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..624e1a5755e2947615b44fb63a395ec95b441dcb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987f2032ce86f99d4aa31032f23ef7b023af813dfbdcce5f5ead86efb5e7ef48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a81f8c9f855c57970b8de2e753ecbf13dc41e9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef6a7849c666865841466924b4035d2f2e66aefdcdf08ba0afce36e62820ab97 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2729ab800a11b6a35507e3e9c6bff1b445855f94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b5433bb3e867e336349323f70a2e5751d6893d794253167d52395098decffb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54535161c163e49f04b873babcbbffed4d729519 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b285c437eb32edc5cb8539d2193254f89d150119a4913bcbd1c3af98b032789 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b81effd85023c50cd8b2996530759107c02a7b04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:351bd7964eb5644322bf776cec617f179493cd83ec3b0baba402ce69e06d73c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3d95aa66552f83a78883b6a08b3adc3e935ebd8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:524a305a8b15f8546fb6d1d8431cccb5cfb98eb3aff27031cb7b5297496b9abe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f1ef0f6da64993af2ecae09512a0a34d6d74bdd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c367c71ebd8744b61e1c9350e61201a2355d816f46ac6142fef4ebc92376901 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e193a14acddf9e6b3db534ff41eef284b32e4126 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c30928076f6fd09543b229935d0c133b61f45ea435d7c657792c928ef669a94 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..575a898557386d00267f62900f6a011c272bfbd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c8368de7195b20dac14d28c1ced87b8789ead2848540c25aa98ee402dc9afba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77deaaa301f6360e21c20ffe6556f14f29de30ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02e8d26530a2966031baeed76d43df7ab636e57932bc1a34346d25ea9f8b7e65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad5891ac3a035f0fcc34d8743fe7cb1b9091c1eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6f3b02621e7f09ff9c054204df2205127531d0bb77ebe9a9e7ec123b26d70a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0800ffb3542d88aa5e8dc49ec49e930320a7e508 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a452722d69f61e3175bd0cf62a5ba207d3d2f5aa6b1605686b12fd504a685cd9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b6bae44bd4459b9ca31b7a2de54365a969a440a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09499d1a7c281591b9abf50b65e29789d9db73fe585e22e5db8ede77f15cca86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7f151c3a3fd54943d0e9113a7568c27e190d872 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:889e514e46a5fab6165069dc505a2e8498c10ae87bf32999cfae85cade3d6866 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf74ca446a7b3986a769402e3b74ad4af3e856f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b9ca2a478e647357e41e6d2fd6c07c9761ff59d4e1d0532609913b7a321dba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41759854541d0aea9f7fcfbda69565e1e309aafd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f818a3ac61f362cdfbab51a4fcdc647b890608e18b16ccd0397c0fd399f72b82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4664b0f49b506966e19779aa444da729ad2fa515 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15cf45c9c452f56076019524231bfdbeb5bf31bb46a3cfc4ed417f641fc65a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6913dcd325c0907587668c88f679627bddd450b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3f85c0dfcc2b627253e84e1c10bea84fc79f131d210b9bc08152d027d94988f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b75d88506a35c50d871a189776a0df0f61bcb68f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:841c6428131a8523ad1669dee5945b708d0c2bd23c71c8529f10077414dca216 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8c33314958f319a16d90b8847c493729b3f014 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9d30912091bd1ed0764abf6a791d7dab037ad22c425e4f502c8b1281947e1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd0e711ae22afdd4d4034d65a0ee0ca1be1d0ba6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa20ed521719582097510dcaf41cfd37fc5ef80b9ffb97d8fcb11b7ca1fb2ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed16c2a2c59d092efbdb0f4370901d0a9c9b93a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b04469992f976030257c156919b99eaae65a42a1c656344661fc220caec87e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..accaacf717021103012ce25277b81596bd423b9b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc362a53ab60718dc17f5a1d307613ab60f06fe34e6ee437cf291fba5969705a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89cb5e892fd43b8447aab1f25c89e376b87f4cc8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788806dcd96a5044de95fd765f65240d92b0211772c9f4aa9926fd386a6ce67d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c70e6cdedfa6faaa9780bddfda8a3e8617e76109 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215d2fcf4918446c056c1396799164e092338b560720994ac97a060e173736de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e599f7c731c17cf86be45fed6faadd5d03e74f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0860419f7421ee90b550a970b8beb3c5110504e903602d676ffd4f95cf3b67e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41afeac5e98bca01e3695df8fae9726e92c1a8a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2c99497ad2d55b581c7a54bd6b0594b8a84b4a5b8f9013f7d4df3496bf3423 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4482b82b7579d771ba0eb99ee35b1ac65e25685a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b237e6c12b687d24ac1d4922a9f0162dcbbc390b6a002ffcddca2dc7623ae75b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcb9ae6c9e7fc9d9c64569d28c2a80d180178770 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcead064e3153f5b5d6bf745370ffc90908dce8dd82c1b92548a9180fc58f0ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abda4194dd653bcd8dffff2d1c2f428f0d93b6c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b6c5a042dd6eff8525c9e89609a4d6d3d8320f8556793d300caf5a93ccc647d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9ca3000e5a91c3483e0517fa19a423c0ea4391c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c11bbd93555aecaa0c1d8227cae91da9844c8691c1559e31d9b7e3eaded3dc0a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..169fd07eabc2f340da014933af813287af04546a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83bd95d951403b952ab2665f0ffe8423765de8a1c4820aec1fa8ef6dce65a11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e12f8187e9160b5b5b9b166d57f51101210a3b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdea4f04036db0349fac70a184b9a3c97325929b4021ff7a003d9dacbc409e64 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd76ab9370a4845a0cdd8446c9824669b9028436 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b56b02ca6c1c76bc8556e1a7d7507cc887098ab55b3419694177374b8e3645 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c66726daf16f91a1a67b5b88e8bd5321e9fd4674 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd2588e9138d7525eaaec4b23222f1fbc44098320afcd2c6058292992445a0c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68cc6399fa068cfe5c8ef2be696af80e320574d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37faf63c89eb0184fca9553e7ed56e089ad949372da7194b8a1ef4f6ffbc369f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9560165db9e7e1600a7a2a1edb729a56bd2c6895 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19fe46303c209d4d45503a523d7475db0aecb4dfb33b2fe08ecf9d4eec9bb8a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b711547ed2d203dbc18e01e019e6a4d1753b1cc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f984ff264ffa05f1da1ee62362c466591a6921a9f8726112a63f8ea63b0e13 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bbe880a2e9ce01df0f245e6e0386b34c56a345f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358021337ec6264a35d7e8ee24ce642e297eb84b066c8a98c3e52be85f6cd6d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38e65a11780318ed7cb220bf8e8727c16a9c2074 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:694104c9486edb0050d6dc89b99e6078a112237ff3d26ef4645fa2514d45822e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b572fbe4cadecdb8cdc13f0d0f92795e8f8f297 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:658c9e55ddb9cc22c32687a8eb4e51033186542d2dd208473a7096c81e724b67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bebf58d947e3fa0fccc4fb1f4a3ea443079ff41 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b57ebe9a1a41ce49b87a8c5601bec7ddeb856c840db3b363d899818ddea45066 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a3a2e4b62c8c9b65eb2e9f037483249caed9812 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c82ec33ce491a05bbb9f7ec9fb31ec7af0903f4b3b63273859c2273048dea4db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca428c623350129e4f2e65403aa12da48c76b1e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07fde473ebfc2a5df0d9832e286caa0f9719da0d1c117c22bf7dd28c3a0e2609 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e32d04b1c93c294ab1ba4afe18c27d889c9cac7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cdbc8aeb1a2508b675c0a01a6d00746a8efe49d8c0ef53d3e58a2e550b80571 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d844ffbab802eea3f54f28e1fa11e5b9b9a1d86e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5041a203e9a9158af55c9bdbaade29e30a45c066501168722ea2db915a23327f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f9d51c38996e40d05eda8cd328851e3215fded5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8e28f86c4fe95ca37229a2d0e1a21367d11649d0f7e87074baa515f936f9412 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e091e770b9cc1e18848c77ebbe0a2eac6feba3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bbb81403fa5215504c72326ca8f3c7054b3139cf74f1a06ff650e286b073bd5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11a85d42d8231e8b1537b0ec1aee1c81e07cc505 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc9a88cb195edffc76334a9fc953127499532a137f4a6851aa45c46046937cd6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff60fad979d8f2f2331ce340836108c8b54e23b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3b51ffc3f9d0ddf6fa3065c1e8c90dd09a58a9e8df58ac681050b76dae1961 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..12c49f2d0e18a0d22bc9ad632a68b5bbf17481fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16da728a8a260ee0d0933e02aff7c1d83607e70ba4232ed7d0b69709b1bddd5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0267ef95eec325710f63c060cb937d2d4018eab4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae33b37f831c4a531a230f569dfc01589e1b620be82439fcc5221fb6f2433ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d1344654351528821fc2665006e45bcb6ee423 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b1ecc815ca5dd4ae3b57551c1b1b2e461bcba25327242ea57034714c954577b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f58dc00a991f54adcd4d44fd42b5c31f148f2dd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc4c3d2e4eeeb9923b53a1189bfaed223b9a7383e6bea167134dfa505d0fa60 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bf1d84d9a2dcd01885d00d0aa3bc1c79c347db8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35fd67dd870a383a79edb03d5f4643e02262ab57826e11179dd18f1656a6f4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e249b24241b033028497a1bbe7ae6a30726000af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90bf33951c1628c12b1907dc41d7c690a9dd3af3a86d62d7685a1db1cc36965f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b42dd217459a2890b0f34f7f47085916245dad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c68a42206479e2185b2141270282639de0e192b60ff518181a253d9bf8d154e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97eaf512837774f62cce504f4edfa08ea2fb660c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e01dbabdd404cc356c2834b94d6e864800e64188a7a1b69487b8f6035ceb122 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..143e55e499a52dbca26c3ba7cfe081191e8ade29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33bd7911435929fc2496653f38ad85591c54de79173abe1048522cbab23542cb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dde1d7725284f3ba4d419605e7593a4ad03dcc3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4ac172f15e0bc93d12e6b992a7c6d0e16a03b7939512422810d7bfa6b6dc4b4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6cc293ac5a324b3a3f2c98ac0c9361e7b8882a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbaef2690c29fbde6b45d88d00880ce5e2ea807369d541ccd3f29a40d469f3a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8722327342fc691300ed87f91525b1fa16f935d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35d58a17a802fe353dc74e11f14112d992935f2c044e921f4f4ee0a29b298fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dffb376cb303f2e8bc11b0a027dc7f696d97ef92 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b1cdbdadb85e7ca92caf0b3efc9e1db9bb745025086f87df37a50333d78f96 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4b201454f17cdeee78b2b0edb16d58d274ba3b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dca09a547338059beed7580fecb5d3d5990fb9190b7c0d7bea98a35799490b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..045a3f999175dc353085adde3d1c5429174a8047 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506d90b58110502942280149ce74273f12eb7d54b092e59ea9832e2098780638 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28bde2497e2a789501de6aa1eedb94e6b1095769 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af308d74f7aa5f59960c35078746171278b2c5eae2372f547a3721a384aa2f5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..087f9095e312feb252f654f02a9b6b3d193ed7c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de1945902bac0b65fcb43d4f8f2c4eaa613ad489578667bf5dda2b5fccaecf3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..435f18a5f23d87e35d5b25385ec887ac874c8c29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793a8afaa6d0de3f3e0f4487a4ab9f4425bf72a6623392319a4bce211c600434 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a28a6f485f86374c1c59bce0b8b5a40f4bf8edc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8df05192679040e75deb5a5b4b02cdeae6bca6f5f9997a23da47e400fa19a4b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1517333f793c11c156cf684d88e688d6a566d788 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89665b8a20d90e7ca5781148bf4c27d998341aa5e818fff032577c55e769c20e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..160e53e385c66fe3e0243a5e15707beb7b0e5523 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c27a37d0e492e0bf688c8861472a36d264c87738cadede19184521fdfa06822f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa7e67ab7fd5ffc11ff885ee8be1acd0302aaaf7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c824f92889dcace1f3239433a522894eb4b12885f88db04a653f26592fcc05b4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96e53094cafbe0e4dd693dcfca0d96147360f0cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3114e4230ecf84a401ad646901ff72796d3fb1bf456ee703ff911bce5985ed42 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e12161bcd576775e23cd92c85ecfc005d224ca6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24911a9978fffac1a89cfad29b8218b77ed274d1d887178ac1d4be55f7d77b94 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e6a2869742542da7bd29e03ddd9b17365e0329d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3accaeccc1662fffb4d3d3e09e6d424e56850b0acee76bfd3cd130e174c4e41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1259d64d0af9045ac213ffd28269c0e41742bbbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:765d722abd6bb0eeb51779d2f6c758956899029abe056cf01998b321613d435a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6525e40dc56b7fbf53d94468c3e332d6505ef6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11faa8b3903ce7e396db816ee1e80148bb3546e063393262c52b953214b99e8e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ead6e461c97ca2dc6a4ce57a6db8a4cd02f1278 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f57e97945a1ed74887ebf0a5ff0a1ecbba5306b41c67b413285c27c8ec949f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50bb6be47542f600ae017b8536387916fbf2e20e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feae9f6787167a68f9b5a56bbcc13718509ac838489349557f83352c883b4517 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54b57e1360fdc2e815f6bdaf565c4ae45c527482 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9542c4e64269e3c8ec61952a50baf2cb55e72f30fd59b7b5f97d2a5ad9537e1b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d7e7ae102b8b1df04d980c5c5bbe20aa701b55d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae519b337d11d10829e59df37cc9db3716d5bf7830ee7fdadf6b196265eb254 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56b408674d71e5eac0a383ec6d3ae89c0d965e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0251566f0dac317712eca4adbbcf43bf0d4f6c0e5551fcfaf6c6e24bc33cb868 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a63e65aa119a01573c4f78e9a61090954ce50ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3885f36cf26288f9ccc0aa77ca71eda03dc6cea8f1dc08615b7de514438012c7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea672de820f8cd1e4ee1ebb88eeaefe6931a84e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afd6be2b311f15129de99a3040229b02881936af9b1e48ba8f9c3ad7172011ee +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f878de8b85803dec8f4627016806541918107a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183accc3ea84e8ba28d02a9067f8f5759cdfc2b61e151efd5a831fcf287af118 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e37ab449ee75aec6cd742437b06be641faacd283 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3c3a66d98f9ecc5b587002766c80a8c16c66968d1337045b9b141503cf4b48c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..334fa07ad8298cfbfd69f229fbab2d3848863a86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce65187867199c2f4f6e819bfb8be977964aab5cc36a955b3041fc01eb3bd80f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6e9e727f67941055fe48738992a64a5964c12e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860b86661b4ec3ff9c2f3bf77290fc8ded7df3e1fda0d975b9bfad401ab6299f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ad0b47d24e35718cb020ca21ffb035cbe9b5e37 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3397e2064c37af5443e0311abf1ad250ca88e49e68374a5669e4bc511cac3b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3428c7ecfe94efac83baddeb26cda343af011556 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b7f4cf1d541975968c18dabdd25e1c154704ad197012f24a7f2011d1418a33 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0990598f15ede8a922edc2417f85e5e6b3498494 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a357917c3b434cdf50df6d9604286cceebfa2237695e403c653c154430d2305c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aa8879966839ca3a18a17325d6c61b51bf10e29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b10d737ac8994e49bd27a6038e1f9856fba188c20be52cf899d65f13bc5f7c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41eb42463a119ae7289193def6cf8dcc491bc7e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3293cb540de7f65e2cbc86cd13b11607f89ae9e1ce0cc001dc2dd0e870dee8c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fb5bcd920d550c397361efe7835816b0a966be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80a32b1d259ef6cb7fcb64c6ae0714a9e50c7d8d72398a12597f582f6644cae4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cf70701f639cf9a7277340ca9ad391fd2778827 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fdcbe91c673b95036375af743c697f3802935d4b62585a45e17f1da4d36b8c3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..860272acedc0bc1dc5ab5c1debea2f3c124e637d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a8838ae90a295e3e2357807b231f2ac0148f8977364416e00a4339713e93a02 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a5c9c3020df48468523751aaa7e0381a5736d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6821374351dd08ab1171ef2ed1e59efbad76df36495db3da441c9f936d1ba024 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..264743b8c96852c3f4144a5f89ab4ac5074dc684 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7deda1cbe1c82d43ba847155259a953212fbc07b828615e6bb7468e4cf5f8952 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8495758cff332664dc22075936e1cf8d87e96e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6646d08cb5fa2b241c4accffd1cf9f74b9765ce10a9de2e463da17d894c0c235 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6aab82daf64df8f70f306d6bea26eda9fe1263 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19a708e08b4faa73328d778ea7962d48a54a8cbc739b57ee3295abd6e7b7432e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16611d8142689907e3a9df37bfb33950b6097cd9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b31c93001a5ecba8d3a66f28f448b64957971d20124b39e13b970ef4299c230 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c9ceba356a60d62db5152fcdfd4e962152e158 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23009aa3cdfd8d6ad1a5ee9def72b8557f2d2f3140ecedb5477faf848db82f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2376f5d7ef83b8c82f85d067bd6db9868cb0340 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:457751627adbcaa4f7d6d9509a55d2711d728a1c7ae47cddb21760faa08e9edb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76395a664bd2eaa5c2220f658a924f5479b84709 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4661a742599af4b80d7f2b6d720d7763044a779f3017e2685fd822b8bafdbe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88e1a3b7b1a2ea7b32b034817cefff3c992baa5f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e26f47ee039fc6eca7245f09443de4df984c9b693a2d6798ce442d6094a04e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2981a448bfb7f159151e97ab69cfb0c2b14cb452 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06aa74495b91e87c227181ceed30b4f4911373ad4e5cff5aa51085a9cd83e510 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfe8575e6e74afa0e7bbdc4c9b6970675b833097 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ab76098899fd326bc4fe317103b3f24149248e264a0d1ef47aaa13e8f279fb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75aa84cf0c186ccd31f59e75d1be5d352b1d5d3a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c0d5b7fb5a689279b2131654062f34d49fa048847f1b08a6755005c6edf8c7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d321cbbc5984ae47a2e8d68b4acf6db1df826d0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c862cb0fa7b59cb2f072172a5e52f9d8d8cf86d807ee05355739ae8daa58604 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c86d7ffc1cbe51564d104d9be42bae3f871d96f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1af504239374a8d56047597fec917ac8dbe0369ff3262062d7286be1fe82ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceaaad7a07269d66e10cfa9e770c142676d9dff0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b293d70ea19593552f194165618fb1cbc873455c77e7e2f91bf4452aa31bdc52 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..821755658492a2d9812556ec9335673db50666bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9716f33a4492cc2ac1cdbc973c902bc2bea24bed43ffb41e0fb1364611f3be1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc7bdf74e56d3b98d511a9d6452734b1d6486031 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac6333dd969fe18e527ab33f5b4a41295155c0eec85a97ebe4061f52450f013 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0995958647bab1c1d5d280967dc2bb6caa04c9ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0b447d9ff1f0db70464c1edf9a4e1a56174d330d0073855266c8551c66c387e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8952ae3bb3dcc8d48ed2efee597a399d3d8b1632 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8464f87edd17b2b17aa51df6fcf29f43ef77ece6063b36f6b958b59d0bc45c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a9a1d21ac0daa02d7ced610cf7648c7d62896a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:223a74052d783eb219638453c6ff882a887ff2c85147c090e3e31b818e7f9a8f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2062f00e7039dcbb7e306a90b08fe1f98a63cebc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d857451f69a0808ee02d70561a36622d7b0e2cfed5158987de2d5b55638861c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02ac4b0c30efd016fbb054ea7e970506142f9057 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256c73449eb1796c461588d766193a3d8f9fd2b90bad5d82f6760a2164224651 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4a71aee93391a926cab2c44faa17a7eb9992e51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eb8f6698311d6c4dd80fc39d7b8fbea6247c2cf4eb25c14690190a7a041bbfc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd5dc25088379782da7bf65cc4cb25b2d25644b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088e4dd1333e890c5d7d560153e5b3e28c061acec6504b233b5add75fd80d7a9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d967c2f900c78455a564bccf8e594ab679ca64b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eda94e24919f141435423af88d8bc5299da67db62d456b0cdd6e09a3583eaa7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff066d3d614ab4cb830db293e7afed6d86ebddc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c72f1437fa17cc0d363ade6610330bd85fff695a775c1586189cd3fd750b323d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4ed811914dc779a3671169d0fec253dc97193a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29120312d32dc738a5fe7878fb1792ebcc0cea2b66adf902c1a7e0aff3eca09c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e20e589ef55d2462dd178c6b44bbc512a4d1201 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6417a852b64c3cf9513f973fb263f6fbdb63b8ea83d8d3424a4cf03d3044b181 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5daa81db11c133530ae52c32905ff5f2067b8402 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5dcbc324a1ee0d5c25e5e1e8da0bae57d1d3ceadd8e0335201686b4a2bcf2cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eac85cd4cd9522fa0001300020a3a252ad6b3b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c120b4843a2e19f7bb1d99c72d7f203ffe7793d0cbc90d20a893fd53090571b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4050808059d7c319e31e2a6601610cf038115abc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e81cc494c1bed659ccb833ff24a0a209e4fca42de1ecace77c960735af34b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dc69d44bb9328bcf02522df15af4e8f9267a413 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfc18a279fb1e01f662e76aa7bc2c5c5984ca519bf2622bdc00835966a704ef8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd4ba93ef6d567569a6866114bef9a48d049b06e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23dfbf49b23c76d3bb6ebfde7b57c35725ad32df9b4663c389e8bb1079619424 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f183405e113f0c815918c78e3a0eaddb43f3adb3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a044e7c3c3d43c14220e58d285f7b43acb23d3da1b2656f8b6b25783c53ff9b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28ec96a2153bb2af7f2f2b792ea0b0968a210c6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0413e7c217babbeec6607a9398c7c9c6af70571d1a8dff5ebdfcd5efd33c3306 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..503746a75e009720dc7f88238c01738a5d154107 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc5959b8f6689d0954f25440cf981b7fd3dafa7abb97bb87e2e1c8e3e74076b1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ade0eac1acb0b15adbdfc80590139f305ca532 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53bf38708f62df5a202b19c1b9e019f356df4f2f2ad52acdf6efe76ceca3b8b6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d52738a9e5c84e98500d3eff31574b7b66ebe593 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5a93d5213528e4510a36214bab5d21a1dbd90a11d41efa76b44bb4277238b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a747b7723dd453265b4f869e4bba45a2b1bc864 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf4efb152ca241247e9b0f78ab15c655599d9393bff2d35e77ac7548c59384c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01ee6a013155269299ecea9b997fa0916fd8b9e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a20d0ad9110f6f2033f39e44fa02e94473819517ddf08becdb27c338b5aba0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e960a007431cd826cf0e0128f0d0468084e2d24b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c724cb306deb94c5951f72179ebd0831da914d5731d7f689ab037825d3825f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4391ad731cfc798d7069a7e60bb165c86709c84 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11df4400f7beb837773d3550499761635ccc375bdc13c2de281f6b5ed48d7578 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07f8908e16fd4efd8fe5eb287a513c1818363808 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d429eeebca90b0702904ed47ef30ac13ce7a6bc14e7abab0f5c12a9313d0389c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..031b23e3445a56f0caaa15224e29d194c9bc4b4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c5758cf50e67140a0eb9bcbb9dcc76df3869b420a5a5569ddd318cdddc2b9c2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d602e61dd93aefbae222f8efc76780ebe58d4d28 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:390a98b2851fabcf93a8de7844fe5f526f61a17082736ff7c12ddecd25d552c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4906efb9f420bfa7730b1c424e82301287794727 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_13/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d94952d6f6244ef5a6b0f6c4687834aeb9413b6345ad94a4629640ed088ea60 +size 11395