diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecc353a7441dd4585b4dced2fafad3f7facbcc17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62588dedc783584dae27f3d23a226c32574e40ce323be72190800b9afc6a9021 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcb832186075d0cd8d770398d577723c01615316 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058171cd18bf5e9198f2a8295f7b3e9911bdbfd82283ff17e06d4d4cb5f70c1f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..212b2351923439232a1e19584930f72a1f5fba04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b67b588161abdd597005966f5109842aff19c10b0544c0a9b6d0ef91260935ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..053580c1c191a85d75acd3c50ebda185b9710d7d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85400073b12a2946b828cecd3af576549a350e9caeb9baa7805e704f78bf5612 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a582b46b660e2d2abfa9793e955943c2b4f1e258 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb86f07ab8da41b8c38d544bddbf505e1de1c4b82ad6f436545995040074d6a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..445b8d7d7468cc6210a6ae856c26408f4130921b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9bad0700e4f7d96b59bc9e70fa4c630cfa9b3421f39ac6afc37c26933d244d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53f41053057f8a20cfb646a1983b6ec66e202eb8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66e3177a268b8878240ce92a5d364b47d136308593b3a505cc464b97eed5d552 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..067dc19bbb7236fb2c9b644e28d1c8bd9cca2654 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de94ed9e2785201c2e9b0cb152588c0b03d33055aaa2cfdc2e774c73c4ac11fc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2981a92ce3161252975d9aa3376f31f09786609d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f92e32ed9a68cbbe9f89a5632716787ed02141cba5283dc7a35a2fceeb54fa4f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a2fe18fda8c2801cbcd0b9117b8b094f4168ab3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d0d2c9c05e779e12775ad6ccf0f0798f322e060c05d70bbc5063b8a5bf5c08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dff799771b24946828ad92f0d5c4a320edbe4030 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc51217eaa0eac1c5383099a385314908c341acdec138d07f43522db451e5d8f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9650bcf7c8d2416fb048f519a317a9fd750566f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66f70ae451e5e7391c2b747ca5a6499b5ce0edd7807dfa4cea987794949a10d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee58d046208a7fa94779b526d043e5015a655f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c13f5c22a99f97522b84bbd365ec394a5ac00fcf75996fe620dccec6ad4451cc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..027e393009311295d692ed2e4518624809de8fb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7ba4111174012f68a555274a22854073cadee34115171cc318763646a8c1a8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce6482be5a17bf3b96ae4b11eb30190bea368741 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a3dbd9a29fdf8264118371ed7577366eb7a3fe086dadf3344cbb5482fd2b314 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb1d22ec578ccc8d380ba4b12ac4f71cd33ffe44 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f01a1739478e6989ee2b4b0261ae3965761a71492af28ba226adff2575b2ffc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d10ebf1e3fcf094e4bffcaba94a3a4fb7a68e4af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f43fef3a3f905a06b6a50b6f5837aac24e56e982d865ef6fef78aec32a101059 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c3ebac05c3d906cb1ec48ff2b02f1e78b95f3c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b273c190d655c5fa261046425acedbe6569085a040fad58d72e1f5d37a4490 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a2b34a760677ad5d17c35e19e1e96d76244d6bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77feac19e2596c930be95ed91d5099f6e1e2fd9bd742a0d7432b502ad787ed4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92f9c5eb19ae72c9032a6446b56735b19e04e10f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:094405c736b567bfac6ec788d3d360a5ec6a58dbe549068284c9229bc6e6c173 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5747f8327d21c7c399acf1a704f14463cb9e8b74 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c2b1cc354135684ecbff2c221daca459f5c316482821174119b5cfa6246a21 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..959c3fac672b52256a88b2ed7496ba856e98bc4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a40b19abe7b34c47ee90b948e87a6cb8fc490997418cb02552f6688de551ce9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c831a540850e6b0ba0306871d7edbfdd5d2a0f7c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5943f1fe50d05d9a1803a67728e5ccea9eeb99bf4278d3e19cd516b6c08c7d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2900b8504f74558f8938ac5b1f2ddac44c388694 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f2463491be57644a78413288df310b6d3a2b041af44cde6529927de23eb8fc1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d90bd993a6eb4548a23d23bd5aad3ed0c9ac90b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232a51bc25a1a069723ae0c47000bd59e340e9bcdc42f3a78c5e2b8b12c77cb8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc5b74099aefe4f3831c749420e51d366acdf5b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f262d197b7123fd0bd2ec91c10f275e8c474197fe684683889c396439ed5face +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7b8f8fc62563a20c51167d40d7d8aa7b1e1a9b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c95b2bdf92c100fd6a933dfac51832358792e9c0c6107af11c3d672cf98cb798 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..809abf7b8c8180f114d79b2072f05f831e99fe02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba11340ba6cf3f818f3e8cf3129f89f13aaeba44fc4d5e1d56009de33d693d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5c82d11ff285dc2b305316cf1c787585b4b7df6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9792d51055f0c9c842c19cd75f1064acbe885d64a18c24dc9127f10a335dc839 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a74723f4d39f616a54070e339bb61236253fc902 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:417c12a9873ae0f6df30319eb301b77ffe90107bca93221638adeb8df1fd764e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd606f49b97324dfca6d156eddb79c41151470b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0003f764d622123135a8a1452cfc7b1544dcc52ab5e97d370a449765996f3b00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c8247ccc34e1991f0f1a65ad407c999cf4a61f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04d51262c820fa3a9757a76869453711f826595b447687c024b9eef5c0a40324 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d553f34c301e9a1107872a29f74e24b1521782bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65ac47d743b006e25d8bb66db647cb64e2142cdc752796d5883d4dfa607268e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dcd38166c2960465927e3319fb553bcda0da77d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcd5c1bf779320e26aca96b58cacafbc0350df8cc0329ea16841a2f2612622f5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c0578b8e1bb9945fb74f3e961d9576d31e419d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fc8ea5aa11eabaf1fc4eeb4fcf16b07656d5aa519b79b269c914e8e4ef19c67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b547f494f05827665116da32210ec88b34c4f08f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc2c85f813e35d4b11f9c0cabb0899cee84ad46adbeec9312b0a557a21fb170d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cbefd6843d67c242da38783666fbd5cc3f1ee5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e5c607ca7526f723131e6deea5981adc17c1a45e37f1856053843501a22367 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dfbe69954898396b4a012408607eb1f2df430e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303b35b6a30f48bd3ed082e4d10c3ab4e5ba98545bb83dcac18019a7e53544b3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8563a67c37270e4410417bf191620590cda7951 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:101bf5b7913f52e4a881c5057a776ef0fda14427306f5f2a83a49b36d84ddfa7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbd2cce1d72fe4346bdaa3a1aa0d709170df8e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941af1030a985bb795d5904d4be9f95aeb0f759719a31315f4b4385f9f3373c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bb2c9b15cd5ab466510d169b1655e42eeea6f97 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf556ae5af8d2b4fa955e53c68fed62558c0753fd02d20927f7221ee91fcf5ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2acfc7ea21e50b502b230f1217cbbf5b65939456 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:625e4116029353c5d633b3f1ad8ecdeff61711e3dcf995ae4f06e943be43d347 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5c4d6d9dc2846630752934bf2a5bcd51ccf332 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:367549121a6bb61e637dc87330802b668822862fe306641830f73871f6af884b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3997f7ace60d53c22e4aadfb48ee5e0c83fa2ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28526bf52d17cf6a96dc0d76bc063f62b921fc77d888445bc7797bd436a809d4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7edcacb7e58206e5985a3ef6657865696121d2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35d07c94c23c43cbad434963d32869fd3b56a2116e0d6539e9438cc42b3498d4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..144f3ad792d3135ccd24dc4b09235b4cddd93904 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7844eed14e9d7b283649df6ca4090fb8cdaefe1a2e11e00a4ee585b02227492 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41f14c0ba811a638eefec59dbad7136a0c8b5842 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3343719b63a8b47f2cce1eadaee689e094335f68a2f333daca87e8ae4c09622e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57bac92cef301a7b15f45f5b15bcb3b55d6bee1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f163e72169d053d8289b207f15ef62ab0782f6b954bc734999345a96a4a6ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc6a84bf2f04a658de9b3388184d2589b4e4b6e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5afea74a9a4baca941c84b7e02ac524c0722f63081f4a103be89a14a4e43011d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a93c40e14a6cf0b0a93d3be9089746634bd5821 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f527988e6185dcf7793aaa250faa31edf32cfa1022a9bf4d5adab4a8d8a79da3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df8730ea571c84da508f919e8d1b49503fde6f67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3354b3d0fcb762ed208c35b70ecadc8b74bec8e431781c23fc6d06ff773ea960 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c1ad75dfb8f8ea2a721bce93d100002b66ebb23 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea478f669aad94f0727477fb1685a88a0cec2117e5db0dcb4d234f8c5bb86548 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1374a5824ca7350e0a812ff76d23d04714822b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1928cd7a183812a52b0e15ebc2e143228f410504450daa631576ae687a01af71 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7ef15355d5c05dfcd80cdc94fd34b04e34451af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc6d66f42d69ae0406b71d0c3c862696ba4a862b86636eb16021d12d045a813 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c79f454bed3c0b39b08ad2d0cc04db135ed9e54 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:234f634c9f799f09db16e52bebe4d159c3696f0adae3d42f8696729535491868 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d995600ca101de1caa614fd85a773a93d119a542 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea2b41f2edb7dc761ae5335c08692297733344e01ba897192814a190f185681 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a7454329901f97d3887f1891304af0bf115ccf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e641fe9351f786724f3b8a768b80582b46666a780b9845b1ec4815ad962f79 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4967a8c6c2b3541979567a0b6a16ed87c02518a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd6593eae28144f0b60644faa43616cd88c5951df0dd644da86bab493b57a485 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36255e35808f15b22f6ccd6f15a41c79277626e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9207bc75b78b72396c412e9bad582cb76afec38a9d87723d8377132c76559469 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e996a196081e3b866119a29847260128a643abdf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b34f73a1cf4dc80bd22cf5356b5c52a63219dd7286ae5937c78345e32e4acb3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd271050ee8220f229e3faf8a5d51cfc87105b0d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e1710a0f7a894c40a7003b2007e3f12003c9c98ad8d2905d2217fe3880a7b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4d03f53178971354a8e56cd448010ff06c89534 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5146d875ae45845c891f40929b427451e18ccba273bd0d9617f21193d658864d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96dfb26818e693cc14d7482f6c3216e0ba1e5172 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7692003765bde7c14bdee4ab5f31ef65983b65840cb78dcac5997daf5abbca8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc9fe4634edde2354ad08cfe80a66fe91431fca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a703eb5d50266e53eeb2094e4d1ad6ba90b3deefec0497b184402640ff24eb2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..331878ec3bc6f873bb484de5d72f6853f47e3b7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e56fbd3b7c43117c3321a92d0a58f1f288b8ce4bb1a67a6f4c968a8151ad405 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e67b247a665eef3a290f5b2553498f221e8955a1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdfba78b640dd159a87c4e1e440068fbe41cfdf484785519d3fcb46da855e7ac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e2775d1e32937da9f4186710f1952894f9f6347 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd369d17001d8aaa7bcf9619411c8b20dc129d3a2d7bc7dece1d9d1bd9e506ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2563f57e65ce32ba7e8ec4dde530f89bbf618846 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7b61d9572c2c969c324be4d412c0cbceddc703679e49e959b99f5ad81873abd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58d2662643bbba811a79c80fbcbcffa06e06a3d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd6cdc05efccc61d147b96ea1b6ff399a1e9d9d01ed4db4d3bed2314dbc20d53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e62e262b70caf47091c04f054550ebf1cf63e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7881cf9e9e74786aed1d67419918169d2890da806b68856e8773d86105313acf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..529e63510eeb4b28ecbf814a2d97c83b216272f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:971c6252af53e479cc38b296f03fa3e42d806bcaf82ffe5f9d9c0f10b67e6a82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7f5486f8138d5814a314ae4f85cc9be00b61a5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d535e04bb7a946fcbb139987ad687ae050661d3724f90eced2d74f58aef3c6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3ed62021d0d9b9c996b0e6031dfbc3717d6084f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d94371bd165537a6d833fec680a3815faff773350aba1449f563e39e98dc2ded +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e970b4a76a027e9eb0a3b2761e960b308da7660 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8a44f7e288218194f4bac75c2424c2d33091d03bba3879fa0dafedb084157b6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1098a3829cca813147ad6404897f9372beb4add2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079650c922d45724727967501a551116da49935e529f36c8381a0d186dece6a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9579739f21e4ad27c6db2bf400f6c94479ee35dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecfa89e03689a2d51b65cbf97d421d74f0eab924a40f016d8c45ad74ed777217 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2c7f466df3eff6d72e13f0109f84913da6e9092 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f83fe9c52af83467333d829389167ec09d20d22a1934f6b43a646c737113dc46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad2c1c4ecedc2f379a3d5a53e5a8eb7d5414adc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:913efaa47d117dacd599dee073af7de26902501415d471f5d680df0612241c37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6397a1f76d80b5c0be1cef4edf692e5356962789 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2dfd1b8e65c0ff1176c398e03e00dd64b839015bd8e618f3aa093ff96ad38e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad90664f2cefc57f616599793069d273eb9cfe02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fccc597b71aa6208e170c8d018c93e3aca817baaf171ab7f2a628a85e04d16c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de94609275d23e07eac2de78f4f33b4710ed0a4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6ac188365d710b983b2efb731985fc187e740e1efed539503252362f5e74fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4dcafb9dc428fca7cbca40da078c325c06232d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd1857d5ffefa16a825357f932f15ad08276830737d9c9e0327d00e3f089c184 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eab59bb1201c2ac1e096651681f4c60bc73593f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1bb9128c47f0ba24467a14967ea90ed9bb2da446291f1d85898019d5668ee1e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..160273ebf04c9fcc52eee6522e4367ad9628731f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61c9e72d039609f3562c2d050ba6b3232576bf480a37f2be045b910c2ec57aca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..657fd9ddb50d1225a9c2d117b9339091c40f730c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b523792f41072e8a134ba7f1395285dd0c9dd0875d01df216c95f529005b398b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abbc836110d39b2d29118a610e57da4706d25120 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0725ef641995cc000d3074c1112b93ef71ab433821380b193d107c7e1f776bd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1265c786f8cc75336ab74711920f6833903511a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2478c36a1f27b7836e45bd71e085b681a1feafe0ed22ef2ae911a550e2d0e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78cf1c287d255bee3d29d12757ae215aabd4bc33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ebb0a700a21bb4e5fc7d235c5c46c271d6488e8cb3ec95882e94795890b145 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7fd96581560cea152ab664191aeb29077f633f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e5379c1bbe88c9b6152bf1a244d6c3d200045b17ada87c7767571529fdcc11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c80c5b8e754ae2f76e5c415fade29fd3a7925d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed1610eb9af27cbb804aab7fd559101aa0ba80f12817d173350746926bb4594e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df5faa024c7bf6a2b6f010f57814f92615c8305 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b89b69376affe020503aefb3a768bb92ee9e4393e1c1a257884090549d0f2c8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af15a4abc984913f86ce352d1f70edb940a42ee4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a40d5b42888c2026a95fe5fc809ce50dcfc684703684bbe4ebaf036f6514202 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4ec02116189fe4ef5ae388ee2c40056d8a4f66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:decbc3dacc9d5061db7c4b2bf31b643f0c9d6df8f33f8ca5ffa998d3a41fc141 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6237c7519e7668d59782708fdfefa74d96edae9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d796529418a30c9a4e3dbdf7b6eec1236504db53a185ee58bd7ad82191bc89dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9f1d1963dd3b131ea1bd33e9f7c5950e65d2b61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1a068d8e7a19a5479d7a3272ff0935e911daf6968909deaaa707aac7bece4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b3cfa761a43b11f0216a250a79aa55f1b0ea72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f5e90237b2f87faa680c6db358619a4f0d35d32ab630f40736e0737e697019 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3634576da60f1d2018b7df2130d61902efacbe0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f668f36a9a43e65379f2f2be426e57dc5f4ffc58d123848c907f337ef43083d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..536ac19aaaa36a448431587dd001aa056ec009e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76034c0739f4b96ae0d63b5e2d7c8c514ee18033f774c4739a0fcada41795556 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b2b371361577d266dcaa78c55c7a5e91cd879ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd751ad81ff79e46edc6650fb712f920341163899f49bc56e5f703df6e5a3b8d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d58705ab4b1f3fa7ae2b62b351aa2d0f15cf7012 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f5c100aa228b3a48f455548f66bce612175208b89fc2431ac510b43b9266bc2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd5a9cfabc4db74b3966a3b69876d319db15bec3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24cf1a23d5f3a47bcbd5f74b698c8c1d0e3160f860c207dc20027713afe2fdbe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..796717a8c09f3db62f285b653c450fdc43b639c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ba70191f4f6f91234b9b767e42800a0fa21ab60d27b4971876f5286b481dde +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1180b239c1536e063a67ade12095515c177dce04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395ba29c314f15e975f4c323a6131a37583a3a570331afb755d6bdd0606133a7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3736ef591ab42891bd82c62a27a914a3cc0d012c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa2e1729d30020d2726ddd6e69351c24f66284566c4f59b06176194089d0928d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31c034dba98a73415ce2635e0128069728e40946 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c76084aa9d78c955db558ab52b409755920c81c9e41d043897a702c40c0a499 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a72a6236c6232de3ce154d392b1bab11eca93e77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f25d5649f2b8ce41796ab4aa9bfd7bcd8d376daf5e5f2bec1451cb7fef61c918 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fc7f49d7144eee99692d8047f8db120c98c7a26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac3a02709d221d8ad2b311444c60e4ace195edd70da5859e5013684d5108c865 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a2457d9a36b9feb898c1a7e13dcebdb610fd326 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102b9750ebde22176e7c195f5beaf72cc15e2a312f26b2b798b135611a71360f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1ad5e16b3b184fedfc83588aed73afd391fdeb2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa4a54ca893cb4f34edeed4210b5cb5eda9dc5ac853a0d6ac456ed205e143a48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb63ed8afe57b8ad7ea391d8d7aae8a87f15c7dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50e6dfade63f1ab17146cfae8cbf632205f3abbd3477673080e5f3a1b716e98 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c86c767a12c34f8a09b45cfc12b8a8e2ec81571 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90aae9c3e0b1b1d1cb197e80d55d7aa48a4dcbb9e5f6259df11c9b4369c66bfb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67ae8e0dd4405c9f6cc869832280af9cf7c8074a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04438d303d2358243c0d971f81311f780ccc17eb96d8eae95b956e260edac56b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82df44d45e67d4e587073e295cd553d3dd88d105 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f14aa2277c63410dd8245518c542546c624fff21aaa30175358fb6f5a41b98 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a606c82defa5a9a7119a9f19459a14127a370e21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b98363d53d101f8548848e54adb473b8b94b1eaa35fd968219860f445b11820 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37a9e658b63f5f53bce7178bf506d41e58a8177e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd1f5480eb35e3836be8b35b6775bac8df63b3df4c1ee7ea8237161070a0fa9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb8d73cb28a656494e87c996923a35c072c1cdc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e491f8db8a75e8b3a2aa4f5144b64fc7b5d412f2d83de66b713eafc2b3382cf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd5b46d2d22e4ed318937955ce8ab88e157647dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fd63837fda1134477602ff82b3faabb8e5e3d64412ab2a7d2804f14d1583573 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69541cff2d665dcbffc6b23c17f727dadef609b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86e8e7b403c69b9cb54c9247c4008bf12d0d9b51915a13ee236ada6f6343873c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ce3975a01748da03dd102c008b4b184b40e68b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6807e3ee3376a37c1ba396d0509b53f0bddb9d51a833bf9b6a6c2ea26f38ad8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..635adefbbb3317e3b0b74930c0b8a704a38adbb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df753e0154a2ad7e65a16ce91d34163bc7e8655ec2412a912584325826b93fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aaef0b07ec34dec4f9c0129bb8bdf666a141790 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e9c535991fed5503cfbf7e79b0904c3c7a36231c548276d3879ddfdbe0bff8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c94322ea4834b0f58eddb211c0a460ef9c0e72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09ccd1ed982989bffd0db3299d8a14cc7eb289308146d830dfc6e84526a9c72 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8104753dcaf996cc35cc16cfe0b67e78e1882aeb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70c94439967461ff03d19d13d3e39fba887a94954a0f15e8b00bd3c15966fe21 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8739e4c02d7cbf344335b53df3ab36564bf0c148 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a1ea8742065c849fcfab323040aa7800f06e11c743a05e4616a30ed2566ecf7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..410b1002b3bcb390dacfbd8cbcd05617863a19f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:694a4565821d96c59d6c31f980c785aef0a2a21adcbaf8805b53d7c023b25d38 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..791f5d9d0c3baff218329b3447edde74f1837938 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a5199dc1a43d87f769e48b1e73329f4b2003d26691fe2949cb750cae5530e7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e9ef1840ca6579395e0fcb7c93f36210a6e3ad9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfdf780e2720cd4871932fc4f12c3541f82c34c24d4c34d3a86d4a1f8aeafbd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9030c59d4bd347627f471eefae9eaf64a8f54a9e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce6fec9051fed115385ad43fbc55f8738c95f31967f8d1ca9422f5c8357e97b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f2a202da5fc96025eee0519aeedc987de395e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4914188bf2f05d097cf7eb628be383a815989f728412376fbb6da8771a4df2d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ea767bd38676b430d743f2701c5f480e92e60a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fde3b25060749d1a2f598a28aa77d1561ffecc7489336e953046cd6ed7bb7245 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ebbf99227b2d9cace6e9c37d4f3e38892c7f07f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c1077b4cfa61cb61907d25d3a057d0edf56cb9bbc9565a9e3f5c1dec2ebac5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4925d59ea2ce2bed9e7b79b2ec3c28235a7b2627 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aab317a5bb6febbf1ffc8b737d78b38fe5593d50c4a710d21c4ed63463515a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4505579191942935c67845628ac48d2b49e50d7e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86aaec02d04911851c6f6d688acd2687157232aa046b144068cd9c1662026cf7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..173af1588e5b774e9f3cd48180a31597dbba5374 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2f182413712d715bbcd6216cf5e8675acbd0035f8a15f8372e9b9b381f2bc6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdac4596ac4a71bdc9c8a29352ff7839c84294fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc4037cf9ea8fabc4a335281136b3d0a7a6d85fb1b2a6b90b247d28d64a8c418 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4158a42b07dc9a32541e5cc72fb809e62cc84d77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5efba800420e2fca2052a1285491b3c805d214827f9d5ca11e2f0fc714bda9d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..018f108e87e9967b4b41f2748cd1818c4b529e83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f5fd461d5a6658e8f40866962f974a70cde5bd57951588253e07a04fee2e330 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5919fdbdc83e1183bc9a28ac3f2762dd19b5278 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79148aa236b72b8a178132ac48c20038a98a0250c1b498e135f4744718ae9e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e4f23facb53d7df330129e615ac5f5ca5cd1396 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20147753d0f73c0367ce08c028a632b4aa4fbdd8290055ee21c3e919c86b3ec9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcb7a170ed2c86518614bfc6413a7872c49c2c51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003f3e0b67f78ca2ae372c62b821933a138a205bae54c3cdd2de5669a1bad98b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a48e61ea76075cfc0ec38d619899f3e8aab0ccbf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eafe993296f65b5497769794b4c6b0e9c2c6f36eaf0a14bc06749a96728457c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff64591271482902de8a3d70526d468514ba653d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:108d30e9f4195cf708335f194b0f1089f3ef53984fdd230db8eaa07f81fd5939 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a9863f74a67b656be02ce203b410e5c2933538 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbb353c3c655dfccb5f65a131250017cbe350ac8f2384684197548869e3ce356 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09ff8c2b3417ccb54f4df4045e978b9b8be50ef9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc60cd47afabe1e655387d97e82bf030f2e870915966a30e390e65a9a239eb2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef3d989f429b817bb9eefed35e2c6cdf8c05bf68 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef4e28cfa81f43df2231fb272881b2b8d4c378bae1c20fab058ee6f49b628392 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..681be94af9e9b9c0ad3374aeac036a1be2e56b51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a24ffd4f67ce6e6813a3a20fcea2fbdc1854401a5968dddda88b381380d4e85 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc7ba6b549647ef2dedc15c8a4c3ab8d3b92abd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c17f02884e8d07d91515ee9f0c3a40489ea2356cec8e0e791fad02c20b9f40f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98cef51e12d522a23c1e45037e77801548cecbb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f227e5ab1620d03df9c02e8617f1c52d2c5179d52f492e53b3426f33a7d0b8c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..888881c21dfac2c3cf2d933b0cb5fe95b62a77b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdbfd75c8ec4f7564ea0b5616fb4556fd5a143720aba39a7dce12c5796b4f8b0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..049d2c7bdcabff5173293608abc448c80350dcbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899e7f4b434eca546ce6cb0ef95c5fe12c7759acff1e85b0d3856c36cfe39c08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53fe9d51fb3252111f3b9ed8b32133df93ceeac0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a9d72c76d0838f01321470ab66f28c4f23ad27548b7e389f50c56b59aa432bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..412f18e202fa501a1768efb9d5c64a73609ed0a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed54ae366678e6208b998332a3bda6ca9d95a3b4c91680aea46a0ee111e680c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e00fd4ccf051c4d5e67bd5d489efbea6d9602d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbde383eab3cac7a02a8920a5bf731bbc6a037dd51e39043f817541a42942751 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc469dfe564cd8fcdd12eb62a55dcb643ce2f3d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36c7db0048041e1921bcfcac200606153ec5fbb59853b62772228edae26b9ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f63af3e7e0ca23375250a0a089ede2143073da22 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58c60ba7b605d4ee7f7ba4aa0e1c9e425f5ad02e23e2c8260d1a7c6e4271d78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a12c87afeaf0e0c93a80a8d3039eb20b9d00732 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f4cd3c0815d19b5263506140f15c85b2db13bfb526a95d32e6e6e8022c58c2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1835fe94af48cf2e97aa12b7bceec6fe8a4f808e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3731f0af1dc7c594d72128f94cc9937ad78bcb7803baccb4604f221f65cf6ec9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a30ccbcd99d890ed8ea16ebb1e98a367084cc46a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9153c952907add25b65dba75a3d3d6afc00721163a058c2022948086b96f384 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cea48a47461029db095fbf7bfefcbf4a32064344 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b5e6ce80e7d364f5bc43a36252b2cc7f41fe484ee76fc5ca946ba202a0c9ba +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6e7db7c668f45e150b66490b74cea7133b66a34 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb6f7594b998088b982aded4a8771a56ffec7cc70737f82f80924407917b44bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38bb9fc765ce1c24453c1a45a7ff79047bc3373c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:269ed6d102475b24ae1cba1e14545988de82ccff9870186981122b1387b49203 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a0c7abea91442de5c57bcd92a940f8e7baaa0ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c94bb358ca3986cc70f680fdd96839cda9d8ccbfee856aac89a2e408f4cef4c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7b301ff2bac1b5b2e7df28938932cda743b0aa8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5dea69d44a41a325b00843e09b7a2402b29645f7875543918e54102acbcbe2b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3714ec815a3719679c797eeddadd237b6bb4aee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe5a2f29a0d6664fd390321e7071949418924cbd26f26739283c06062494268 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eb6509c7249e6f003226c475d67bcb2b0f6072e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6239f1cf2c34714c5d686db725cf64b61efc3083cf653c22bbeb3558e6514398 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f66eb465c9a036b6788c7af4de116681a8b685c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e257d1fffb394299db4d801ab44d15e8bc06b3953ae17f706430df86255590d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1cba356cad1383be2f5116953aea4c871cbbe6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c22f0a5445574603e132e875ded72beb9d74257a3eb783464507d8769be5b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcb578910b0f552502b72d8551ed6a54a6834160 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0289fc968e2689943e54d90149ae57db9c1f4b93a6b46bb2981ea1a8316535ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6309c1bdf44405e4c9b35f6c291b93503ee123f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b2503b1501fc905372946d538c0b71bb0dc3f5571c57d987b16c8a9734d3bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6a86ab24f27bf183869f4a013a382895171eedc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f408b9852953cec4fe4d8512bf10f4d94be607962ec1f0ff7fad10b81617f048 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97a122a636b6a8500bcae49ce7d89351cd0c37bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e92d7258f71d22c6de3d6a0c186531785fec9cae8f8f7984387fe35501736cd6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62cb7ab7bdddea205dde12737de113f7bb89bca0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e0a4206bb708dc18cb584cd530115f46a4ec52483e47f844cb0fb9c5b00ce2b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8602ee198b930449b250e28fc473e75b7171fc2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:004e2e2b2a37e39c7bf1ba7dcbcb9e927014ce64689a6f53e24cd4a510f8d10a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecfa1c23c8e47910d4e9ecd88bb97be614d93ef3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0433a1af67847c0b404cc2099bbeb87fdd3aaa02dfce7d9bdfa5004570db2a64 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..805a81b2f4d0e6f16e3ca8edc94c3902131386db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5055c3216fa1e4802f4a22e02ad2c71d055f47e5d48ef5aaeefaefe837f80365 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..868a4a8a753912a5a8da9b484d1f3e5a10a86c2d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b57cc8cf5d97b5a1fd31e381068946f7a3c7b3feb7c30cbaf1c1208796613c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a01bdc746ddca0a723237033560854f28f17260 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59726b102781e97661ac9880d90b95f64151a1d4bd76ebb52285c05c25663afe +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d82b0e52f165b12e61199e70509f5946ca8113 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b54a8a3ead234201c601efc9a8d51c0be110f53b01b92d0a1ea201c5a7c4bf1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3032d9be1aa35beb05813b037f4dc5460c8264a8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b63bc2d5c3ed7467e051b777b500eabfa1bcdd823407b83fa40e104ee94df1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c694c3135780f48cd8bdcc58ba4c01778aa9218 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc159b098dcfb764c1a11a76ad97f3b02f17ffa560f33aeff181db47628aa3e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e21c2b5dc03d2818a524315c6a0d89d2ac601c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85298008c9dfd86c58db0c2cdc4b64e59aa0d2b292a8f473782010d7232a8d83 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30ffc886d2be3b434eebcb4d97f1a0cb53ba94d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5c0948169df7a716e02b7af22c9688c1cebee85a7aa8514ba713ddfa4bb461 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53516a7e7b5f2e7a44abe52f3f6f7edc795cb3ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1d6e7d27cc82003e6a2215ecd74994a5879fefcaa5c292f1e9092dc473657f9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ffd8968e5adb87d995d365439a944db28b96bf2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83a4cbc5a53c4f918d095a8a8c2451b9b5660518339ed8c35a84cc7d057691b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ba168e69d7c7e42c79ef24ffd6f66f67e59b1fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a65440a9dd5cf74b85c90459be4f61d9009c16f3480e99d4647e3402c919fe82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..154fb3950a891bea5ef5a57d70ff0f4da0b5e9d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c32b336b61feabee153d203f6ccd16e514837f6a5dafbba0139b93fdca8c04b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad613d5f1b9c5082dd4a80659663332c445ef380 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80ca688d03ac56f8496fa4e4076d9155f47984f2d2f3e8d252dc8cf8b5aebce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf6e931011da902cc6a4760aa3c854af889a0e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d310efa22f1030c3d2fcd8bb635fcd03805962f5498e78a60128739991ec6741 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4086f1cb0384554b49adc52d5864fe36846c918 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99be01501d6bd40df00ef23bb9eca47b68bf4fbe49fb6ed66744cfa42ac6888c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2804d2bebe61ba08e3948a2c0f594cf6edd9369b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc8a7e7f0570e51146ee959873063d7a67b050a73a562e79e53e126aac98f88 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..034904a8fcedb86b604d45589f675227dee07ab6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db48640b8e98eb90dd6fd00dbaccddfe93045dc8f8da5ba3a1f6e31bc6048015 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f976af7f4bb5f8f442492d21b6fa4806c05cb1a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71d9a3283aeeb9ed57e07c837ded744065cab11b27d23c1d66da8db31c1e0467 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..432b32f841a4519796752d544a87f7e19d1afc81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38639910d9d8ffc7560f035b2483ad65cf5d7097be7f39f1f1a23db60aa9c655 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..867301db8297345b8fa53eb434220d2422a2c284 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8097f94f7cea1900ca5dd78e340d728c0be4072078705665019f68b58b26a27 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48f64ae44ff5e8e509bc32e0ff635fd1f4a1effa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1b5c609d8efe51a544ee02807eb0ff057efc354c94c8b2d17d88d1d225438c +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d82c627bb0a26a1453881d04db4108a293953529 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1de9725c4b5b87c789ac9fc5119e9d8adbfc272cd03b3f6f3a598667598c9c2 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7aa7ddd922b1d6d13655fcc00230ca4255aecc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a39c185b846d08d28856a53d4c2828b355cd78b29a8e2d5fd4f7d843f2f309ed +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be6509d654336de0c80bee60f6f7efd1ec369063 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a7d1c1039ad969c88e29ccdf5f95dd7f8580f9a57f567c061c538baa84d693 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fab249a014ade8714a71f0ddba4e9f588b9f21c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cb5bbb1c6de5bfb7256214b2b272bb8085b29b45cf235ff93963ae369652cee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..202e1fb74f8e02503089dc9665db35e71bea863b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34623c9390d3fc91429927a734cf71713771e28bd9677c334134ce032fd3ca3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d2499307b91782241d776ae134f5c2abcc598c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10645d842b83f9947c5c373f1b3c93827de8275b6ee5b457e38269be19f116ab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d9bec7a7544efa98a70c1be8543d897a9015fc1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15cd82d1cfc515d9560793aa8693af282514e293269d1266eae82465a49ffc00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67a46375f8ebcdda07e5cf97bc9c474a94437da7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ea35e423239245655be85825c9c7e78bf12f3961ec166c0d9eff68d9aab78f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..981bffb3956d17af48c1c874524638e2874c5ca5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f0a00bca3ff5e0519328bb0c26ed8e9b7f9b21cba15532b2a955c54905f9f63 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e87ee95e9be6616e7d4decee9ee68efa4c66af16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7f11b441b066a1c83fbe8b086edcf74316704b63d6066278948058811e4b20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae1821cb91d4e3f599ffd65b1c3f1e7c8c6adac5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45ce9816e7d8e0360226ac8f8787b69b506195e6d7296f9fd80fd691094523f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d677f35eb17dd121f837d894eecd6095e98ef6b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56adcf7ac2e3632432b79629df9d94abe3179073bc834a8cc278290d1265e0e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c411e3257daf7e14b4107b5d7a02fe67c11b6c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:509476f708c477181cc726242c785d2dfa11ec796deb1f5bb53a12c486599614 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17b18b065f2fef8180dc88cef739ceecbcbd24b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8063e1b4be5aa92d70c7727ce2fdca30d14f7e9377ad20dd682b7da2fcffc8e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65b669c7a7fee1d11ab60780e75d58bca5506308 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31101636578437ba9ac8ea302132744cd8a9a4a08df0b9976e9316bbebcc6250 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c18dfb90858848eac8166f44265421e274eae9b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0593b780d3a78c5a5bcf7d21962cf3d5f9baddcbf0876966b740e46db4a5989 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..240a9fe62671bd858334cd27e8164683ee6a6fbe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfbd06340d3feef02f65fb505c44245065e5b8529cae85cd78bb3b9882c478f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f15fffab13e7b2a9fdb6c5703f06951bc0514312 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3ec909f1f4674394e1289e512cffbf32543767f42b74d4bc298d3273b5df2b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4c042f53a59b2f86bf717cd04a21e6a9c553e40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9b924ce7fe048b6e95f62cfdebff6b1baac7291b60c4ba92a6f86d46e1a96f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3487c0c66350288e3379def39cf70c970f208e60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b70c4856e4d4e3006ff3dc24576667dae3b8d13cfaaa331848093e5c4cf9388 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4874f19de947086f7bd00e0a9523d8b848e1f213 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81ef6b75d22c1c8f10a7c6d4b0b3c0a460c65c0f27abda990379aef30d7f42e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b149a2af239bb3a52ff6f15ef45f289065158fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24843ee29b470ae7dfa680f2fc6718bf776dd7d76cafa0736928ffeef65fcb50 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b29a155fee5849fa97cbe0e0b7dc953f89428356 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3818559abfd1bab003f88c058ec7817aa83192a1011e915d7597b096d9f12121 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..689f85a2ff4719d937af82a80a89ec5504273d9f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769e9790901df5118d2af2d81c32504c2b8788b34b00c519cc7dfe907f3c2626 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce861b0532c1e76ff094fac4016b05831d60da49 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b90fa399427a43226bad45de50f9bf270df22aecb75aa8c0b28eb28abe678f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f085972b1485267832d43baa0470bdb5a13ae3b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c23c7cb1f774e470acabef81b1c760fa6004d3a5a8c5a7b0ea1a31b419eb9f3d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6116458d2573cc1a0195955af660bb13a2f857da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8a07005173e28fcaeab5ac424ff0ed373ce7846f7469a6c2505c0c9f26e2e6a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90454d8fa89daba03e8b30a4840282f28637165f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19b03a7ca820feeacc78303998e5f618c35d40e875e2233f5829d2b850189262 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..231ac72a122030ff7a60e339461721116c587cc2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:753f90dc737426910215f6d0635333dc8ba29d770f9d5829c125dca923c25d6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8538bb2460953e2bb394e103cbb31aa83a8eae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686aaf2ae062a85d4ea36d0a784a139cf598fb4535b26ff2fd8ff58e84cd7d20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..375f89c01e97370610dc98a99166156b15925eb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513c7067b70d4232331f37ff3f37223154058fec5f438be87341701bd8027c89 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9136adac829093849c9eccca857a32334af3e396 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea939e7565ac997db130d59b8dbac8290c84b716c97c4e8561c7958f07c51129 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64f037318d10f8ae1c0e843ff6d5eec65783b2f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e121242d29dd61e45389d286be3c503b466cf2df6e5d9eff6e6beea7cb09560a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57373606dd3ded861da36213ed8836b2d1df3a48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019693adfb9884c258fcfa6e683f0e0c645cab859d23534480c0d507496c09c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d07bab1dd9fda633c3c9aa552a272e4bf20478ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6fec9254c5bbc0c989838c8f854412606e6300013fc4a79cb802fb66437b99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7e151ce4261f9311df7158db3be0d2116e47b9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555a7d07384f2f3cc86a979d95503c85c1177e12faa9c465fbd7bca0a4388cf9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..062a96295654553db55d6c4625aac0ad8e764b00 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90787ea6aaa8a95204c77dc83473ecc43da106685d9437691ad17295bfa46b28 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97c3e6dfaf68c4a394a6768050c5a1c2d2947573 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8545f79c1d47092c54035a86fd03a87e66e89c02a88b7a049db176d168cb39 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7796703fe4e4bcd5177fed56c204ffebb980546 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:415694e00704ca627a0df811d9851bed7f01ec4d687c5c89ab2245b0f2f6b365 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..378cfaedce9c77d523b9422abbf45eb39ebacad7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be44d28b8c091b096f82fbaf47b3a2380352b9906d47d0ccf7969f28ad445bbc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50dbcddda7f95ead14cdabb16199dfa462c1088c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf6382c90f53a46095994ea3c39c005b724fdf378586749740ea07495e1d63a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a63525a36ec4907012dc8540606f9f13ee12630e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f85565cad9c4464707122409d40b2a382a981a83dd9ed0dab9541179f50ea3d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd6150d381dd69ac9d7bec03c7724e2f0045b381 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a95f31d54ef08201d647c4659cadc8a827a54686580db945f562fcbd575d7228 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe0e5f2376a9d8fa6454deecc92bbc73232fdbb8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e5504f2684cbbb6ebe7e5a559ad132aeabcdbb63b4ab251393211aace1d6e5e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..743074fa2dbebdb4b36a07965d1d2f57cffcade7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4848bc2a15170dafe7c7c438d3472e4ae08a483e5345e3deb6cb99cf450d27c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5210ef5e0382c7c1923c1d8bc8735763716968e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:724313963459b1f48a4b6dc6720b575f1feedef6de46d922827794a029766a40 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54d67ad820d3773151c91f6c177feb4d611bc78e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0f7fb8166d902002cdc5d58f684c605709c5df96ad5517ab5ba30ef15825a6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e22680f5f65cfe3e37f8140664309cdab321c63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64515b3980a8184ee03435eb6ac3f538920612561a3c19981c036b63d9795117 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7141a140611d99ecb44b60fc70cb5cdc55d95e2f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b85a1ef05a50418721df1cb8d88f94fe9c6db94b3f2d257a0fce3805ae5ef82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c81b50a2a2a29f56e3dcb1f1faf2bb0df1389b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8437319ad9ee12f31a2515ffe172495e2997fea32ade06437cb751d78c2e7bd4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..647d4b93ca624da19b7d31d755c8cdc9dbf4df42 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:471ade2cc326a7666d58febb53da6c6e526a58b2f74e7e2eab1bf98b275e1ef8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5f0948f33a231e6c1fa9676dc63025ebd3aa24d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:602bfa590f1df1abc74609a968122078edfd4d780a84019c38e8bc12e5dce325 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b790b5ce4434fb4fa679d740b51f88659eedc84e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf75ef169fbc695ddd03718a9158eb9120780b716e9a983e5dfd3d82fd86616c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f4324e0253cf670b5fde7d8582f701b1afa043b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b5de29ecd1373af5dd3ac0122838962b7a739a9a4cdad4591463079e5721f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84fd3f64d5e09f17e784318c5556b287c2bf59f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed38e1baece1ecaa2255aec5346d7481af68c85eb2e1d4f060e30d54afa0d6aa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef85baedf7dd6d271ae9b1f832013ee27cde0eb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c021a4e0256f1ca29cdc003c744b5df5730344ebf48650873d24c25b11d8e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6fd91da4c9decf11a1795aa1cbd94e896c02ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74147b22005077276baf1cdc224998049202e9ac285bfa1819093f12c2ed602 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10e47371f79ce90de5541e521a49ecb64641e6eb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37fd7871bcb6cf10fce2babac20f661c6b8ccc47cc847f7edd9634a806c4045b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afb5edbf4017a87fac0d1441f5aceb2f1b4c503b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3cfecceb4393de8c87636b02843f3e00779a56431baba24ffd460e13e5eca48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c75052b03d82280f9623568287dd01420085d75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ba6177a8a5e2dae653819a03dc2e6f978450d358bceafea9880c1569b94890 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec58c433d1d2149ffb2ffd3156ae7f7b4ab8236 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698dbb0ef1a575417d8ed2ecee58a6616ba9e0c05507e6ad6ef8c2957dd59c6a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31b27041961aaf883747c16d68a228ae3aa5c35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7abe44232eaca9a939ed2b7ae09ee040d8424595e9b6e5b80e2e5ca6e9bf35 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3137acac28b78c96a80e8b233a1d2b4f1229e45 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffcda4e1eac763c6f0aff308c9627a4240d582d92a666bc5b3ec8ac4e44c5f53 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b77a6b5ccb6c417fbb4b2703bfa1a6d8b902654 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f89fb8cdf4e915102b25365c502b0d5c249dc4f96b3458ca6ed06f63421e6c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bff9ddda4edb40ec804cb7d96d9eabc240c4c26e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b146a63ba3f3c38a70992dd56dc237edc5fb876d7c201d843564eacbd3bab839 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c263f51a54346db2b36fda1fe886473b5a3b57e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:128b98831bcfc67e3fba5671da17f75e2bb694bdbbfb859d6a86a452654746b2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..750c0ead8c742ec5e52e26c44e3960ddd94a7b2a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a96ed44cfac9f4588e15b38fd62daa9b015b4424af886b955923c6b97f85702 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddc273630b3f8abf13b5a954c5f1c780e8ef1afe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c49dacbffe8d6a531a9bb8adf8ecb00606b82665d1af6c90a4d10a76be44657 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b2d6b06d5659d50cf0449b129ca7657a1e3a9af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:437c63a20c6b41695d785edf593a6d48e545b93de7a937cbac1c467c0c518816 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..25158f8242326a6de3322e81546f16fbbf3d38d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d01d6bbbc814a34fead733c17d4b9097b490028815eb69ac082620479cff64bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b3ab057187bd36bb17290b9022a28e20f41558c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b22b57b0f36a75a42bc541d4b25c990f6bcb93895d8a4e0e093bb88828ddb6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71a6021e10f730b1ac107ce460f68c1088c748c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b881c1eea8f134824162fbe7879a51c2eb7409dd4c4486a6c37bb1890ac4580 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4e8986c2a0600bda03020bb417ac2596dec57e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b3ef2486d6e8dba42022087e1eeaf7936d00d2ec53b88051bf75547a6e8e1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81c7706548e446d90eeada3c270718a995c1cd2f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f048a589f403afc7a8b6c3778b6394a316b250105a5a07f7eee57045583c43 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65d30944dd71857d71abffcf81edfe3fa095ddf0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e84fa8dc4a698d416b03d6863ea45ae371aaae8cc34764a256f9a3cd62d6e0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9fb4b0d01d9ed2093254243f03fdc02665fa1fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbd9b7543bbcde5d2ffa34df0178a949c4a35555f7c49352c7d76d3f525e0e3c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2af39dcedce7c52642eb16799d084ccfd76cc87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685f833acb064676f8a9e69f832311fe508d5fd5254d6fdf49d5ff77504263fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46570ac97c2eabbc72c599042a98ecea872d0611 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106745e9d3e885802f77c6da0ec8cf85df41368eda037a5cf290ac2e3ce2eea7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23b07d5dcbb2b0a851aeeaa47cbde08e7eafb53e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe7cca6c35eb4e115ee69ebe961ff09237395fe50db9a8898d4822a9f4a4bdb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe13d52912e01f935d3924b4d74a790de62c9814 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:537a51d13ebe35fdf6bbd768fc17fb0ceb61a1196e567c82bedf6346d9376b2d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71324ef13c67ae6787328e78777faf8e21fda06a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f81124a4599c6cce74b831339d2d112a33056e7a85ffde11b25e82830bbdc085 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5777cefe2ae9ed4e72768c7fbbdfa459e8d5ae5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eafdbac056478a26914c1634929696cd6680914528556ddd352592e0c33be74 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eeed8b8dd28cc035bd6da190f2a0a7f6fa79496 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dba06c83a5e600c93f5076e3934fd147e121d8386b3f1e5f20e4e9a2bf7f264 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..540198a9a58501e2ce3b3e2727cd09f3e1585498 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c854ce8ed014012650f506c7adb869a8dfd47eba71938e2d3f485cf9074adb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1628232e821511a02a21e4196f9c24b266755355 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81fc40c498d2e89d415239f5b7a2fcdac5f2eed1c78f8d10ac0212e263a6692f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71b43d44fdafa901159091f10c3580e114e36c9e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e52f83233d9d56505bb0be07a7fd8a8263947b5e67cb4f6e3cc32331d9134b4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e76ef303a11a2529d0274e05c4b2d0bf27f86d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:247529ddfc3969809bb5adb834006725e35b3f867d26b3676f6348017cdcfcf7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..22945a1efba7ff091feb71c937109983ffea0b3a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87a9aa2710d91693be89922b283e4c580217ab9bf86a727823d9ab6c356a96dc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8cfb82b112cb74b6737d6e1c239a68922fe013a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7883327b38fad1e7fe3fd2e9ed79bc62be249ad8d8538061790bac48260631f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..296c8b8966106d0989fd7e51bd50a7b619ecea9c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3105c387bb5b8870a149750e4d50dda7d99d2bef85e6b3954f452e5cd0e9d6bb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce5bc27bd7c0b4452a5b69bc4e75327d5a833cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4635b3d2a777ccf08c464832cb342a3b9d09597a5655ad19ed5289fb2b546f09 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f61b1cadd41a2c735f21c1f31166d3717eb46b8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4502149d36c69a6fdebe00f700983669fc903fc438144923e455d7db07157b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f062838755bf27a8e371f56ce25ade146a5ff058 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dfb450f45865f704599a4b814af64223c9a0645108d63d7f080a84a9fc44c65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6091165e2f3e54a8cbb8c1abe0fbf49ac2c997ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d79babab3430b3675d48cc9022d25c567bc9b034a9b3484efe0a40f380748c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..432c84ae81d41a2923388615c70fdf4cb63e30a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad35dbdd2856d55c345c30daff2c77a5d645f0e0f74446f8ee968128dd868aa9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba3bdcea9ed98bf7501c0ed49e0518fc45fa03f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb0275b8a51920ed5912b1c3afb4f1724346878d6494ebc32178ef50014f0a82 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecd3f42dc8c606618e44fa658ba08a106e2b9ec7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b10025bcf59b1f9cc14ad8661c0c66d2a6f29f2b453ba9ec611a0ccbffa993 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c017d31d4b6f15e514a18dcd9d7f27b0e8a1fce0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb429fbfea55c921ac9e65706bd70c9e2139670e7619841ddae4766f5e5097b1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e98470a883efa655a28e7814970d629e46620c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:799ea2c48d37845e0869feceda3a580e6740316763b20e1a0231ef676927ef84 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c49df691d65cebff7815ec5325419be9c6e6c11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5df51efb984fe6785355f8b5ae248302534fac5b162a426742209d7b5a7c8a41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e17d9c47242dd75694dc0fd4b79712348262754f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd66ca0c618e4827003ae38d4e3880aa332a6525e9dfa2dda42b9375b41d1693 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55195e834c9c2edd95c64a6a3de5d8820bd1d057 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d862733fa90ff783e60775f2e1a2ef80246d760964ce2cf895bf307ee839dfb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dd63a476850973279b2fd1c096b3cbe3edb437c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a030b4b4607a9a4bb5538537bde790a125da66bcc73d699b3afcd14a27bce6f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba8f8221cab6b518ebc1d0fdd78794f947149250 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263bf51fa54d6fd36b8622eb3cec9eb4fda2f0a6ee7a021fcd0111342ae4a4bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd8049d83c287162a8b55d6a4c7f0481ce83aa80 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369ec256000039b499a078d3065390968ddc93fd8bea2691b7203bcc7deb85e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dde42659da9fc3baa6b0e12dbedfd500ede0979f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c68fd9344002fb9e747bac99a24df031e84a850a83de1db71ae682438159546 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c55ca31e378a2691b632cdc4d252adf4e2fd421c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc1e0837fce7923d9b40696a11eaf27f9ccb7877210ac6d9fa5081c885d1c72 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..691a60506e9926dd76936ceb075ceeb880ca44bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ebc200c7d3c980e4fbfb2c2d69dc90d988a017d88c55027ac099d39413df8e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df9ebae6d344f27130fe5e9c37e12ef48ce69ee3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3148853e69433e114ffad8b5f6c1028c12ed1d3b4ed1e226e9cd368146053452 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b6c59b37628a4e380b4e80dff6bb29995e0d160 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c069cd1696d1281dc446a33e6d1f595ccbba2368873575bffdfa5a8ecb8b04f1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a792bb9fe6ace4a8d677e84535e7d6ead33201 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daed8dfb07ae90bcbd5363894ab56575b00ec2060b0068108221c50be6bbd4da +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d28fca87e9176ed33c462ce306f432df7ac234 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ee3653574f8e1eb61b8b4bca14cbaa3c95d611ae531c05589e109f364fcf815 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65694d7ef14533ec7c7ac1239b3b38ce8003a6bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c73d413f67e50b9af1df9df0e8c325eda4aa52f2eba5a6d2e840360bee3f9ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27d607ac0065528f62b4bfd42d6467b8640c1c35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e80f9fcd356a70c0dcc039c907d0ab2162ca35181675596405c7fbe31e4cc32 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e10939752dbf63045ae5973485a6414d7f27010 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f5fdffbdefb29e50a4e98ab25f00446fe90c0c35e505357eb4e1041f0b8a2ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26626e424e50cba4defc2b283e0d75d284396e39 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3c9ba10023380638821e62524d89edd50b4c322b52840427ff46d6c6dcbaa51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5b23395fe24ac9ce4be84b0d970d2f4f41ebd2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978083c557d3bc8ff861d9f0efd86c5d6f06e66a35eed89cd0e1fadd73194fb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..530ed6edf9eef09c4c25bcea084cddb79c2dd7ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2c8e5b8e10bf261c09057702c0cc618ef523df65bec997c03c4874fdf96b82a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43799a5a036eb37135823273ed6341b607e3501 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaea48ceb8d964c2d78fe18ff986cd8d99c4b9014d426c7a78e1d8f730c9185a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23327f5e3861ba12521cc55f7a33acc015cad567 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2391ac2b1f4fb32dc0c1d52cb1d2705119306832e36b95badef7e35a375c9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f925d838599a938ea099fe03d73cd5d0c2ba6666 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:901f80ea63f330ba5fb801a24e6e71c9f0113d8f47c2696e7501eeb3336bb612 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9fa9e86b5eaa4af02b8039db0f6452824f61a7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b9c42d3b3ad56269326f254b6e260ed664c2ea71e58f14d6e4381a4296153c2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a29bf86750f057012670ba1acea1710dc262379 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd29b40936feaa997b1ac0b4809a319c35a1ebadac17cb73c50bbb03fafaf4e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b40eb93312bdc2e3c300c9355066bea3239ce4ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0823897442c986789ee9fc276ed12f08023f56524e49fa632b1c1162065f2057 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11c2e921014608c3f4571e0518a859cabafec47e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df37da03c19fc8f89578160ad2791b9f0153fdf3106fc28cc448f0f7862e466a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eab8a62fbe874cb302acdeb2c609baecdbaa2f1c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a26bfc59734edeac71b1b3a44c2016f8359fb97afa5f8fd7f7eb66921ff6969 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91880f32d3cfe21e815d97f759a5aeb0a41ba48f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8db62c4c50f564e212f5663a572bf621d70caaacf50a35036a1c52b79d2055a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f00d5c51fc3ef8be26a3e09918ed543084c097 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4735c0c7f240896114d355e5dc6b03a040082fd0fe6a2c65c89c4513c8d92ab4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05fbb7746e3504a3c06a391d1b89c12809606c66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81798513387cc52ad62ce72f69b756c10556fd6ca1dda102bf1404052aa2b220 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e32df626573c36bee4218f60cbeb825cefc7fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:670a71d6cbc106c9cae867d969eaf3a72d1125807b995122d5c34b779f87363b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee2f64883b86a1b9969a9c9d34a4892f6f3fa9c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172b7c8652b46adb58136d5ceceea422c8445ecb18e49cb0d9c647da46aa0e98 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e965489a56455de7b8457e878b6f2dd7a7b20a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb2f605711e6cfbddeb659f9ddb4d26a80c844e01a2e2a59e564dfb8521bb593 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..423dbedf9a9282dbfe7141cd31ab269f69b8d98f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf0a3b6840470c32c45e3d135d062119a4b4927444a90f88fca2bb79756b851 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e195d20bb751148b90c92332d3d8f08c0285f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0b2d5b1f2eaa14043526dafb6f125d1abf17a1363431d92f9915e75d00e0853 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56f1ed0cb3e7e1fa3d303ea672571dded4453cd0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63dc19114ef7e94bb67d3a520fd9f9ffb8b7bfeba7f0c437b6fbd993a6cec0de +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bcb708a9e8c079e7616ab162f277f07894ae2fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baadbdb75f0bc04f282083becc537b27b948a64c7844ed6a6b21ad52a0c7c679 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..588d998e6579b3e0913993ab7b2cb639b7909f21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b049735d96835c36e90a9859480e23758b156ed0a4e26f8b710e816994f6aa8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3165ed76c8e9354bb71ee9a6e545642b32816df7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ed233b0bef43897dbfaaec27d0c0bf00230d30c346ddb21501a02e21c2fd95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb3d6e6c387a0ad251c5dc2cf250be912fdc4f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34aa6f53d95a862d8368713e8d7f23a5904dcfb2361c6352b496a99857166977 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2404cd99872401c72eaf687c50f45ffbbcd77080 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ee89490b7f9c51056f7a147c6d6907eb9b1c4a66e881b8143f1aec1de8895b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbc5332bf9b014db37a0ee30a9d8c5fb9f2e3280 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3210ebddbac63721405638493a8a6945657a498ccd71a13c15253edf1d8a6792 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec3e0c40a4efae42364b9c44621ab692b9d982bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66c492e98a8121c2b9b15f530de7c766ef2b729b0e03856bd80ecce377dc0a76 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..448b78d830dda70e8ac205685a5404edf90be240 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20a0efb7c4f7c552b771303243703c9ff52934e8167d0207b37af9705cf88d99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52b8727a0f79189186e6189e78a6197dbf2461ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22080d70f048b7830b8af2c62dd798924a43d14387aa2c23352af9ac4c75d404 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..085871b9a80e9ea73680323c905e193e89ae0ad0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2496d4f8609d4ff28b4454ecdde29a3b2fd09c3badc58643e8fdc03cc9f93b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f475b85543871b25a083d3541a34e16af9d562f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458c806561190383acaf51af4553217e6565d0bf6d106a0594ca6b297d31b49f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48498df08026ee1aba494cfc0e1298dcac457303 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78450ba6bd8dd82890cc40dddaf59f398ebbc15ea8a230a5da3ed4cc41f514ba +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..613d7dbfbbaa2630de1d389c05637f8d7cec0e94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf7cc917307303692f3e1d03b4f61bf2c5b4cfa52419a12aecc703739584b39 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76eddb71bcac8afc95c29bd5877008709ede0878 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19cdead78affb3c0a80c7e0c6e86ed7cf3acfc358b499bc58be8f2711bc81f49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a6a2a919d5de89134e3efb7d059b30696246ee4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9637cf166175fef1f0b7d9564615e1e0e305b53809da0c3c1d69cc617a914be7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d2db45e3b23fc7aa5552fcbe8088a28fe126479 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daac6cacdcf9e9132b4b2b5c3a407f7a1e6fee6d2bb5976ca3be9183ee175931 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b458fbfad39d5f114302a4c7f435564b3e71c54f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5447ac95bc85bd7daa179b9d5a05c235316c0fcb69a6db960365719d092a22d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..007c977f042fb5caf2f8c2491e6fa0692b31445c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf9036667e2af4d5c4156913431e862ccd4bf521d9798050be15a8ab307d6b39 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e48027f593d2ba621ea7ae90a7c3517f94cb83f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06abb3873dacfa9fba2cdc1f89c7d948a98838676dc84cd718879641a2a9a18e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a67365f3fb4126f85eef68da78863341dc09e4e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2b6b75176c19c7a5cbac6f0c761e2bf6e036a908f619f2b89e557f5b553f25 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30ed376f894fe4da0d47d84695b48beb2243985d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89489cb90fb3eb5e4837bb8717cc6b4124e15b2d808b2c94e7a3645370b1897 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01cf05495ff163b5ebe90dfbb82ce0a25346be0f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c54f10c9d48adfff484a3b76d07401c312d791b287d0984b8fca4de9e07c93b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08dcf7e0652e6f79a133082f4e309df7efd31b2e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80ff0839ea37fc73eba944ceb1992c69de1f149a87a4f9f6a424a82f48161a8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc74839a784d48eeffaf411d3eccfea4e2e0f95 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f25d2641b755f9b2595e835d2dec1a52cd744526893e2fadafbf6985b7be35b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..222851d568e430ec4bea3b158e3b53428e20d179 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe0571ed814850316830489cd3c7d13d6a34bfa595185d19528fcdf6919c54c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..deba89edcc0490a0ab825855974f28728e51c9d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9f6a26a1b51575437f2bb8efae1932cf540ba2ad358ef462a9c45e3f6ea41c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1ee93781dcab2779193b41ecd9f6ba023292b9c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b07529946e8205ef9fa98e9af66fe8612159ec54297e1068fe828390a4f20c02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85cc330613a46c5b3fbd6bbf27e66cf8d275e397 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49781fd0c9a5b3018e0d8ed6b64d6ee9228002c6123f131ec0be42b2af80d50b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c02b07c49203dbee0e1f0e51f1a889f4f6d48a80 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba3e7ea8be262dd953ab7029571413ee0ed7c524d5cb9fec4ecbf666adfae5ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..753abdac0c24763a3f355c09b9ffbe5e269100f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c064feaf9773919e7faceccba9409bfdef13d96e51df3ce4dfb110e2c23d5eca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8f2f580b749eb36677156155e40f646b02678c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:924d0825a099a43cda7cd9ef7d774cb9b25bbec5f52053c8a53e27423ffd041b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdafcb8e32bc89719f0a50ffa82fbcf1f0ff36e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bbde0dafe524a216e6cda49c0e707c2bfc87e5aded4c8e94e100481a5e8f15c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a8e2443aaab6bd7ba44530d57919f5883c6779b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0407e7fe03635b34137f25286a5b1b84abf75f103cf6448ec0af64484228c913 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f716a4256e660b574d2d8ebefdb217e8de7e3212 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:652cfc4df8059a964d2d05736bc6ee7424d429fbd937275abf45f034abc372e7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb7615b765307330c9c4098a9b4121bf1cd1a7c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1016b64cd963f0838ba596937cbe38cdd617d264ef764083049a010a5f9f1767 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9781579859072fab5c4f03f4173dc87d4c1a4f7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d2bfb80939e33c5fe35fe72e373bf8284774908cfaf5164b9714214372a698 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..440c51138cf7d270b3b46cbe931c67d1c96836ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68aa51ee68f0f192a374fd4d5a04b50ce2ba5755fe819f55865e9488a9bf2092 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..455cf7f8cab5c1ccd8087e48e991c3965222db7c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34aaadae1ab2e50e6592fc0b3c702be766d0fab56e9d72cbc813ee8f6f3c59b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b1bb8de2bb3a757cd90e98b15ca6c718d71411c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17243da2f29f8e2f7b85ec453b3177ad4945ef960b42204c254db69b63966484 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd5a5e5b685fdf37c8f19066f9a8c7d63ab4385c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad5c1f8cbcdd6b94dde7e8068367d94d384c3a98a349ae5fccf6eb9dd8481741 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..62cfda265b8c6a16e345cc0122bc13c176112503 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2faf6ab2f33b123c3ed1e2ca3f5c87c4fe404753302420fb87670e09184dd41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63006d2678ae422cc505fced1b712b9332c199ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29ee0e16ad7125159e7aa8936273f873c9afc96e21f9ee1fe07e3d025b061fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2533b70ec868cf9aeb87388682d4a58bf265dff8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f58218e03adc92041680aca6c2b0ba4f05d5e5f662f439a9146791af17925149 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..561ef8a7567ce977e8d06f29a262578e3c0567d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f8003f88d432dd15b1246055732e9aa8d7e82d40ba0519e6d1173dc898295c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a4143562fff642d719cf2afaf2deaed175a8e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e075dc3190dc57ac8b8e26b5296f0afb2603e061c63b33b4d1395afce2c7aaee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02df9b93dbc305e225e0abb579a1a8080f3c2cb9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba0b4ca10a9c07c7978fb15f822bdc45252f62ea082fea93304adda0ff94608 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3379b5d49d7b8c04bc5314b6c678b9c2ec0210b8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9cdfedc3e96b84a6d8ae1f82db86cf139ebcc2fd75d0df78f64d6e24be1dcc1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdcce87e791fa587d92c7716cdca7c566fcf4758 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea1f076661b36720e2597a95079545c8cef438726b925d74b9aaa214e9afeb7e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aaa2f97b42246546c5e4bc397179c487e307388 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e558430612db1f35af5e22e3e1884d4de086a96b213e2dec9d0a037f36ab1cc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c31497eb5a49ee68eeddfd3870021b96fbc70030 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075143d08071c09279d460e800efadd78ee1b059d01b5376d473ce837f309ba2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5c835c035de48512d97a70143106d85ffdcdb82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1df3ee524f3f6f5c718fda5c998982d61b7447c4171007ce6eb4c20d981e1c1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1287e652fa26a36a00f211c3cada23491caa9a52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb739d5d37e3658d0b340e3860905efe956c8527e88c1a27ea6d9e175cf029a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c012e0b859a0dd2ca70472c84e51da2d6b313d33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd422f52840a1d74798d5c08deeee336a34761a7a7efaf93e0c221e3956d5be8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4277175106e5d935de47d37bd9067d716fe7e58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d714bf4eaa1a12ea3a19b0bcfeca14b0c9d91b35e03d167030409ea09a3517 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf256c1f4222d5e975dc108c2561fcf2ce4cfa1f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6741f93e9f311efc32c2b1eeec3fd59d39917f9ea33bf950c01f2465d4dfd1af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32c20a78be7d570bc7056226dd031c90d88bcb76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0803ef040d6e67e884f0176778762da0461892202341107c7ca2c7ece40f338 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d667a0fc8da59201283a5bfc311c9fcefdb7db7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73baf498cb245a067c2ec18e3c265e1b0aa6b8cc090aa3437db1bfd106adab81 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61f050ae5ebca26bec198d30f7a8569b76d0f3dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9d19d8e634c1a78a97a23c940b18c9bd947e98c5722d7b4127a4c88b5bfcfb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48b81bfc3c9efc650009184445b2820420b1de12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a462cc068f338600cd795e1fcf7f66473cfaf3170c8c127aadd77ab65e8c9d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15fa32e0bfd63b07d967df9fc37860963bfadcaa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4cbcf4f9f9b5f81cfaa234d06e5396352af1121ee2d374daf523eb0b8ca05d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3b0b49ceba2136b29125f63cf2e069125f4e2e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3b99b6df37a4d35b613856a49225d6b9e55d955b0c7d7edc639c0b847fb109 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..021a039338078510a744260195d9fd71fbe6c10b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9329c7ddb5c19eb2c1bf020779eff37e8ff5867714bfa1e395bc6ebe1794e53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..127c6bea00424e1b8481f890a19dd810c4a4dd63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c9ffd516ffd95215f0c825db5274222fd442fd2f77f3188d76eb3cbca68879 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..547b2053938b500e4cf49a6af7c8b01ed2ee307c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9c9fe3b46e2aded7582b781645d30679279dd64cb63a6072e4f5ff1dc788b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bc6dd6ee2a7033f1246582777a8090f886ea76a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6f10379b1e8b1c0a7f096ca3b641066602f2d592be12fadf44fb5e8dceb9d24 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00dc30bb3b0f84c93e287b26e57d010006ad2460 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b4ebce59f3aa1c56786e3e4ff9937f82791228fa06fd759a42f7f74a49c2f27 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ae411364ce3bbdb29b45c01676136b11cc81036 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4adec84fded05485649d3f3ae63948c70f558ae122c5cff9e514adf8f694c4ec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34531c87e97f39c888cd48ac597d91082a618f29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdb2304256e885fd97db4d93c207f4174621aa9050929dc8881e777c29d7d438 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98192604b32e41f783c78614c1e1096f2cd13938 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84940b9c4b5fdd23da9ca7a864cfbfa839d166cfe739340ec0a223165924938a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80aed9f3fdd7a46e205bf449fad3db6f0753458a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ffcd43312399b67dc77aedebf19a3aaac6f091fab3985e8f5e511c2e049ff2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..756041302e3adfec5d912b2346e22481a0ee3360 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d71315f11c67730312e0ad1c26902d35aed77ca2d9bf987754fe92c74de0bc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7796da53e344dddee86abdad6a2a74a955676d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd6522d28d49b531e872131dea968df4590d26da7638e01534cc430598f9bb9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be930a534876a974faf6cfa4e50a4e8da18eeb3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae7ec4987e2b48077eceeef055ad25219ce18e01bbe0e02421e026fb4b6f7c37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de0fea2c762178847bc1a0720ecd87d600190973 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec35bceabc99e7e38811bef4f046fe5786447eb0659b0a465813e14b1249cb8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de413d765c511da4a2f91ffcfa9cf3285cb6fd6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa63ae65f19f85a360a56eae4b410ec4ee3bc0e26aa5ed031057294c74bdce51 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..852655018d8c6ad7f7f490024b7bed823409325d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e98ae9955232ad1c676b877d30309daa18d842181cb99d9ad31b0b7f1730e78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2743621c2fa663e7e5ea14954895713904816b3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a508e70e2c0257e750a5f15eb7e0e7ae630cf009e69267b6c0956273805ae7a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebac17c191fa6352df1fb0a3ceec0711880f15f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7eb5219c89dda6b0000b4ed1b2542ec2c245dff5f07b3e44e8ed8ba155fc05 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3d7434f8506e7f22b0fffab7417fe89668c95ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c61f8dd067556245919c49fc2d7f55fedf121f398cd1e9c6a29fc3dcebc6aed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a363016a811e01e330d51a6c4c16f9b215867c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f19b42cf0b1d3b329ebd503d3fcfecd338ddb0745efc7a7bb33a06008c41bc6c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..158b27c83e450600fcb71a063d042aa281d32b6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75afeba7d12ec24b4f88a62d45cf2d525e8b3533a6ace2eedba0be391c6e78f5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6f106f14f4589d0fcc9118e093b88827b97d1ba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7249070c014ee74026d7921764921dd025b5a1ac7c27d6482cc1a4ad8694c1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9ffbff9998bb487f5079a1e582c4cef965e06ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cddda89990030c5280b4d94bce1bfab7c40a0a72b08a2ecb046a632a9dfd8922 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9e8bdfc779e7bdc5e4a9b586793a022841e041e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8765f754390eb53cc54ae15a065b42499e49cca29685f09819f324764e192d95 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85f206a6eb8912b6dfd30b0c0222a60d7a3038dd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3147e53044d467d25f392ece5bc7d02d540b9e3bf362ec8691347e1744dbd8d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0c61e60e1eb91c5bf4d8ce4ae61c1c94a21de1f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a45e3ad073f8cc7de3e1567accd3b40d5983d98358b9bd16936a8551f141866 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c59a3b3296e51bce65a0cdf91d556061fd0fb93c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7379a83f368a30f048a94ec99749d56510c076182b4319cf3cf7a79252743300 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d39f1edc2d69ee11ad649befcdbda627681ca67 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f75ec60d0dacfb7cb021e9117c57bcae01d801d6a1665beab7cbfdd95a947357 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f535d3d8b7e8227bdc4ffb0bc5dfb9e4861b2cce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794ba437daaf7f70c4b1cec4eec6560d9e109320557b870560c469761a43e516 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3b6ab93a72fa7dfc366390ffc50e7021dbd1ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf6ddd5206ba979abfaaa9706ea423c8704fc47af49acd4a6d6a734b68e2ed1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a6cd2fba01858bdcd7d0cceab960fe2dd920fbf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1de30efc6adae3a1f25e404db58270d314c1fcf6e52c1cb3f2ca03f8941331 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21dc581128fda46dfac91eb19fafadc0213b3509 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:427580c1efe8e73f480106b5feab1611a78c570a7ed78d5330e1ff2997712695 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50e8c223cbb92a4e9b2f848e40f3a2c57a39e369 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c0b82d1064ee1a0dcb9058ce94b9f0262a5af5a5b8b8935b2a01e202978ff70 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11221b3301deb6598b11851dbeec41e8dc0f644e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ebaa2f26bd39dcf538e1fabc2218024e38028dad6ec827b2df3e6752084e1b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30cf5b5ab4c6ff0487b0bed5a7eac72b7e809a6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d07418c53b89735c67a17c68b7e9f3a5d9fea9c07ae897dde6e1aa4d512bbbf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5c992f495ed9498c76a6f486deed684dc4e5222 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3f62614fa074c1a6ff40f8c18a899390220c6b48923d983f07b0c490025d60 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a58fe0810d8f3207511122b5022226cda21c8e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db8d3cb85d58feaa1a39fdd1bec4419febefbfb478c07546d80ef089c7750673 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..811504647516d626cc1be61b7d0f986b047a6cde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9045b83d2b34bfb2fa4e89cf3177cebc1be56c2d4de5a0ffa7b62d5b0ea492ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c2e6fbb03a554094297df3654cf262980535d79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed41ec13285de495ec9bca219deed1de42950166331c68a865cdd98dd6f8d8b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47d40a453d8478db00cde61ce98980e231c40dde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf2621bac06167586b8d28ed733330ae3cc760b2e9df88a619fa2eb3ddb63b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dae5570e902c9bec08ec8415c6f42c0d1fbaf0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac3c003752c0aab3a75fced498c3f92059ff2db2801cffb0cb5627f211b040c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8778d87373199708f60638a170da4b70c58940b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80dba9a698b59ecf231da0635ccd3a31dafd9f7ffe9d53623983a0f5762f223f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99a9c7553bd73d276d974d2f1e30e489a74516e0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766702e5bc7820b71f66f4f3ced97f63f536fa1c1abb49140d12d311aaee6e02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa5a40a28ef01d1d2116b7a4f8e6f5ca03ba314c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d1a7023bd1d40d697f6f3b556fc05294d5912cf2aa7a095a2da22a51a2695f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8745c1c90a8d0052346aee139033acc350dcaee6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e76589a2ff6665d0a5365e32d3c1be9c501db6afa029afc7b85540cb89120f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..100046d5371fba5782a265a3238c7bd7c652737d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04e59ca14bb5b5470f55946191c1568086889de8af583fefa9113c57f9842f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c619c4bc6c4b01c953a6ff6aced9d06a804d48 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26c5765116872a714101b025ea210aa9a7e4cbc2c855d9260eaf502d219391d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea5a47d093c9a9ef0c8b06505a380379988fa3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4b911c54f1065abc8618d000961320046e1271898843b05ff13d7519850e9fc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a06ee8c2c63aaf0b1e9cc9a0eb4859a169a0497 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced81f89c1ea7c49a3b2d33cfec4323e6403076f746297c36063d5672903bc6d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c81eaf76806edeba31e86abd4237ec8bf08a41c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e53b0cf57440b75424945f3fd55bb1ddba93d9321e2f056056c1d950d0c726bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..263b2b98bcb69ff36d434732fa45e89a36600db8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd1761dbc3012aca76a79d999ae25e172b5637794149a87feeb9c9c3e56b8d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e377e31da2b47ebd21c80ccc46572b9438507302 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1d1b48f60b2fbe778f1652243fbe7ad6f2ed4bf46c0fe456e4c3710a69dcf84 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..306d4ccfd3a2571468cdcc92dfc6a0bf629ea89b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd95c31665c82148441fa55409deb6c866a1d2273cf943526fe070c9bc548fd5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41426e40258d25c80d6cc0b539274f0d2ccff797 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5783dcbd96ea5e5141044267d063b7a49b1e185c8bc0d961128b931985b7492c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7fe62ffa9c3914950f7cc46437b341ed1e4203f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1d7577b8e86e1f5a375b9218237923ccc54005941f46b2c2e110bb2fe6fd73 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aae1b5061d58312b22e8813893d31bb30af46eeb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de04e938d36982e14d23b0846e3f552e54d5d69808931714f0b5c4321e8a228b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dc2888e92c43a26eb64d862be88de2c87ec3317 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4090c233c9825d20d2c069aae4ea34fefd1e698bb7bf748a29f04093192f420 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0adcce110418baa1467e37bf81e8c9eaf567fe38 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e194da7e6d6ff9c02727a3ff064862a72d5d53ca53ab9529e838bcb0841a80f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66b8899afcda294cd7cf0693089c2fb1c871f839 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:885bffea3d4e3729e64d342bd0d4ed8ca28694d8ddd9b2b8c1abb911943553eb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9cd972738f44ea32338f1b3b966ecb18bf461ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb06f3f0bec5302d07e17d826683ff52946609c6c2f2297047f92334c6318b89 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9966f70e1fabc02c4dd0cd7787313c26a829be02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:169d776e26c03f371f6aa3cb0a06f594f6a70b2060d929678a18d624a1d2afb8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0c00ad2c02844269aab0413e5b74176480d2b2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783c51db49f669933a56c8e322b548d077f2e3ed92c2d6c47160dc6534c91ad2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eafe513e634d7675acd311b3a01aaba323a17e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1636a75f1e9df271721be43813de221d8fbc9ace10843e8d359f5c167a1749 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd12810d5a4f570368a49de4825aa98d9a671d05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce00f0e7becfb27916e1aa893fd9c36e8b7d5b9280f237eb71a97b68555b3ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53868ac130613f51ffa43ff3cc06e1aa8e7f7a35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9dc054fafe45ecace69bbbedad708c706cf6bc60534b6dd9c773d9d5a48b432 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6e8c4d8bb1536566c625a0923835c05df7dcd7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff5034c014e0c2016c8fb319abbf37adfdacaddb5fd9a40228cf0bb32e8090d5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64748e14a359e2182f013300d65c559e117fbbdf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49028afc60585a3310bcb351bddf6073af4f9690ac8a9be81ca646fcb0414869 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..717238e8784c7ae6b52c92cd102a326173774429 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b62d65ab6a3d9d198578d97c92fdff57cf46f0bf37e977a047925b74abf98f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa351f902367c94ada7a233b2676def8186a1909 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058fe40ad597f6d2f23c0fb2981eb5f4234018af1ca2334d5ac7578a78e55eae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5780d671331f0cba06c051ec45a452fffe5e8c0c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c6e1809a4ab98ba1726c7045c902e6634e22cd38b1b8597537d3054397ceacd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4238a6e362e3f9e94a91fe246bc3ae508f65ab20 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a6b36b5324910b320651c23f2e83c7a56aef1f8e2322c82948d54937b7c0c8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c884c4b1400e858871371e2339ab26e06c8b4049 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3118b92414d4e200a5aa0d97485a80b48d64db05200b52fa98f3aca2fa55395 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c18672234f4af940dfd10d859585834b31b5ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773ea9fba0fb9f7a0ced9a8520f9bc3438dbeea90ef42133afc20b00ac30dce1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4112f57e8c1e797722a86dda91587515261bbfa9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:689c766b1fba162b9505f3ef066efb5397a151a7f0502703a6d2f543cb55c3d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de6f37c81f7c6eb7e82d8042b2a75cecaba6470e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b0b0e3e9bda7f8b87b0f04daca0b9d7846d99ab416c099569d2becd4b3c85e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a80b14c9fcd60be2e13d408ab63fa855571aa31f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d453770be900483e060fa4cc519f403b30256a9fcaf8f7e2e3973462cbd1d2f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bf50bed074857552a81bd3fbdb7c27875eb9cf3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c8fe4d185f4285fad02fba9429c34893ea05051f1ef28b62ae876704296605 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..809366894debea6f66ea8478efdbe5233ef95879 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a556fb291172dad8ce29186ead7d337e0fd7b99b555829edca9d79c6747b7048 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87de894556224cb8cf9ba94bc8c5b900c3f1b66e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2a1cf3ad2d86e446889d1592fd3046930bb1eb50099de37fa2580a3713d53e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0a94be0313b6f3846cc754c949adce80d485b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28ba8f4e7ffad57807f4cf2e45c7b8838e0ac3399b11cb63e07c70dbf689a6e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a0f855437903aa0925728dfc6d2b7b2d90e0aba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade9b1d806bd855366aa16ecfaf52f2851101d87f19d3b8727927434981f355a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34597726d7ba801e0c2e9e20805c480807ff04e9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0f976d83a01b53a3cb482e9abdb51edf2b699c7a8a7fc9cf9e287deb64adcc6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7ede08722a1d67b4c8353ffa3de6a78041681a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8568390165409b811009dceb56d5d5b6056028f1b19f68f82ead144357667e17 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40568fafe40240850e456e2fe21df2feb29d371f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154c87e707e1b13f9146fd88a85b150209b543aa45ca4b9a1f617ca53baad7d7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85e2a4eb251ab76b738ff2fba4d30941f9d0cc0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:def61b47b715d29d4ccd6abc8e7a03966b4ae78533cf544d5cc7099b6e996400 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f5016e578b87e325c3a4f7864759400f108e0d9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3ccb10a5686e5fa4dfe74ceb70756f5127aef5a6c92c3231eda514359f79327 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..43e06306d0231d6ab042aaf8d95a21d52de30304 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e0bee5e0b24d1d9b7036a42714a88db390b64d2eefaa34e1a21a794de27e90 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c843d5122582922e2015d45aee3e7464b631e353 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e515612b5b3d2c27961e759d6337fed47a3c136086d4ff0c84dc03471e3ac690 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dad31282986e83679376ab8f23ca4d485b798b07 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d63034d1304668a90d30c04e0b3cbecd95ae3346a99c556675d207e6794aa4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23c12401d43b999998e1022e6ea97afd50078972 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c95642b6a55261c330b05b0f1a203bda951ec99acdec1050f1ea16ab6cdfaf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1d382b25596eb91b0b90822c819c7679cb26064 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc5c369d2f511efa45c2cebb2070ca181d88d6ae39579b1a6fbbcb56b072164 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..953e6b9ca16e5ff617cb179e49e3b62fc33f9005 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d57fc15bbe96496b580e1aeaf4e871c4c49dbfe7c8dd9990ee20d7cfa99fee99 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c4a62f8ed4fe017dea8a526ac0c0d8c8d42d819 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0814352daad7c53fdc67dd1c48f605d42bbc212d936ac55acbd79d2eaa2d2c9e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..227157b5bb668b843013053c5b28949378fd6a39 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96ce89b696f853d36d6f303220f695efca40be91689415a26df3fa6c0b38d04 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d6f94c81cdbfe60e3cce544f86f02a37bd2ec11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be117ae230bfe85431b3861e0aa5a74835b41839f3925f537cdac195206b206f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..933f3d9d7802f1dfade04ea15dd57587ca3cf374 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf1c8b7fea15ddad72eb74384abc233df3c8de2964a329c4ae75d3b7a9e18fb2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..456277b04fe998d1cbeaf2526b015809b17af617 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63cd49e1afa85e1d98b074024301ed504c2ae80182c012f90830ed8e593346b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47f2cd56ce7b5280cae1ae60b35313947f2453ee --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d1151dc0ad0733cb296082c32ce79cec3a513f58c8e6e6b58e68effc079666 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a66062a7e6380b846e226545de14b8e1c31b305 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c743ff23f9492bdbda88661f39af473ea7745dd39bab89a3d7c8f3def635ba3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0f8fe718ead957acfbdc4d5362ceb7f408cfb35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aee615440d6b6797741f42c2e73571ace3930ab237a38d35478b8e21669f7b49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f33ad059a519eea864695956a5a84147aaa05bed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed3aae9f05edd43138b414eff7bbaae6a88328e7ce4412162d4a4470035db7c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09c09038ad259f2c30d54b35e7fc7cc1b8ad846e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11bc8e48bbf1fd5199940b43ae631e00cdf858761fdd8a4caedae8249baa91d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c3c5796005229dcf9cce736e25e6b74f354cb61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1accbaabc77b4f095638f86fd0cf0db2d7d2928f1fc0afe291b2ab9a6b9b757 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ae1187f5891f27e7ea48e01fe8962e320f5d797 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee315b99c72bfc7252e8d6420169cc1d5f9a183e8b558d0a5055088ed6df8fec +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c73acbc2195e7ddc9f8670e160958e3a9a9edfc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d753ac95bc1259b907bde449d820d6bd0a3e9117674bc367576a3030c87311 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76a71e8fbed9f33426a9b56a80872ad81f8a1b17 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae8f3b27e8a56f37c151a78af930b7b747d699c57e82fe9488fe49a8bdf26bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..385f71aaf37032188a57e8113e6b4bebc58eeab6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98fab21aaa59b1e455f5b414250f0b217fa107965d3d6bf33d57be5cb738f2ad +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa969886140932f22ac8b33a382f9376acd94c40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece54bb4632c102d3408631568f9df45d039f34c8d0cc7d969814a9697f4977e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d8b2b00212812e9502934335892f813f6b5586 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f69c56fb81786409212150b17db6b0bddb85c7705933ce3a6d45254cb827dd64 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac83ad89a431714f1742ac5811a2f9d6b2ee407 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9f39d1261aeebe404453cd4cca446f39a4defdffcf03eceb4617fe31a403919 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..015c050a3f6704dbb644e3f5b5e1dd76960fc2db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d86cdb02bb168f7309abd4bf7ee9050c84f9c28853438876dec13269778e20a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df79387b195d48814df239f074c9ba377d843638 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5955c10bb6cdd84e6b9143d647a4693ed8fe5ba35689fef5d842602b64e8d2f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..651d7422363290be6e643bd24bed4931ffcb6329 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ca85406c6f11fc058dcc3a5efc759d0b7be963864e375b2410deabba095e26 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..140cc7c15b45f33747b988f549b1c0ebcc7cbf65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8ca437a3cf0c1da03d79dfbfde018c9654e6f4eb50a77e656f905b1b0cc8f15 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd1e2c4122a0df7939896d87329036a11439b543 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21f654fcee7426eb65873da4be127c015cdd69dff470ed8db9bdd6110c121c19 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e2f9f2938d89d9c5e72cd1fdd0efd082fc4d072 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee2bee7154b3acddabfc76ecdd383828e2e26b18084393c24730fc1acc36535 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..709e8920dc7f9fa81149fea2492519e010a87d7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c7612bbf321965de10406e5f8ff382cf8eae22efb94fafa059115a68e6e5a48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4e7833302a4851a90567302f8bcb20bb6977eeb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e762f1946a39088fa8cf64fbaa48a46435a6c74fea1d87368a4fd29d337d586 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1812cd1023c3f5d74e7932a061eecc9105a15ac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2004b9a8b777565560adf86b37bc0c5468b26b1aa7cc57e5285fa9b01fc42bfc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65e299b1b60a7783f88759769efb222632144d25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd8fe8966bd775ab8c03c9215d9589df2b59bbbdc003e99c0dbcfe4dd9e6d4ed +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9ed2b32fd9341bae53b87003e4826e3846f88f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0653264fb8338ec5f2f3b43d9f8bb58512022b9386a30471a162a931e3f63e06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e30c5f90b397ede19d985669405bf9c37b5c799a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e97cd6520bd15195235725a2c908e8032eac2a3ceeb8d537011d8575ff92ece3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..12e8f4cb4b951587473d91685d95b347c32e683b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ed76c644d201527b1f6228ca2ac11b477c22d70aac656829d1c6c0b7c71dfa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..241ed501fcc5f65c6b4bffa26e2ce194bc2dd6d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1bbf03b89b9a54fef7a1c7e14c0e61ba5dc2c172172cc62786c9dce2872cb3a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b91570f73f127eebd9e575ab2c752d44cfa732 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:942625d5113b959a32d388226ddeda2fa35dd92d295163e41f6c4986957f38ed +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a7f6455a1a59d0014abe5bf1f8fa420357e404 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6263a0854000ca454d1714bb17294c21a690e328bc917b9bcf3f1228d3b2b78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..745549c59b677866589414eaa4a161cf3253455f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68b94c8319a3adf4acfbde3dd1a1b2c180ca400a6f2d86cefa7660e842ecce4b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9db12be96cd6753fe534588630ca7e47276980d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075c5445f9218c2ac69af13f3192bcd6163274c989467c81275a26a49e0ceeaf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..066c82c7e5c3aea6757fbdbf4fbce345c8abbb35 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e8eb769431302e1191f28824bac20992a8fd044301c69ab00d899a6e7367c7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cee63796f2bd5d718dea4af24f338729dca9f145 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd3d54a936ff69dcda9d534e061522ee807785ad8b2acdddcd0634b144b539cc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e47ebd376faacd9ca82ac7b3138a0c0719605ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21654e074ad69cc8bc05fcc51d4c2cb728140a113c8730dd31fa7b27e82166b7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7605bd4e10576674e9e1185ad21f7c1693bd0f9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40c100697d73f12463e2fd5b7943bea0e6fd94bd2f0c33ecdcddfa81d56a6128 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eff45eba46da89846f418cb0eac439614cf2485 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:449e25ab579c49530323e0825ec76d06842a220d41795dbbf103f7b100bc46cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9f9e0add791636df7ee2004899a04a29a90bbf1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d49b1a1a5abd5fd8ef8987ecb7a482658bc6d660168e6d393762ce8779eb66 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7720fde53771cbabfbaeb50072d5d17cc1bb092d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35456c6fef9a95047b97a9666cafb816f2956a83271312cf42399dfc2b26b75 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f851e72acfb84cb3838fe3c8359b85e6731818c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b489be4f42a68bc03d34a98547984e83ad90ceadf7c3ae2013e56eecaa7b74 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91c87f776014c37aa00f58bc94153330e2cd470c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbd819bf6c2f1040dba6bd8d3b6504685fb4b1ccc785f3ce5987c6455cd8355d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a26a7ab37286b2dd737fde0d4f0b8d2b1f57a1bc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5891d053b8b8c9256059cdfbbcfae65df271467bf4bfdce5d8316afa4817a1d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ead60874e1ed401764fa894577b1b1ba8415da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630aa80bb21364c045744fa266fac6b708414affbb07ff9bb3b18cd556ab8f57 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9126efefd9d776be72a85ec9bd4af921eecb3a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1592d73a510f760c48829ea1245ebe792d41f96896990bebec094973f27d19c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fd29b0316e864c0d8b8ba5b06f563efc75c04d7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303180ad594fb1bb6bc133ccbe5b33efdc318af221b544d86f6ab23e45cfa6a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5edabafc18723ef99e1f559f1d94f4786e16024b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872e957320beb210d43da03b8df760db3163d8b60f667c621cee8950a7bef38c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2869fd4144dc7ae5da79e9b1e383deb8f86f2a3d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6182ccd6403b4b1afa141ad99e241b289f3fa818fe5c1cbe86d690ad7ec19db +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fdc04efc723d622617856e2cc2e17057bd703e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf7f4eb1c4d3a451e5d642a586529a26c70a21ffb7659db043a68004f0b77a36 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..997c516a8a256189f3b87eb0d0770b9b78c434c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2aa48ddc8788fafb5ba996d2176047f96e7bab3ae9147139dc34f08e4972fc6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..819096620d7e43e9313dcad8280e50c2ab556dcf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e2a4c444b4d82a01e6321f7603ca75080d63907b02719348af8dd2b7d37b4d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9554ffc9b885853f2bacb0ed5ab7d0c47f4a759a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d13af8cf1f3fcde195b06ad5971e6b7605d26a8b4200a721e2f26251ec859a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da017df7e0519ebb0835ec15efa6b38f2d2515f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d97f710a8206576b637e391fcc98694d0cc20de899e9f5338237d8c760f01a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f12e0ad7b6e39032b1957d6a1a67bf70660192b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf769f039f6904c58e60a70fbf38e418b967caa993e69945a80babc2a0181e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66506fee94ca890387411a25bafeaa1d24bfff37 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd527445e713e6d381ad5346700e197d657fb6b215bbe46ab7c3a2d709be5c71 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec751ddbdc704a2ddffb0e0a877041c2a628c0cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f9a9ebe8c17ebda5d2db8fea5b3625eea25e69095f257d36b260170d714b7e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..895c8c5757df4ae1f0c9fb5a8fff27b67343a04f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8123fc77f3e75a86a042d5ec538cbfdc8d2fdb9f9c4f24ab28e5e97249d17fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14fe01788bba95cf424d75df55a9447c8bbc56a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f4f894d7a2a09d023e1cbeed2cfbcd4228734c72701ff1f7ee7df43721c7e21 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee3348d20b2e1cd6956c62eddfd82b4711e8df9f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a56092ca914f5c3b73200c9e41a7c63208005c7a789dde22b5e20440340d83c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..18da5b99e7d1464b688f76bae01a7a83944b3378 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5390f8583f1f31b88eb2c14a3ad14a836f16912534978772a58a290a23c74174 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e3ff50194698c5e9e71636b132e307946b8d69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f9356d991beebcc226c91ed12155096fa8553cf45c497cd4c7764d1338cc6ef +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64f395520707b5916b38c49c9fb0c3e11aff7de7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:989f4c8250452f22e5260e361600021968a7a14cb0d03d6513c2fefd73f2391c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..835cf5e5c0c69f01de46985466307102dce3dc21 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376230548df9441f53707921d0b2663134bc1b6c0de2c883b10dc2a1ddb698c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1606009c6045e6fd6ac3d43efbc21cebc1256a70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15940e8528524aaf490ea451b2d5f93a49810007bc44995e6ba8b9e1575abc36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7e53c374708518382507d16e20794bd02ff6dbd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1714d385c4c1acd8495908bb82408eafb563f9677f8e89be4108ef7e41349406 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9670cf20257968dd154cb0929bd271f66868cad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ae5fb856a37bc87f5ffdc2794f7156a9c1179be06f143bd511b66f8f5d7376d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afca302554c2938d998e92580d54bff0c3ee20fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c0a3bec6f496ff222aadfcc3b73e4b1bda1d9e1e5b645ee871d4d6cfd59f9f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38f432ec9d6de4477b3fcb30dedf67686238eff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fdbe22249f4d41d284189873496696d9689fcc2f85c91fc7207763bf49faacb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb446832764e6b93905692213dfe1737f972fbab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8335badf770e1bb217aad8c2c402db8b4b50d2b11577d9f35e201069e2cf551 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a13f096a0a7c689926c104c4abad1c749943eaa4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5033d30f3b1621485e4f5767d4db30450ed289d37631f27b74690ef4ec7727da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac9c6387f82e6c321d340743f884abca3eb64275 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58f90d6a920a409ee510f5dc4f234b095dcb25298d0a4597795fad5aabd713fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf470372df51cd7250f81870d8ca4e7e76251f81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c8e4b8aa8cacc8455499401007f4f7ff9fb19b543f071dc49608a55666e30c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7409bb9f160295e9c968f9b52dd033fa567d229 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65ad67d4846559e85ce353860b96da23f481cf4e46bf5ae9466d652e768f484f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f023327415b048fe2a526cfafa46d2bc30df7eda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e8ff0f7201e55610aff11ed261f25a0e13cbfaa5f5991c0e41e9c64c9e687b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8471ed0d07b52013bd3fdcb8609427e014e00ab4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91569a3e3e518dd04392060c30594b7eedfc2940712b3eee4de01c60921b498 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3797a97f73bd24cce785deb8c9a094ceac48c354 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73423f12b023ff6636f42b01fc3c659d91063dc0a4d380b5dc14197f680dbf2e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c2765c3fef61faa06d58706cfc6c61bec3846f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b88e240347332d6b7561060c5678fbc5af0120dc8ccae555d55227bdd3ad85 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a56053e1b5a946596280c0a95a3059d5d915ea39 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fa43ae6ae37c2c9167145b3d5f4874c973a81c99a922d03460028bb9d3963d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d7795c875919ad828b25a5995b2ddc66e116e7b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621bb78f080de15f138c6ebbd8ef4152c2f524d781130b7013b953c2c933b0f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..653c33e6edac0e08c7310403b0786e4d41355f78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d39a9a96d1fe2e3143750a29d884bed3f32b1c4ca10c31e3355ae8230181ca8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d198a3a5552329b875246d643d4718f0ff10449 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f06a4ec272bd206488c69618c160bb47f060e0ed84bcda0759f5bac53077824 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400db19f5ed8262fa7c709e7654be51177825042 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330c20a170972e652ca066a6bafa87242b23e3c36bc7bb4852c9c338df61dd64 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeef43921c2983dbbefb7138795bbbbec340689b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11bd78e8cf930ef7c11a573f9636f3d8cd4dd732acd19a3d4bd114bfe756c8fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af6dac761b2760237be1577890cb456c28fc224 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:882579729075f8cc64f88ff87bf83b4c63bef87bca371d3edfdab00bb14bf98b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe4380410bbd4e94c791ed0fa3dd82b19daa9f3e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555336ddec7037c8c1a2408d5ad3ef6ca79deab1e24e3b385328341c1e80df86 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..604deeb9978b557da3ecdd215c7e2effd995d076 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:514b4ec5e0da34345bca288dc99f420f605868f69c05212a856d47284fee99af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..836bb0bc46d3e55638c9a8fc80d5d5b8ab8c3d40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0a0500717f2dbe2dc098b3facd924205b13ec4ad411531a22db4f93e2cb16b3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..136e1a84e41d576c1b13325276df71d6678903e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b8016ccf92fc2946cb2d6030640441766205c9eff706009c755b4a33d07f14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c499139184d9d719b97c510f9c089a7939a72799 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c32d6501898944b07591ac9b09d0b663aae94bdbae8c2f2cc80a9eef8c8632 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4d5c252cbc1dc90451052ee40c9654043609df7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9fb674830e24d88f795df16dacf52bde3e2d2d92a3a23a4f3b0b64ba46b26a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75da69db4464ab12a1f0f37fe6bea20e9df7ef5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a15d3b222d6cd13ae04035b64c5df22afd44d9ce1781bfdf6b3e9177458602d4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07af214770000f83f76863d2f3cbd847b3abe95f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2725772e941d4fb6bce263cc42442d077e251c6d61b363192ca543e59dd256b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..191eb06a8c697a5620a4828100d83a37330fb75b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bdfacb423da253a70cbb48656ccaabde250e737a6bf7240a5d821ccb40f5564 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb5e30034acdff0384be7f06f532c568430a23c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ea538ffc5768cc1b2d6c0d09171071612edbc3f12962619b835caba91d7d52 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed3e8f27850a093635d125953f2b99a5ea8bc54 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_3/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd9dea4e4e05202f631f74f9b378e2a1f8403da1ad3359ddd2d7ff66a352ccd0 +size 11395