diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbde22a67f38c13ab7b5b874ba632f482c48eff6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51485fdd834ec63e996031ce16fc2da544bb5d1ecd5ab2b227af205859aabf6d +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e8671fdc4d1a973d6001a8f8691976caf55103e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf702ae34ddf73874c1c829204d31439eb4375080e7efeae3eb5b930deecaa3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18a7bb29d58f707487cdaa76e0bea47bf961cce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8276e092eed6f22c5dcb8dd751284721b48c0388355a6a79d8d2de161e478f2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98f4c51f8b9682cd29154f8549861462ea602480 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0eed194bcac6630ee4f2efe7edc966c6e150b8db4ac2ffed12cb78663be9db8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7614f0ab8ef3030fb75d6c65e385d2ab54923082 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70994f35ec110776ceefceec2750ea5fd8f15f53e9b548caca307953c4f7132 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa77b44c121a3897c773c9b00946dea3df8be546 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ee967f3ac03f11b0b3d3d1e45fcc19e353c682c08241c32f409ce03651a073 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..222f18789689ad294a147554204f15244a2323ce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee3929ec1023b1a9ef82aa34228806934aba115f6fc3a45fb6a7afc191b96777 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a1a4503d850a909d7f74a23696c4a42895cc277 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ddc206e5d38a66246b315e02136cd78bf7cba78204233b9e13289dc766a12c6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f8aa53262c4591695050a770513388b07eaa146 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da36ea30db3629b87f007fa2b5e3425891b936071bb371ab6a452981024a6495 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6362560085b3cd9a6d679fbd7d5f6ff0fb3bdc1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f90f2d641ffbbd7626667a456476a291c4f9d6f51c024801d54d2adf2c37d14 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90779bcaff825e06cbcc84edd07545d91942b468 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8710183d376e4e861f1ee2f17ac5c0d6711466614e6370e3cf8efc12db0525 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e41a1436d23c2f990eda9f1ddd0b4a54ad6c288 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdeb8619c9c4a9212d727f9c0eaed34ccb32739c13b2936c99c46990e72ae66c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f679e018edd4681ee52857baf8bbb7c89d355deb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d15d06190c26cc906e277c3fefefa30849564d4af99b1d9bcf8f7b8e094797c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d87aa17a511e40f915ac58274856f096be61cdc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b26a5fa97df45a9f6d8c053be8d927b571d7792a6dbcf7421048f04c45759a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf13d67770c53be912920ee5d7cfc5fb482ec04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dcd9207067fc32cdc6e3998c555d9287395bd54e519c2cbc95ddf6a7542ba1a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..25955c6614b787f7b7c2d46db1c132a9ed336851 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b4b5f9c7450124398ad28307dc259c67c5070b2766e6c378cf6897f6f70dc9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84f5914d3bf59ab20c87d402c36c8c1907e004ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0da647c08e70a69c7cbb71c29210b22bee04ca1fb5c475404b012acfc454f135 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85863ac7e58bdfb5e7d7c74f3b4f00527cb18c92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5aa8fdf09601e39659665b9c285e1b9c431d60936ba5018ee40ff8cadc71474 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9273c23c23f1aa93967e0cda1f351ebcbbc1c3b1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92b3de360c74d04be4ec7dd3f70c8321efe28680fb4e3d4d003c15601741bda +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7b8384357bb9e7de2862823ae4931f57d02ef4c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206fc3b99a0453e9d5dd81957617896bfce4407d17aeca33595f8dceb95667b7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e39a1ee47b928d6eaa8a0fb04bd1c03b4c5412 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993636e5eaaf8df06503b4286acfcb16a20e5ed30beb75c4e432e302b7b98bd4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2638f5462981de6dc715f44479cf41f7a19582c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf4db318fcdbd0605a42042459488def58bee224ae6b3a935dc0159de28f05f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be8d480b8043d245556350060b2a1dc7c63c3cdf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20656788b8fa44afcb2501702b775b53aa9d0516dbbeaccee6d8bd8770edbb2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..abf518c6414bb5a999dee4c6344b22f2da1b2541 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8ae3dc765858513db1a2e60fcb2fd19f7351a8a44a3b14485d79cc257dc3d3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd746e27c81910c4f104f5480f75b1c845af3fe4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d647be3c28b4f760069595a2c2bc9f1ea8c612e103199287e796708a01f331 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0999b3d11b13292045ffd297a57afd32aeef97f2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cec95e4363bfe473cfa81906a76fdff8575f242e25fb1bc7adeb06f777af3e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c3b5d20bfced920300a8c514b8664502a82598 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efdb363078c957df94c9ede3462dea93483360959db371cfe23641d098165145 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9395d3b36213e11f87d018be568bb0ff4fe11c65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb64e770dc42e846c3d9c53346991fede52c4fc3378b84ccc91ac56eec72fd8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fcaaac13a787e0a069ddb95bca93d51aabea85e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51289d6187fa3dab72f4c6cf1f5c7f05e50d288d24be2734387b05c36753c5b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2efe1aed25380a8bbcc208a53605d55c030b863 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3724ba721e1c61cda247a6d461fb650609b7dccf976f5646b9f9864fc896dd14 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d40d8b1ec85b56271dec89a525b0a155d75f29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f97bbe3b6912ce3baf57c39c277cc710ab6d0e9c3e97aa3ada5884766d6d1043 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a0f700e06574145ba2aa4ebf7af5f8ef5aca130 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7250c17d8625abc4651d7fd7784cf7fb00f7bb631ab7457c8fc6d02c31a73390 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..331f77e3032346b414befccfe2c3a66e55be6bc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee8c7f5448a71bece7dd7f898ff11d173bf0127f7f6195d27accd648e3304aee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d07e453fc3af2636a52439c17e5b85fec3734630 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32510ebf38c7e7bf6533a189c4543609c3776ef116e3e496cc51160bc1206e13 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58bfe3a4da7a8f3257e9210aec3b565663a679a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce18d51f320c081c1f68d7ca41981bb5195b102a6d88c8901e59e1dc76b08e5b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b7e5f8c11bb42e54e29e9ad590c2d30d1f1c620 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a317adb9ae44aec9654ab58b6dfe57b029a206b466c12f3ef38f2ad8a1899ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ecbd0f9b1a6dd1f147112f0e590cccd11c2e09e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b173ead5d708b3711b5ac0e52c5f33dab59b2998d54d27c46fab8c97487cff9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bad6d2ef980afe2e5d37be513ffae78e79ce7c39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246ec505669b56dc2ded7282a55785d18442560aa358de6668c16ee4c34cb0be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4f54820aa8c00d69c1759fe96dc5d41bdaeb93a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18390084eb1219b4f84ddaf3a616d1e44694071cd783212004e9942c910a1a8a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94a5079d6203fc79a3844689f298df17de5603df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4fd147594ec706e3a85719b2a3d9f6398e01e173e075041262de2b4282f8364 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5dd7efca81b2690acb2cbea7389475d00642667 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ffcaf83bc9b9dc3bb575b23ba24d90a2e91c848073989ebb69780a996a0ebf0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61d744160fe24adaa34c474f48ec4840dd7ccc28 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c233ec24b119936627e9e74cce545a659031f4930548306882a5b04961848db4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..416be1aee38174239f74b2b6f2fe31e111f61673 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4179f4ae88598c35cb0efc8e7b1dafddb73d80cdeaf221240e7ecfc376c5bb9c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1eec6c6ca03d7874318cd71aada4cb93da9936a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac2e81073b242fc2149bc08f2c4eb94b7064346d8e6eb723d82c1df276d06ca5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd86271d658681ed58fdf65d67ecec58c9914b02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5730749955a3c92d5a960162836a5f8ad5b9aa35d091152f49d1237df86be6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57829412fe5175326d9c152211e9d1bb29fefff1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb03805d84b3502612695c4593228659a26302f3b0b7dc17ef4dfb55228355cd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90958fa0052597eb386ad44b837c8fcfc58ec22b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02cb4a42ab119f9ede9c9e208a3a92df80c5dfae8b65c18bee0856a691061bf0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64aa8b4251d86d7e12d5b562829aad3598f952f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d26aa0c85dacbd1de91c2dbfaa639fc4396375f54ad7b2c099de0b97496941 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..291dcd37edb017b46abbcc28fecf313f896b18e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f030a4d06289072ad2451052b18e62ec05b5858c6fbae6bbe066f86feebade2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..234d008e3de6193d9fada6caad0bd88456f53ca9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f7f69df0a8495a233b7fb43f1f9774d481efc231491c157b69891eadf1ae36 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a843eb3f70105d8ca4fc1baa8ce295ecf6cc112 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e31ef9184e71de77dfff3ac17306555625a60a9c9792985717af1641097ec01e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff9ce427dbcd9852aed35aa98eb5e22ae157d7ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6990b42183873b16177d138f63c0d7b5c08b76f5b3a1ac642255b270c9160d58 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da95c7ed9bbbd72661af7f8402de975177971d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e039c9e08f7353afe2bdb7675e736caa169954c95ad0c5ecfc3e772b2062da +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..990af7001bef6c7f26ee139c2553130d2b37bca4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b51936876fecc3c9437748fff1824da40d9fecb2af2dc5acdde76e809deadfc6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28c3e04cba240ff6219da7fc54c0597ce0131d6e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a72e4fbf30954c3f07372624527336280225b71f13c60f0c3de0fcfabcd707cd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..846afe1a6e4522373e9460c34bb9e4e3fef9dff3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c42953a76f761058a9e217d5c4e920a7ed07fe5e63074524b793b1b421b29fe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87ccb9bd684aa4109580ca1a95e70d67b1345322 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba23120c20cadbc82ee3c7d08684051d1c8d16053bff7c7de1e5a8abadaa4c5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37654dea8d0adfdf1b702f9f797dfb89c5a85faf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b99486b0ade4d41a329ed58c99a10b8be4ecda72128a0331b8936c0a647dad7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2036f539a85d21b075c040b65d29bad197cf1153 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e46dcb1edd62f7df9f2e82750a4ba889e3d398aa1edbe179cbf3535cb59cc3cf +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d829f743fe25bc0180e2fb9ba13abdea90eec6fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaff51b52c670f9db04f3730b1047d46dbfa86d04071623e2d0896446f8b5d7e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fa9f4c829e68f7f687f5524a645385f5276ad8a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83f260077be6251bbc6d100b2f8c1bfe148e9490298d6f1dd523afab92953393 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3bedc4042da5212f16ce881b0f847795888d891 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b7ea47987f334544a9ed7acce114ba77e259605d099565506e149cc4cad361 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26c22d7776c7eb65c37fb2a5802b93d9a7f202b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b28a42422aa52e87755679975a203aab83e6faf2a043fb95dd1d300c40e5f59 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41634e975bf9bbefeeb041cd6090fdf61aaebea7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfdea5786ee08ca623254f1f85ffec6623c7c6c90b31e3d1e97992c3740aa574 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bda98c111eac9827069a38450ab6e5451beaea7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b41e6b04165496cbca29560b37cc0624e3b393d7e1e381a0f3516de2c5f8a96 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e396d53252c8f3958d8444f4bb16b8831469cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d5080d055de9b85ff5c8ec6bef2d59ee9860d91679416418fdf70a1c50000b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1389a49d37cb76d1173eedfe3720ab9daed1500e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:736e4c79a06a64b931050d714f10c4c935c84e23a012202fc9fbded8df016db7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0caab41088bdeeab076be6f8688c85024e05bc81 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4451cec6ab54218dab5f2d1b3d17de7fc9e1e32e17cc51d75c2b6f9cbb2c0886 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3b749ae7a85d56cd46dd03201a903a207736aeb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3e457d4d737779c7e53b224eb9b73c96f832419b0b7bab1f956b6868764d57 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10588b34050d6b4217c7a733aa9ff366f3e79727 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07b27b6f417354d9912f69dd27f63777d935f45af76d50e3deddfd9ca8eaeb8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9125ebc1b5a6cad96855b7f3f8964bb0f23c2c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b0550ba614ec360cf44da80f63ef20436606dc2e7b002a90d98ed228c9a5b21 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd2f53a8a9cceca112df85f82cf76bb5dce9e088 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7aed3be902e87f132ceac0c3fe82f53af70ad96a1598d6bb49f1b388ad4092d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44da18ee40897411b2ac23795f4610fcf28f928a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718ae2c8bb7d17ce4529ae847671515a819da8d8e370b5b53a896eda7d1153bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c531f0c9d77eefa9effdb95f45897c803a747a00 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae747d91f52cdcb8b61f139f6268d203e036ddb5ba819361ee539f5c7715a296 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37448c12b4d77dac6a2fbb00f25321da26c165f4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd7c5013be56726eade1ca94e4f6f589b2a405630ffcb6690b186a3a524c33e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ae1944a0a0eab583d8a659e1a9ab0d92a1e2c78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da574c7f2c355a96000409c108327d21248348b6c0050e25e7c0395c585dffcf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5f17fa086d6a0652edca6fc7d777e4bec231a3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249bee5bac0ed00c7e0b342c02685f27ba6ace2b3d89ed0ccf47d1845161b1b2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03f79a9fff8c75eda274ba126e9f955df6ee20b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f19e38c44f4ea4e05385f425379ec22f4c423a8e4954055fb10f89b591c8edf8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f1b8841510cd7818d805cb57b36f3e125e01311 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c91c471058d46380cc5db5aeb8a4184e73888daed099a394058650d797b815 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16cbfabc653919dbd1eaaaae3f070f8611e5a3ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe018fa4d3e93a6907b25bc9f7c46dd5e91afff5b3a58b35c2d3e9cd84dc312 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bbdf4b85dc6c808fe2a1e6e830935fa26b35181 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b019d3b9d111dc258b783822d39a7eef5fab8a9e663a76df765930283da08137 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edd88c1333cabee235c8a76bb817f4e9c984d08f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d1d71f885e43755cf5ff716434d3936eb576bd08cb67383924c02570d258410 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3bb4e2e13496f9e79be971e0da5d5aaed22631a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81d7c8054511ba682a97321e4cd503cfcb330f32bed406ea053fe13c5e29ada4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b9350182c95ed9c214667e47aa45b91d671b6fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9180e015197c1841cd91c10d8b3403d2552ad58984802e295c869edf61a13fc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d9b6619a1cadc9e6d7020dc9de2d7bbfb2c3a6b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e27fbe1773d60c0cf756b8baef4912a0acfead5a43475081a8f7427ca267dbb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52187eb83e03d22959e02a187fcb3e06df6f38a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e18a57a91914595d4c524601ee01e2d37218346d525905e20abe173f53956800 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..369f2ceaca5bed4a4595b6a06e5a576600a4a728 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6d6deaf640494c0597165236f48be8738316ba9efbc8686ccb2386b689c428 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6333920c755538d9df3df7fafee69ac5b44d1eda --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c680bae3d9b0b653f145a5c1309d887ae871f4588bb181cff958e92b11121cd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd92aa1cf26a2383f46e7c26bbc08bc698341d1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d850bc364c41a8b3b081d7bd687eccc861bb999b32344994376c79afc7bdf282 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed85abcd7008a62d26910db9527d7422d8db159 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197c72c1d8c0610e45c5b8e4fde4753aee450c8d4cf5321a6d0d433056d99cd5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a6da7368019f1d11011543532e2e1e7a40864b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b808c1bea01d1a52eb867339b58a4948abb6ee009f167bd305c4b86e42d4fd11 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c89e04729d0ff70424b32b1fd4e756343d6b0763 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65116a1c5d0a8f331c108f7529c3375f75ad42c4ed8f427ecce39e866fb9a0b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f592ae47684eb19bb0894d099b811c280134e293 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:394da75be07fb8bc491cbf224d3f39aad393517c833ba2c826141c567cdd3a1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..284fd05394ab6152b7074c9f37dbce182277d908 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb3f025977d6ae1700c16090fb23a91e15a699b7ca7ef6ac40891508f769fe4a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5f84e04059f84190e8721badec1a405e1d44ea8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f6a49a33fded18784af5599379ad0b1ca6676e3a1c8bbe6de0fd445b3893ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10f1fe9240c3a150615f24f73db67cd551b8b32e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ef8f0c75de651221f47fbf2b4bed13d2db93d1edb7ca50b03ae73c86ed7ee3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..945bc4052ba06cde82c7f1a6ccb589d7970604eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29ee1223e66a8594983238fa48cf599ab6fddadfd1af2531c3a40f60e2fde994 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..314d9721ce8ea5d3b326c1c7c2f9b16f6d180145 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55cd53f833358e4256e16aa83e36f26f8941728eb8383b81fa4029e246875246 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4a40df6272c9aede5793d9a8d68d2730895ee06 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ac63aa50012ea9b56a72bb5c4180c6db40ded963ac468e1083eebde383df32 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9188452e175a7b0a2913b05d58a45ff35989fc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:631e0805747e577dedb7ee3ef414ecd5353246580e968444d566bb9218318587 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..827a88f9327fcdf1d0684e76cf9f9e9940f48d36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5216e830e361b55f2df038f7d4d91a0431b62e21cc044205fb5b8aa8620bf07d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0574e6322699ba194f115fc406d6130cf5e984d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd4f0a9c459ac8e148e2b0bcf7a62b16b52776ecf389028414b4566adef7d3bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ee93f9b3d317258d4eb2b6fb21fe377803d8c82 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e3f030975dd1ba92bd2ead293b8ce02cea7598a70c25babed46ba5a7ea03f92 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d26fde3dbc707a38985228e8f7aa8ad00569c653 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2624c4055c831b77fb7a2ec04d7ecd250c2d83c573da003fa4647cf7ab48de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f91255301ede91649668941ced94d807c3281d83 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa45e6e07e1c45288b0f0ee2eca0b762665febc649b2f5b0a78ff0985753834 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3360bd444e6d96ad450adb507ebbc4d092d79bb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22fb8c3656996de7606a337d7385ee560b419b038baa813e9aa88da9450541b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..738919e93f7cd1f83cc8e49bcf7a5002fc3eacc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ba29e95df0be454177170c7079b8223d0f9c0f5a2c9a56755bdf543f9197d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90ac39366d449f751467ff2654b72cf35f614984 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7dc044f77193fe46d34b727af1e9b1a72a5bbff5adcd2b9f1952d9dd7f301e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..218586cb82a5723fa96217dc45c3f731dea48474 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa3cc4b1a6ee19cf681e39a13abe52b64270193f1b1ca966600307ef714dcc7b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dff3644e651cedcbd7e972c3128ab1184ea3072 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463967884ba488780f3f619d8d2a55a3bfcb5fed6a78db655dc59f90c0d3b2b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc881558a7885acb3a22fac7260155708d5afb3b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb3009274e6c4407b18846fe2466462c964812dcbc6e1e40326d6efb84daded +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60b31591eaab2034dc32447d88945dbd9b1e96df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610ec7801189ba8a3fa127be3668eceb67637561e9b33e4e57f8c0a92c2ae2e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e59f38ef3658066892d6193766feed7a9e117e25 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:895937497b4133e56db1dcb1fd2dce2a6522bd36c1e82fd0f25553856d2476a0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..394689e1ae3a99ced16ce9902571894382af33fe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09b2f94d3fd38f6fd788f1dc33fa8b0fc95599a11055ce1656f7b1eaf2dc692 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7493e315fa9d299beb9e765da327df009ccd6e66 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06bc69f8ea0553326df745bcd6a1b5ec6a38b3c9d4d58250ad383719571f38ec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..696906115ceaa1c7a6874839ba081043c2b96057 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5ba5abb140319192fcb70212c82cfb07c553f738b4b250654a14826c9cb2a8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c7de146cf35f7da7d374ff50b3b32d5315c22c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dd938590eb0b4b2932936f052deea2b6a43ea25d7a4f2cf068578b831227bf6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..695779bc434b631411eab83db2580614ed18eac7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f83861281247c137fd87e030c3cfb5629ea5443f7201df64563fa3fc5a18668 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0d1bea3b717ad31c983e4495309274ddb73bd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab9a22192c98720df0f151a9c6d4cbdc5b64f5d4b90aed0cc0eae3ff41976b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..68d13669f50831235d6c1fcb0486c29336d03076 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65d2c22605df1cca0f7c09f38f37e60bec78afdddb062d4a8aee6c76ddd5647c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a08076a70c38e2b25012e6a84e3f2a9cc86b70e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d58acb49c2d19366064e0f6c9e178920bc70945d596baa064852404652a3dc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4b073245dc0c61e4f0cc7e3c42725d273e8eb38 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9a3b118d8935fb113349f2765a68d0529496a246d2ae4f69acc77a4603870cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9ecda8bbb6231d9369ddc8aa5d5d339d75d0dc9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4526552fc7d715bf07126cbe1f31dfe4d6c3c767c1e46683239fb8beff483566 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70ee43806460e19a62ae05167d66d89ac70c2b2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f92df0c417f7369446777dfc02cb35097b3fb2855e34304cc25a5c7be1c146e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b381e0185a74ceb78dfc5d91408cdc398602aba1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:267c8bc3c2ebe99d4e88ae7624ffc1e782305dbf86848f50ed92e05aef0145bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa3ffa1b21d99944e686a24698271da12b8ecdd1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a6a4afc0dff4940a28938981710ec5a46f09a829bc2b82f505cbde2aac65352 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b6497dee177da1e750b29c92f7953adf2ee6136 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e552249bb26c8430245ec18c5a9a0829c924472956dfdfb82d9963238f6de2c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7170f4cedc6fdaccb20c89ccc1c5b3507c6ee893 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:523f7fce9979d46a7fcc8b919ed30a9ce20fc5a43d9fe78fc95b67a3b2b48695 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f7666cfd1e38a2bfa9bd1ff4b8cf8e67bdd5b02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39931bbecd94ec90f456e6518132b2343f8e6fbee6c4245cb981018dfa947f3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4317c71caee81306d954f8653ac062f258933ec9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae57fc0d20b9a098fa8c4dd8a62435ec04a18f759dbf8775d111bf5171b1907f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b243db539cd02908c8a9a725a77f8d5fe2982e64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f38ad49c3409d6c0077d960749fe4931fe8fae2c84cf2b63db46823e33bcd9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..454393e0c9fd792abec83a93ba2317c9d86c8998 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72997781d82d76c15dca0ee04d60b458d4be8b565085b5c18bdee81ea86865a3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..415cd6df096a12c510a4fde01028a9714e9a0646 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2304846fdc4892936229e882c1a419cf41bfd0865c8a46f4c49789cae5e08823 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2284629b55f507046aaf88c6713a411c0930a07 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71e1ac522159b45ab7a8aea1ba6c9aa2ccbca1e80cefd4f0046f63b4bca8297 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7f921ccb63625246dc5500306c38fe4c5764d23 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa4e61c1f3666093189a1b4ea3386895439c7f0f153ccdf13bb6cf72d3ce36c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01e7f350648e2e81f6f49973b5516a97c467c379 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa02ee547ff81c5a7c6fc95a88153efe053eda54f289011e10ccb1e47f352be4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9fbdbceeea721371a88edeeba150ff9fd5d8ea8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2517a3f9a62eb88cf8f4c829ef8d9af9d592b525107bd56c2d2113fbcd233aa6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70ef9327ebbde97b70c735df86a8f11eb00e55df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4f325db7d5f5ed7107fe4e1a1a885e6e3602bd5b3c7a1f9fb86b831197bf8e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9370c04101fdc36645ea3eb4fd8da2e22910e14b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:975b1bdc54c3ee21cd0169017dd9616a6338506f6825b83e74c0498561acdb2c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38c0a73b0125325992453b7c028762061474f68 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68cd3e31da2722ca98f331939aecbd549df347a8f11664348d99602d11f5205a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f509182f9d4226e00a6813a2584449bf0d17111 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af8128e3adb5f4af195836cc4adcf3298aee5127af4557a6c53af8ace02d979f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..225071f442a865a40604619123b87dd4399b465f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22e9bffe88ed9d5f83f121811eaf9f0891eac63dce94c78731d0d8df26453180 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65478e02520da9d93c62c8d735e62be02ce6302c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8533faa48709c1e96b055fee1a1f4b36acf2529a66500b8d165f5f3ef3d87397 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0b3a47ac805203fc46c1c8212c2e634396ca773 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:758effcd2320488cc82009ccef97d3cc7f6ad14c6e970685a7e54880ec291618 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b25b9b9442ea098b39d23bfde40bf9c4d6db50a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d84691430d9c55fb648ed873ea64e12842e4a1f79e0e9e7f568c40de28a1b971 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5df9d42c349184696ee0636b6c3a6572741f3d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2254c0e57902f1095ea18031d894f84b308e7bc2d5a5f41760d19a7dc5bf4f2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d5f74ea02727eab9168ad439453f8fb778ba30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e90424a91586e2f80d622e4723b51196903bfc616da2bd3b69f346aeed4c010 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24e401121b34e656cf60fdb5e3152fc0bca3c6f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7d58ad8ee8d066c697bdde5e12bebcb550a90f75be2b391adbb00443354465 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e5be40896c5aaf94420767242b164c24baf7ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff97aa9406dab26513015fbfd820ab4aea6bda22761a072fb6c9ed03484f969 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c52b33bc4b1c535a32a827592618b8c3a628d9c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48fd2343c84ef5a34ddd9bb32012cb6a01db761f8035db06b80a88405d12b18 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..371f4a4e6ba4e8ac630a4d2f9f21701c18a90e23 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c107bef3e2fd3a55a34f16a8258a1e00cf31be248a6209125cac235b9c7e8629 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48c0ff1387cd3faec16c0ef8980ff0b93c492737 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a56588eee48b68cd68099c9962ee040752d785e65336d4e9ddc708f2142c7651 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60a15b36beeb06a38ccc90bd19356f18d4793a52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d832ac67809c5eac686013013c4d25d38523b3f539eb4c9258da9fa20c269960 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e6b0b4f98e0b187948b79905f7f68a5088bd38 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bb043d7db7e19d94d446b4def1ff31b64763371ea5f9e1a10c13404a4d7dfa1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b25701c4d3a8b08386e2c689f47e83afa1802a84 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7b7a914ca46bd9ca365dde752021600335e4fbce1bd5bf6540790f4ec55300 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46c99ec20a548d15764856636f6d14ce48cbcb4d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b6b5c4257958c4d4f98ea37de7d1489705949b2ab5d8ee38b7bfa624fa81e6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37e2b94919aae3b9d15a04aee89714a01c9478bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15780e18642341d3eafd867ec681ea4bf9f90458a49518f3284b204295c78a85 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a95509f089f6c13d554330c2d4a515e3d71666 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7691e759799129219b110f0422ecdf8feb60409126ec59054427cd5f162629 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f96b4a429cf896619e1e61e0df92f15b9f3bb577 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cee57d2fba97170e2d8666000059c764ae553c68e3ecd91499271ca1e523e6a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bdbe47d77fcbc3a34c27d11334f2de18ae4f15c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6abea0ed7fd7d9b31b1d7ec25e698e331589b97f6a6220ffdb2b9dbeb245cbd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f5b15783b10e9c7920935161528bb4aac5a1729 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42ee85937c1dfcf7c7e37b3b7e079f2802a53e9d402fa70678d96cf6bb3a7a8f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..977b2ddec6bb373514acbe00367dc56bfc237e04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94c351d7eb75fa5d6977b5fd4cabdfbd58c91085ddbe7ffe624de84abf13582 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..389374411e7c4dee8b82b0eec375a4fe78b80a76 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8f04f8bbcd1ad6db63c4bfe7aeb45ac5d31368b4d804f98fd78feddb832e07 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ddb21a85ebd887981199386591c262bbca0ac33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f591989ff4f16a954302c719d9f7fe8113c5c1960daf739ff9ad8390470e925 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a940eab7163954299ffc8c5cd0e91956760fd4f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:476dca36adbdc419bf8441286361e85a5a4f154a06521f95d94a6a153049229a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b2e046f5e7b90b6cd410b56fbb5a8af16d967b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80496cd1332d4b1e6929d4b77913e0f8f7a75aa1b6e4f4e20ec9f89a725f1dd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2d3305c6c2f01f3360aed5fdba4e90e4e5f2d3f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea56dded038041642e9dc345932b85468f3cf19180fe394c0152e93e4ddd423b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91808d89c24d4dd1bcb4302ab9b548e33036d0e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63d786055d8bef1c2df203fbee374ba300f7c521eda60d70f8e1b7c1373ae5b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c314896464f5b8f4451943b8cb087c1d00d36d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb97b8fa0126d6532610b82192f8db41f2ee836c73f2750e16a4ee39379b1929 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf78d49a57e36d8b125ff4e95f4ce393051d55d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44f5597f874e52657640fa48c1203bcbe89bec2baa3c9acbd47ea7336d5dd60 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be3454b4602d5d9a9f6e48c5ffd6b957239f30cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8a03163c0229e6290df2fc3c493b1e7911c8982a25d41d70417383021c88f58 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e51914f9ae7be9afe25dd0d99a7d0e17c1f61fd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e07bf4b187c1fc60e75994e2104c7dd3335818b467b4a01e13fecd3cabedbcc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0fb11665c88589e681c71433fa55053bb783e11 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767075a1c9c750ed7cf7ec9f2e77b1b53658873688ddd6acec227acc4d6757b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e9559b7d35a7ab346ddaf4634c24c4c386d209 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e680b777b993b56e132ea4846a16947275d4fdef2035055af4b85bc130f0123 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb721c034717434c2bc477e6d25047534b45e97f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44bdaa23409366c98872e7613f51fe61cb7a78c4b1376ef32bfb0cf2a7d0f44b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5765f84a159e01ff65c640ad69cf2ffb7bf194ca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b28dd5e162169ba396a6c25423fb1d6f5d5a6f53b1e713512c4ed9b948edc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ddb71834e5ea7f1545e48dbe8f5ab1bd970c39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d0e84b9c948288cd4aaab6186ccb94dc60b5df782ecf4fe5bed81cd45fc5c4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48deab5d5ebd00f2e5470ba357fad7ed089deb5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c0877db342f38808dfdea028a5db333e40b255e4ef849bda575481275724952 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12f6dbe50fcea0ca7f54c6d2ba2b69735066cd7e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8666a562c46ff136d4261b8cab9ca98424152f21eee34da5bc86e004c00e9e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0cf596ab76035840c20b3c26dec562b9a8060a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11038f082e4957905edb4259620d96deef0a0eeed91f0d61ba2fb05351559645 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d11743a152c699026aeb788ec21095301ccb56a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8dde5717b4a145d3b79834cd25d41c29b551ba15c76c1ad73604ee2c0acf6c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a87b1cf7eaf33c1f61f4d5f47f46dbcd1fc5b2db --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b96fa748c8f4c58bb9dc146ce38b32ee939e86c78dc019e48367d82bdec6b6d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c20cb88fbe8f971a5b5fd5426f527ae79992fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b786221a07e7caf51035d6237af939f238214ea76632cf5659b8109899758ad4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87b460492ff6fd4f06b49972bb14aface94c51c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de37bb0c9bc0eb0251d4af328fae3d109398c9b1bb07c0c45d2a0a37edfcca04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c047b5e5289d94ac760d17e21ba611b59a4713fd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784ca580aef68028712047884dad52781743c8e0553aba9d1620906b6e0c3ff9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e36c754a17bf33e6f47ca84a934032b345b823 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b662acae469d10a06bfa68bee4645f3676da65f1f8cc4b1977558764cc06d496 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9e866f32c3b3e140f3975ebd93e13022bd4180 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b0c28b79a6a16d3eda12037ce55315802e78d1b286927a89adca99da80dd21 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88d4ffaf70ca05ff65c41cc62c309c257f40093 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714ee4fd07c9f451a00b7118ce630957701126f26df71cf915a24d89d1273017 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9f355e66b3a9aaff10930799d01ca2032697447 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9949cd1cf9e5d6b8c69ffc36405dcf4dfc99bdc1bef102c9e72c2fa9d310b8a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a585a7c31b3b1682d15fb71c13b6cb4eb35e621a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b968affdb96d656f736c904fa50f17161693ae75c3bd3736fc2e52c4b54c28 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84e20420e626f67786fb98f4e1781469e759ccd6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc948cb40b1dd2055243b3fc15a78d4aa4f958a30721f8f412996c6cbd1029c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5de545e3e9ad5914443ee929d63fc0920e647a0b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4fd33df115b136b5b7f4520cc8e0ccbaf1c26bd591effa8de98c3b80fa3cb35 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2234b14589f5eca5b873b987f6027a3daeba7b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ea10d97c097f109059bfd23a5e005508957558f094f1055bee18a1f1b8b955 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0609b808c52c8f1432d102db83ee628487b25121 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05d20208e5bf2efbbad8478376f515624a67877eb3bb3be78d6f2503d10138d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24ce3bd4f5fac8377aae95e272e9f911dfd6be9c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0d890db3a59b06a2bf2e1f9847a3797f74f1d0d88b001a0a3bc8219a677a27 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..434585109a3573929d3b00e0793035dda23b8752 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b589e3394520f954731146a2d2e6371f53db965b3663d84d8a944c2dd03fb25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dd133cf20b1e113d25956bbad2c9193f498f383 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f847786b64136afa1c75a3aa57885a4c8f1f4ac17ec29214747ce30ddc26f1e1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e74436a5f9274a4c105900dc11ed306cbaf2c7c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bea4593601d7f5beeed67ed4554fc1d5314619da0e5fa969477457f810082b0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69acbec7709e13afc551fd96691fb5bde828b86a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48385f875a2c16ae19329bcea8c30277090b8bd74ad90f2232fc63ab23c2f90 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e14d7cec0b198a6bbf50e2b72ada9d312c40f827 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61698a26ce6e84c6e3ca45000a3b762f92a9a0478b55b9e6eeb9f9904e8dca9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56e5c6eca6dc6ed2af7ca455228ecb931259595b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8affd47e07cff1c2c32a5a7365fcae8503a63ffba5f40de9b0ba0b41d3341d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f294e3804a82d5323537d7c8641e73206cd3450 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6f1de17a56ecdc6780e9fff51b4a9d98b4d7f6d4115444ba8d073264e34518 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb9fa42919e7e4750e1e7e05877faddf26e2d45 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:281fb0754e141161d09b4f183513576d8436a6e32a5f06872b6356a0f73caa1a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1c49da2e986c8eede633daf15a39d138cc48cd0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc89d74e95e95a57da0584af9a5a6b3c7c6e1f371f7790371895bdfbe3f8858 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb0686818aaed1da94fa0049e5557f5ed876eac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545a7175df009b361dd97b49dfc9dcfde9c79ba3b3281b7729e59be3b46436b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..281e7668414f6a87ea0e11c70b0408871140efa5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944c107ae99c3aeda319f6515a9fdcfd068b21d3138f92a093c457b59493f113 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0489f9c1e73f07473e6f2a8b002db7fd8e037b55 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b95f0c66027edcc5d68c9569cb003d8d919df949cb3fce35a10ed694862e59 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b4db1e1f780ff8a97669f405f3b5414ed98a4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:174434f0e3a506e579f4d6c54ed6ed756cbf6fbc425ea7287dd7cbf4f3896ed4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf0944fe4e674f08698ee5d5e9e27691da019837 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409a843e2985bca2b6c043a4c99fb47b292fa8ef7cd4d70b5ccb107437ae6419 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87a84f1e7abb3f2f9e7077075424e71f5d238110 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d504102630129075bdaad89ca6770f85492974c58eebbefee67259d7f5b055b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58956b5c752a4c5d6bc42f4a01ce0dce92deef3f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e2e3bb961ffaba46f269e072aa8a805cc9f962cbfb9f062b9bbf99dc4b7b161 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36c657d8ccac042a0373ea870663e146307c1071 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:230f83b853863668290e44dd55374f05baf31e9aa036ec81b771f836caf25c1b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..781cdc88efde45bf185718cb4a1d70a004b62fe7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2486792287ca0af9be77f516567691b01282a5f787e5b7392106006a0063ea2b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..baa93d4e55b642aa828e184d63d1025150fc0c01 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0deedad708e14c79f139d93ee1a7da588427966418173459aec4f03b4544e146 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..930390082a3d4cdc1bb98056ded6bfa21b3ea3ee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361489d3698126342e8113d70f9e8882f2694b7edbd83c6e4e09a912b17b5530 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..140b01e146ae9207e887e7793e16d8836001b365 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6052d02fa1919277949bd873f5bea01c10bbdb9ae8a5d18b9ff4e90ff51e6913 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..222a80c342e1b8cc011265ded80237ad0b054d76 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c11cb19933edaf6b31b32105fe415a9928a540679f3c6bfa0ed66e9e7876571 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4280292f2f14910c34533be1260722a865d037a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144bf00781f2b513ccb30c9f523bb149d25be5b6ebce238563717c745665bb64 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dfe89b22adcd56caba4ca78a1211685e521247c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c823ceed22b5fbca5c84b3a36e58d42c7bf8b9fc9fc8c08d981201c8d304787c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ffed96ad647df0c91e7d0a6492fdcde3a718fe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa05387693e612552af066ea6bfc60ef4f9f32e9fa3b3713a2dd9b345dbb147 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10e4bd09afc35b12986ddba45118df53cd182918 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c17f65ea43250603f980f8cc8484d98ea20f84e6567e4401f60324efe4c7a0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f69aa4e3dba0b6d05ecb62c8eb6848b970480e3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad43d5e3f01249d5659dfacad66bf838aad630098282e54505ff4af456e64eb4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e9995eb2a5c53c790532038bcff26d565b7640 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb9df74b88348cbccd67ac632c3959939c57fb194bfdb2dacad7ac71616ffcfe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad25ce01af4af07f402e3af4370fccbea6cd4cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ea6fb910ef19e286870b9fa22925c6ed3c59a4fc4674a88eeacd73eb766fe6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9682b92ad9e629d7c0c50108db0116bde38d7923 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1425c1e5dbd814f45b0f72421fb59d60ebf906d1ab8060857e7ae8a90c317503 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a4cb34db0ca2611d5c9af47d6271b920c44e67f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8249091152d7b6a1031ad4a24e08d5dad10b156f62d6199ac8ea73bc3c00519c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..730312a880126ce24b82bf1309d8c6125c85d5c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2dfb5571788b9d246f051b261c9baef1d13b086eec7bc27ca688bc4212ce435 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb08f4b79112d47c68d68d5e7c4ba63942b47ee7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7308151b7563cb2293b0899192ca00a7eef14b355a4bdb8e0ed2702056f83c66 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e431fd5fe18575104b285bde9d526245fc2e360 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c214d094d872c527d3f2b802928fd1e7373e243495c8f61608fa4a91262ff02e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e46d299dd739a1d626c2fb3d8ab2f3e96bc4c7cb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8efd0f2b733bca74790b60e3a95bf3739854ff420c74561f43a8ee89a3418436 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d0bde2410e29d92897e41a400505d8b73b42e41 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40b83eab9a2f8faec40346fddc1cfd1616eafba6735ce20b1412ca99f5ada034 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5bb16d49572db5319be6f92c2bba32a011f7782 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb5eb1d6b90eb1886b3d34f3f30ec8c595087e533aa6137a5f2a8c1469c5bb3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9257d3dd3c4cb850ee6085e8bc95f5452ad7015b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d96a67d544fed06f05387ce973c375898de1071807e4dddf24db5d7d3ee88cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..baa4eafa42f2244a1f1ce6416508199710c0d2d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1641ee7c4e02dd6fa79a2499e72ba6d2e186daf745a44b1b3e1c85ce262e0155 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..581eba732755232b81250097b25df5d3cb8fdcd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ef1af734ffc0acdcc782f0680e596a3f789486397b8c0d0f92348414a08f45 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55c5dfb8baab6b5f2f28872880bd5bb418408926 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f97633aa08c27f6e6f3dc9e47a11de96d2a08ce9168d7def67dce319b969476d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..865f87f6657e3750ca94773ac3319765c747c7cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:981338ff98ff4bd6ea8d9d9823196d3e513e0e7477021ca9c0a3d49cf659b877 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..693d4ae6907c71dc418321a98a69a6270e6ccdb8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c1e4631786f012a984f548dd166437df4c4784c96af832e735c334c171799c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e82884863a2deea555c4dd17a82a8861b3332b25 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133b2ceb1f098ea0bb7920811c3362ac928fd9166c4a825000f5e39aa0392986 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca40237fbb14a06012539a1f11ac7e4d1a610826 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31daafddbab35432fb9a8ac5fe126cb36778f8163b560972e8c55d1632e3f788 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..affdb87fe594863f33fa5253838570419e19d157 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0a0478f54ce5ef78f82ed4ac2c65831c0cc0e02b0e0196a40d8ddcb550bfa7 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b5501efe494db370efceeff38a8a196fb7963da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf069097ea6ab1eaec5ef64292181c4efa1a4300f0824f54dc46ce90b396045f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f14766c0d3e0f88751c926a3277fbf53d926191d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531d401484528825f12d87c2f0eaeb07e720e64b386c96bbd8bc9f21cb20ecf9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da41b0695eacb8b8949894a4608942a63e77479 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acfbf4d8a5c046abbdaf2c65809c9db4aa159a7942cafbef75b52d02dac4d573 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c41d776ec12728d866394747a380ee15e2f1975 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c2381a7be446959844bc61704d07009be89ebff1dcb56ab6e31fbb803a93f2c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e4c6b2a9b13825437528f54fb6982b0e6cbcfe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea78f9240ee409ac95f403c8e8441b675658d77c3ece281566c665145798f38 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cdd3ae2c274a720624b5d44e54c0628b727168b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45285265b2ae96c4e0de5d3b00f86ef150e20923a459ca3e6315087fa8e323c3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d44c466d57261950940b25c4795f9bc612d8b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c0a0dc6e73771b627975688fe9ab82bbd7cf8c1f825570817b29c735f3b1602 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a515f22c846795925fb56349d9a6f4e92c2f1ca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79aa1cd67b9a4c87ad8aaf899f0c7651a40140c25744f35934faf3ee938db03d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4a5268696404ac03770c9cded468a887b426252 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1972e6a564a5b495d60e6882b98e250bb03d7d6c941401bc0b190e83ff5bb802 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8637c5e94708aab711456810cdc630ad39bdb87 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0949ce55ea26090d6ddebf24c5dc0725fbb5745561fe185e2ef5f1494ca9982a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cac29e84b24d76f4cba586e3f343d1e0c1706921 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e144e3887d3cc6e26140a1e074b9e3eab57b226628ad520ea0cffc5df5f230f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85658d40dbddf09a58082a41d08cbc324d2fb72a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abfc989680f54f2ffe1f3f4eaabe7e4263aec40eff67976b9e7429a0695ba717 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fd1021c6d7e44e1540b75cc90d766c40ab8b7a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ad94e032e983f9de80fbf9c01d39c396a3444c612c19caf0ebfdb22e1b37f50 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa999753ea06e7e4b0bebb579fe4b0efc084b423 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bae0dec08371f46395fd0043024b77d377be116f96f960721829594bf492394 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9993c317069c6e620ded96935e07aa322f21a3c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88b91a47f3e253fd4ec22cc2128eb5d9d33dd8814d96625f499299bb3699302 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fa042ce33cbd0391a52831c25c4f51c00ad21eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af029bb7d7a02dc19c6a96297585a52e7126c79bb91c85f5e2ec7e616089c879 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b43481cfb8885f282254e60ad956ac880c4ab2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe790b78bab25cdc591e0580badacf278c3b98d0054737a2a7829fb69f682d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d95418da0d155609d047b6a91f270ae76aa0bc1f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35c29b5b6a8b3689cd95b02a2af8df0b5d1b37e0e7bd30edd9db59b2b4335ce1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dadc3186933c6d1d35658c54ae1126f227a6e3bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a34e62e99827407215796777cbf508cc944cc3a7ac4c7a070d1c364af1fb3d7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d590c7525f9807818d7a970b85e1c75cb5f8ab74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0947eaadebc8402041e86143f2b41fde0bb77933bb69977180a516cb6f2f6361 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d401ed588e9c572c45037b5ab3a5e90c7be5b663 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ab86c48bcd6fc1b5ac9008caa1136a9f179d72f543dde69ffd4c9c5b23498d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1299568e86d01adf3c377824ec10bee463cf08d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:702b452018a6a4101c463fc3a40f580bcaf710bea79413b95d1a980058241313 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7514ddecae007c68fd5ed34e951852fdd4db0f1e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:146da4f843bb94af18f0ba863d3484f9214ac58f608c9e25688199d68aac10aa +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eae06117b155353196b1d6f4d574bcc1b262b2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c7fe008a3a55d0731f8902df5c875601f6ad271a894bbcc94bc748196e960a3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3084dfa2a046b001070382e48d8d7467f35714b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad6084de77642c111d072b0256a9466916ee5eea43eb8f39285aa195ece3b69b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d5e7f75006352ab8fcc90b5c0e795b240667368 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d50a414288bbe1f0d398faffa1d783f2111f60668e5c11bb437449ba566aba24 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1194c40495e1b76f91c34a29e3c451f9d61470c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:102c4186a40e53c8356fb2b49ac221a65fb8ea2105411335dd92f7870d68e98d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ef0f9d226bb67e5465ce0efd6506ff58fa0e3f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec44d4e793c0a1c8df69e78009d68f60869aaf601d4cb392ff7f35d18745c71 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b2bd976ad79756031d6cbd76d103d0fb79992d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5073fe8b741dd432bb2917230d139edcc764aa007539763cd22df3c3cd55feff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac05262312d25932277cc8ee209ca65ca2925a5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86e48397df062f97780549953a7022b58faac7d5ed501e3041272a9fbb7b7933 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0266d27069592cd3885014b0a3c8ecd168f04cc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ab928596e4c0906938da197b9140fba3c3df7638420f70717c45bec62c9bd3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bf1e5f34274a2c0f531f713f2fa8cf54ee9343f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54b0f1e7b197ae615a9b69aefdb3c1256054ace7d921708c62a4d2a4063a6345 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0156ad272a7c66a1504733e36b91ad1af9a326f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977ce55f3cb73f7d754a3971899118d729f17085f4eb5bb34d8f21a9fab293b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3398891a310662ea507bf459a2b8a1036bf5b8d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee3ee3f9815a8a483fbf9119dc3ccfae1736f5c073f2db568626d2a30f337de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7d63487fc7658233788f9c7bec9692324952808 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c09457b67b449ac657e991828bad07a871d8da13c00e8046832bb21e4eb6e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..328191b9053f0ea97f199e8ed43f72657a5cf580 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1bf7fec463999e1fac1c7a30d14dc1dfc81726df53398f874107f3c676df359 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65cbb6b22cfa7d5723b625dcaae2310d173c8b3e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23b727bb3a46c2020b7261fa195247decee77f21966525571a8ce83b4bc8a753 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c63b13acaf8603d9353acb4a27b26a465c53c1e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1f33d6bc330aab940999b63d1a07fcccf8f1a05b0c57bf2dab6395c53d75ead +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdcf788895b5cc750366736c10bedbbcdb855166 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7bc14355040fca2a72d64478e15f1844141b32ffa214a4dc1460ffb6b6948c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1c19763674dfabfa0d7730c62be2827b20eb07d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d740f6619ef92a1962fc52ecacece09c8c84d1723803767725b4a469cd7eb2c8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2777520f271fd95ffe483123cef4dac20f91123 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a718b013809907b29db222a13aff0fa89a9a25e47d512ae24d7bb973c9a291ed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7634936a10ad6c8927ac348d08116222a3bb0d6f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5642781d22709bfc0348297e67beeb49e0bd97cbc4ec0af0849ded3443a28aeb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..84ddc77c23e600f07f0df37cf116fa21c117316e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098ce3b8a798564551eb83c1ec52187c8338dccce9589c2f56d45f40098039f4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e78c9b9876b21bd9925c40491efa4c48d3e7f70 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c95c9e3e5b157ff86feee682a69735449f959c67395bc8ce9aea5c868e39dcce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6da2ce12d6e65ecaf331ef5b067e9dd6aef6c8b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff48c0fc6c3fb40e9cfc91ddea29a4723bfd0da56f0f323846ad83f56ab716cb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e43f458f758d0aef9568fd5a631cd00c5d0d0c48 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2757780d49b3620acca85505cc39c669b06da9f343d6232f621ad00a8b0f721 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02fea042d84751a8ab7a136ddb761a6df8260946 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5d96f6fdc745b78f9d944df5898ca86c9d0faa6d1d83b71c52100fad251b621 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68a12d4b4dd7100aa9f467004d925096b13980d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e00059de9a82be3e031714d5a09a6370146156442757109de6dc4b4d2bae205 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab4917cc66a9d0de6d3109566b68214e1d5e8ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ba8634d057a6bc6be61a9dfe186da6cc8241f0e5875d4097dce61a62810291b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..908dd220a76776ecf2a494e8bf5139f675de92f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28623733f2f740718ef995767b5ad8fb77dbaefa9cf29ee6cd0b289a316a1f85 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dcf380f136dbd1fa946228e8f3aace92ded2e1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698aaad887f77f00ecb7872ca6dbf1ee8cd0361f9dbdfc5956c4b701fd79995a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bea7c4d7bd71df8281b4cbc1f71d02d6a8c2d942 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b395b601b560ce5a0e96bc54f3c6910c2214f1ffc5398f533ca0eee7b6d9d01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b669d1a42864d62c375ad95cdbed1f2e279f48b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32560aedde54ca1e46b4f3ee9ea5d82f942fd7171ff226efba1c265312556eb2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8001bd79499f67b36f764aed425b29c5851f0bcf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5fe42029ac34ee9e2021526f6056d0b2c68357996e4705df035e15cf3361cc3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6518e334777475b88f0a7b37463a5465a0117042 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8d15a001f1d0e635707ddfce490488af42abb40a6123f78e4350810e56e3f9e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0598b39d41294656d0876abd942cedc887b3213f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a733de9131940edab46fe0652bc6c3aaf8f185cd530a760d357601c490e2af3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24247729ce320142917ebf9ff63992e74f4ee6e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3428f80916013c0b6368358da898a9da7b428b4bdb6bc5e3db663307c77a2dba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf3d05780a2c70d445bae158aac2129670b668a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5590ebbc7f8d1343aaad2b1f05fd674b5295a74b67a0bbdeb86df38f826803f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5158a708e40c3351f76f59afca339a0fd1a1f4d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33430dd2bd68cc8ae0b27516d0c8c3d6aa111f81ad1399b11b341a64d111c778 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c64b57892545688eadfe2312128a08b56d9cacc4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698a8cc1f537e2db36c42798e02fa8d33b0ffee964c96f80d1d5b9ebcaef00b8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c6167b9cfcd7d49dfcc6e67a0c2c085355a139c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2c953ffaf7827fe857b85d4c13b6ec8427660a85fefb942bf79a3e72f3336a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..676a59fae679669831706f5e3983fa257d748348 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556f2bee2ed553c281401230a42ee795427b44e3345b0829be087369afc157ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d821761e1b741ac07e34aac57a93d87809f6e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aa92f73cbff089d227d8d45852d549bf3fe84186d59b03de3c6ba6f1b6de72f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ee28167076a6ea32dc17a925b5dd035a9106b04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830140bde9333a284e3d5392d0681b20660689d113a803dfff176e6f76441fb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c96d03f89ffe4224becad8a5c01151d8b43bc8f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3981cbbe492311acd673ab9e56b8715a98f7d7da8fc383975cdaf6861f2b44f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c89fcddd606a43492fa6fd86f72932a63a1206e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae85a7627c45b20dccbfcf2a5091e017eb9cc7d71047fbdb89db297e8fadbf2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c5b2300d530ec2580989d58db4503e304166dfa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dcedbbfdd263a91ea238eaf0308ad2c301ff49f61870becd4fdd602ef8582d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ca5cb5ad6a1ff66654dc0b5388b9689c6b8c500 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3264052c39397514fd2eba4b953909581f52ba25e9373ce12ffd6e4a69c9c9ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..135b15d167468d8e9005dae87b73f35e60ad0874 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd55897ff5aaa77fb2caafcac985ca6f146ff755bb8c3e5deca0e028152bc33a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..168d06f190a1159e32d8fbe0dd11c230c3ef2370 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:decc91bda97c82afdea3e7a0fb68a4c69938fe0317de86e54d7f54377820ce01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38b53ae7afb659dd5e9ef7882f40cc4a1c405830 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e87612f6712ce76e4a9a697549ec805080c5dd065e34392a8b812ef34ee2d8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..106efb806db73da69dde90bc3d34b5b107509161 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a233fa42560b3b4e1031ae4c48c2c45f6d26b927147f15634d924b606a4019c5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51cc39582ea33def5907fa126b134b5d2f60f99e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c285d57169d1865deb9fbb193201a406b8a7ad794246f1e649205081c859712a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f81112e877c2461793f67b7e74aa5f0cdd87d3de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29949bdbc31333e2d9c89df12c24884582ca1fa80c1d9089b50c4989cdcecb81 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b8b98ca53bb4db112aa6a73e96350e8947f9003 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cfd9c103cb0bf220b9fae40549ec356e1d9e21ae95e4d45c710457d751063c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df0984490dd132b76baf58d84c0626b520cd19fe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98809d636beff072760cd36cbc1c9b4cb90a1b948e6ac3163782d345a7c5eb1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1b2956c6055338b5c4fd817ba8e967fe26ca4dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65d559dae1bf94a6ef60dd5f168a559c2b1aa287a37288a87499ff5bb5434209 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04238216f913d854325f4f902a53323fd51d28a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:439b7a6a5f5aba680cd746e52f16c6a16ba088e589b966cf3ec4c901174fe0e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7565be9e53df9ee871f64ad4110e4cd79448716 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14bdcd31a0c22f19d0f465ebd848dce1f6982dcde9db48c1395efbdb57fc281b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f92e689cdf6ad5def7d800f5d6cd113eb8be301 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df52a438ae4689477e5bda6d69628b624231c0a984287a736f0c8d35525b7ffd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64629d743504d2590f165427b5d49297291973a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3de8f15cb9c3a006b871c37aa9e90238bbd040961270ed68248fdfb5f469a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d36198ecd381636c2f1324618ac11617782efe9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded64c69e3c0f34c63c314ea115c151ebe7b868670326f276537630eec685ede +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..973ca02b044bc110c786fa578e417c184d9c8b31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9551cc1a9b24f18fd65897f747a90af75be694dd1dbded6a2c636e9090defadb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3baf52bfc31661441a50b872de52fed0840b28ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:285aa10bc61f5672b06f9075a1286e2c11f2a0001d1990e572aa5a0ac8ab17ed +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb10d63219057e0768e6b1d03a869c82c65da926 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e27bfc5a260b86987341ee7d1583f9fd0669baabba395499a2a5ee569a9d11 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3aa30c77f158c90fe6950f075ec1ff1b5247b6aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e30256696565a7c0ab1c47b791bbd26a485723614a169af26aa58c972e80fc9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27777dbce191ea4f2d6225edc46f702dd7f84014 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01f158d7f42a0b5bb831ba35ee6639594c5401c3dfeb9637eae1be75b71bac64 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c6ec75ae2e809dcca95027c147aea8398f056bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe881cea7388020ed7ea84245cf653295e649d5326422ce35217a3c3bd1ed36a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..520be7a48131f1da1e8ae209e1ed5ebc2d4f1dc4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769e41323f35209eb01b441932a069074aeb345f45f6773f4e9a510d0b547a8f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d29c50f0133c448aaf5c3c2abe9662aa4af55e26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1cadcf58284a79795424b3f6f2e66dc48e4a0147378c85baebb2c0a2f4e227f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e345bde34d3d95e5e95643c984dede1a5a12b350 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9d41c0c8799cb9c09878d6ba1819662c28ca3b0ca9433bd11a9a322526f9ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a2ad58afe8ef4717ab35afb0dd91471cc91b78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37fa517887f4842708c3f882a8fb23e2de2b352411444f133317fb50edc5994f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1852ea434f0879c9c2c399fc4342feca47a3f69a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83bf5142eb06ff151fb04d2ed05c4a4f154dc507572883d45a43206847d979e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be2a5557050599c11722ecf224a0b19e8dfa3459 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd753733de138dacffe7f8241ea729568c2b5dba39b8f71675a98b9badbb011 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f1e9300c904d17e0078eb42a498f97e44ed15df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:815a7da84211cb50bea6850cdee36063a109e4beb406c7cbe791c2e418d8ca18 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..351ade77733c5a09bcef04199411b8fe5f44e94c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d63aca9240b9e118fdc08d60255e9adc96dcba7635c377c344b8638be087d0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8711671716cb2b44fb7e0087db5fe937db84297a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6e6f199aeab35b6add417895c3f2eb87a9499815a91d82346c19acf68922250 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2f024b10e01615c05350716cfff52ab5ffa181a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c4fc5e816fb1391af95dce5e4362f25cdff83c4171fd79ee8953f9f5e09b2f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b04ad38ad55e0a912219b5c3418d32c2111203cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8258a05b1807a03c1e7d095a2eebf1b67c55522b430a4a6e1b1b8d56c318905b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb9cea1de4e1e5143d8f9e8e4c41de1309c7a9ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:140664db599be4d667ceafba00d0023bb82a80f5e5bf783ceea6da482a47b1f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c41612d7941e3f04033a9b80bb979f0c2bc87844 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cef837e508754385231c078f422d3f83d3a1bbbb87c12aed1f774b6cdde1030 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a999ec36d9e29b4675d9ddc7b1a2c210253b0d93 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a874b6c8e2c3290b7f5917f7c5be71bcc7f762283e21169d0b88c9af3105d55b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54ddebb6ccf8b5394f16bac76fcd6de86a67ac7b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e66442f32a960e6006f1f2b50bcaf4ae4150385e53633d0d6977d779e81d9c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fed23c4b5216d06996c598d59997204bdf33d4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6849ce38ac6f8090836d5b020d0aeaf773894504681278ecb9a4f9574a5218 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fccf278908ef1d160656b5d1baedb1e38e678294 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322fbb9da81b39101f1f8fc1216b9b3fb6b39aba11ae65d804ab0d9ec87ddf49 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4e8e95d7de3f0232d991b68fbedd47ce8a49b76 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d8b6f10a16ecbef6b864f3840137269c33840ea02de59670f57ed5e082ca9c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a190fb87347ab176fc4ff55fc66cc0f70d83c4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b20da14149162ff9603c12950fb87c26fe24bad32d05c01b2978214d44fc71 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc50bc377dd8d024a07a3b655e4134c35f26265 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f72fe006b281f76c9f246ce370f2b501d7faebe61b9f1d96843cef13196ced1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..806eae64c4582c00c02ec315dbc201834d73a189 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70d88a81d5399fa2dfa6ae909a98a5fbe17818e68b2048540716bd1a59b0d391 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2547e5217c772a660ef4c2afc4dd2151e0e11e64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10bdae49e4bc7fad14e2edffc1e0e60eb56ffbe156d3c65da5c0ea26e4904b23 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a8e26369c13f1f8692d385a72c165a64953d836 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c07ab76b2302bee59bc64e981fff0dec759406818a892f92ec4a545bee58ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9314ea4fee5ddabed66e9311fb26f228739d040b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5a99ff522d58f1d4c73b1ec8a4d9f5681c29c3be07820166791b8cf1e4ba99 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73a9bd06e4bf03df63f7a6785598e21da26f59cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671d859ddf3db7ef67b9c61053e9a55dec3e9e6f9bb942e42f9291d6d12c80e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6132916f41a01e87b14f20a1197cb38ad3afad09 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e4a8dbf78c5e94c0e9095d6d8c3d84a659ec5bdae517189e82aa9cb9585f54c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d1e94e204368bd88d96a6de8bc6ece0b748a410 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3919071436e245db99af9fd9150067c8324721f9d2e673e78a442d518756983f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ddb2a228e74f13fad017620e04467e09ce58c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986a28583b976d88b9da3172a98d846179298255cab8122322576fa7b2cfd887 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c68e6f18b75205463765a3bdc7a582854be32c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49921e91967f20a7c347d03dd9f272813924ac30cbc269479d00111150e34003 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df1e2a3e62ab125f621c64ed69644cd5f77e17e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e565a18dcb8c5e08bd0d7e4a616c2c046dbe48c227455a16a16f76d72724983 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c2a8774a34dc0829e8e64969e47296de567fa64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ae41f6ea2f4ad2906347b97d2bc7b255c503b7d62aa38d7f647f77318e83a5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dafa1c30e6cb2163a3ab6755314518c9097e9a62 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6a95e2d15eab7449bc55ff4fb287996a68c8b27fcfe749d20d7079cdd67d97 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16fe9c749ebceca8b4fc52f4b295e29fa4c94ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d95259be099f7b6839af591e8ae66c58a5e5bbc1dd135f34d7457493379e3e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a832d0d5928922b29f10b1c6b7981a2031f3ad50 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae89ef6aa1078cd594ceb1a204c9bff16698e838c34e148f8743f43d78d8bca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e315205da678eb4a7ca3b0f916f1a5d70a3d2c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2de052451707e43f9b86776b7285188760ba8c0927a2163e01532d8f1e7eb9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff57243a69258ac3b18b40e9864d9f9a3254bdb1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:451e1a2f213113ac436f9e4f2c332b976080fc67f0f3ce8938e2cd9e9c58630b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cc405925ea573a0eb77e86a15bf464f703ea5d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538d77f4b350fa4c2593ac803c67116b0ceb8de1f9abda8992c206e5eba6b81b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e41d8f4fb0db767334fe688e2c492834b1452101 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ccef2f9d0f6119de8c7029721061be993a2ecde269dbfdf14f46c996b9c31f9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e564f87228d35aa5dc13e594fe4f3637bab4ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dff27a32613c172d43880a9c1ad92a925b40feb4216faf2da1d69f5282f7ba6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0dd9b1ef19858be81e721045e5ce47ba4dd5241 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0635e5831141bf884844b3fdfa77024392628760ae36ae009a20e8024f4c8a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c4d299e6e06188471138a77ae2bf1846729487b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:085fb9e6468cf43ec531eb86b0b2237a5aa181fea831ddaa6d8569fe14d02162 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00d14273ceb14292a5fd95552ff5ea1a0cf78b53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52d6360a2ddd59e2beaeb898582de3c6e20a8e11828545161857dbb6ee31603 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ccf76910cd497f843886217e994fc3cbe3825f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16ea811577e8b3f45c6169564dd6286549fe018a5d95374285497c16ce057547 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0c0d0ad5519f407639a86e383b93bb9a4d6607c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb7a36fa57a200c252783d6c3ab026fbe722a85c9a353ed9e44e0984543d6a5e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..704fdb2077849ff7e23137f656766aa9b0a09973 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01410c51e02affd69a31fe23edbc898acff0b5dc31180e39a73c3eb5c4c6764a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..430e5cb2565e2454a5ee9c585c5fcb94fba90171 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca777111ef36de43ad94cd4c23041b0855ce57ea01a84ab4ad87111f5f3bf7c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7135c75c31de3a666ad946abc5282a950c94066 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c2621be2c6124681e87f2eff74dc836b32e588e641fcb1a15b13405f900f6bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a6ded9c7908713146ba5238d967a731074514bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82c7e0c27d222b0e2959aa9cb75928509640a0fc5b3ce52730e2384e6040a812 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..960d4c214b2a0bb71c7715f88df5c6219e3b0eb7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2186636b98ef318e3c5f512923edd89fd7abaa516df48f63aabaf9ec570592b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fda0a5466ac3a9580d5a490fb8e205b8cd15949a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99470f1d7c8502ac35059a0b7eae9375fa0bda68f32b543b6ca3db90b0a1f431 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3b8a75bf4bf0dffa616f6c74e11731000829a91 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c97ede78f60013a2b9a5d9fefacb18878733378fcf083f58be84ba246322e56 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..362e6697280d133ef33b998747a910ede521d56c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3efc0c0bfded3eba12d3936bfd75f81b502883a35eaee7c4bcde6b56a0c591c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..867a73ecebea5af0887e3e17fa2ba846bae61fc8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921f7a2bcc49705a1b4209a66bc4c6d0c2eae913660ab83e85d5c244d2590b9c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e1f71fab4d918bf2141570d0a7651f2311fa003 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b129e20dda79964fc4d21ee9a189dec3b2df47095a313c518a987a927483c3ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a0841e4abb2f1477c134752270e6789f8ee9767 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1252e94a45a1311f45dee6e01ac0dffd14b1251e9ffe43fa5b45dd60908740c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..994cec7331caa883649be01a8ab3e1e1ceaeea92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb86e4176419f849a151eeaa81dddaef25315b0185368a9f475c16ec5aabcc7d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..15a74ceebd0e6c7f1d181b6e125207a87a58baed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ed38a157c1c33cb7e2eeb9cca591ef3645ddc9c3b7378ce6bb07fb3382f0ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0479268a5ac5832d827a8080252eebebefbb1b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8f4f30746bc7a81ae7e0c8c2885599ed6775ea7537e6422aae76a81cd0d4129 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b9eb59b5d57c1fa8178499aadff3e6baa04a5a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d53320801ddb46ffb11f32a98d23078ab0c3fcae996aa8dbee047133d205bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee777fc543f22fa976c5c33932bd541aa1a16865 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706455452b9c605dd6651851a3698861d8d97551a2ce0169a0074e6545876f86 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35a6f05f7a7d714930f8017ad9bc47d5591fbb7e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30880bf8986d6c90ad787406d9e30953807ee9ab4a322b1264039013e1b6eb0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dd12b68f8454fbf0f7a8ac4090e41f7f189a57f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a94e2f06983cbafde49f215d8ef4e8eb2e75139893f8684ac3ce1c092729b86 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de274f3d0c50803797977eb2f4cf1e4e3eeda8a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:609fb5629a759de87f4ca2bc8b91bdb6dcb21a9da1bcd8625625adadbafadb10 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21d83f9a3a0d7c5deb286a69eaf1a3a1b90172f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f7af65bb37fb4e84fc430b2bf399c87bb5619d96b526e2b88b8d0b88273a8b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a37ecd5cdc3552084b95f2ce965e3f6980691b28 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9974644ff779c831b9c13fdd09c0fbaa67013823dd32d9e8c1d4eec4d093af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..43e057b1f5a980ea5465a52b2bb2cc42028a7d45 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c776b6a59cd95f60caff4b610041bdfb09f983905e2caab27c8c0320f554b958 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb535c8be053d1373238a8f05b0b257e60f5d27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e68f560d86c0e509c780b03f6ea0e3a727d2efd744ff743935eba6a9f6b560 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1166d3d31ac9e61bd25399f70430f679c26a0c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cca2cad3b7f988b52a5e361f7d3703ef8f54a73a4662037952d4dac397bc0e9a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65ddc9354839567bb316505084a008dc9952814d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95ac1c0827102f470ab835f534a3e7198e389dbbcc4b71d506819a0c697c8d62 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7701c6e6f5147f06e0301bd74061eb063400563 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3b69aa01651d067b0d51cc9f4c31768070c61f30a9ba6e3939c2ae1a95546f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..191cf1c5ab91df3d663ea03b543f9832ebd1757d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4bb911d06f893f7c1a03f86b6e823cdc119eed556832fdf5201edf2f6b9698d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d18ed24296aff47930f0c06026095b6f636fc94 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95148e5f2a176896b589a3252186588dc3d036ef11fbfb229758deaf63fe7a7f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a6556b3b954999316e9e1cc756ff0021bf7151f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3424080c122015244baa1fa574720221566936a40181c604568e4612c9497f55 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68076340c50d620c18a84b7cc0ed2466ae0f6b2b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e1a942d7078ab591c1df59f58548635d955d37df15f2178351216bb43e6553f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c8358fa06a4949e7decf9858e6247ac344d60f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a65794822c65ae700ce3a52350848a466570162ceab4cb6dd8848af00bfe3a85 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00c278c29acd2b9810acea4c17a270680912ed5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2ab4f2a0b8c0075c38fde277901213b05db1e2821a87f9e871d3177b41c7341 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4deb90008cacf42a2fd36440c65e8a8db1d0bb1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc1518d23e03e0fcef4080c5eedd928cf196e15c9e64cf999923c460cde0c4dd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..777c5e54d747d2879f4dee3d44056e84c9ea25a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3293d917af40ed9370e11da447f5e94de4930ae750819e906a3f0c628fb5d4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7376e2a44223ba47ebb3f5c0bde7197e0e9a6bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb48d094fb93d4e675a64218cf405a6115a81081a17bf9501b5d494dd74d0420 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2983c6770122f8106c5a6f7eba9e0974c777783 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa6cdc425a56ccf62c7352d0d0998c0ac9b3293d1597fa50cfe6aa5b4017bf9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..df1d6852271b56e805c8abfaaabf93b6e13e3b0b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7766ebc2963fe5b28aceb55d812b573e7b8d49e4f3aafe5eb287f0c2082980 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f2179b4a2d6a71bab03a7800b6205067724ebfb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7183fd49de5be3d1a423588ec08f5246cdd95599140f7c938a316e797651b8b0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..acda1c6b889ddecd295af4b241e7ab5414e5b1ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7bcb2aea55bad485edc719d320b54838a0552917bd22be7e52d0702f0a3c06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62ddfa875049cf5e8ddf20d9b72007d6ceadb6bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19155bb9815c8aa14a817b6b577ef24b7cebddf20770d4c96476713e238f6b13 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..892a2de6c82400c722ed4fefa0bec0f9fe93a3b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dfc280f369d23e5b1530fb7eb4c293396894c1f366939598c57ccd0a01336de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a66465cb80f1db4cbee93704a6c87e81de55906d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0802b1172e16d74e6a0fe905eb420a1d0b85868298a9412413a6bfe9e048e2c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae57423aaeaf70d2f53d8197cff46997304d98ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aeca7bfe2b7cca413d71cbe67aff68c40c57d6605520b669781dab02ba62d1f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..205e697ecd5f5486d3024a6d50e28dba1d98a28e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e72e6bd963f7af59ad712ddb8c205cc111dc6d069d413a2d8e3fdad256cecee7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1839ae7c2c7d9bf9f5a463d5fe942e72c1d491f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfccebd0b37ad1a300b93515b3bd94e7649f98d90f1d64517da9edbd944ae7c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01f618633f7cd30f321caa9753af3fc7b3ee6073 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fffd08d3e043dd9dac708a2ae14c9fb840f51411fd48b84692dfea19ea80978 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..226389a76f09e8b431f95f649129ffb2f9dd9893 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c84b9d4207bf28fa21e78a80a306be070ae76698d4fd825528eb8e708e12efa +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b58b671b7296cc4f7f92b27e9d2134e311f6d3a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9afa5356069465f42e34a04cb1ebc6357402ee2770c7dbbd1c580b54925b622c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..409b2307cf97137f1d2157efce7075cbeb998603 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1328edea52aacd01b4374490221fbf5bdc78bbceae74029fa5ffd7b11c5840 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2285dcef6f4572ad2eb3d7348fddab853984c48 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1aa4f77e7e39fb9d02b1c2bda6222c47cd3c421197b61887a31d59c4e52fad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1da3805cf49e13dca242914ea5f21575dc805911 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc1cf935e7cfa71095cdb117e6eb05ae72d2a28e4b2b4e0ba4835cdc61f7523 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32fc92ae530ec34bd06a79e94606bc11dce0777 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e53a3e4794f762fb3bbeaccf817fe1b7fe94d6a0b7ba1b7432111c50c9c0e8c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..49d02ac2a96899cb845b0ef664524bbeb5eebb68 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31ac87b18c909554f08da8fd0d1581d4ec8d6acf90a4bc6122368c460a7c8e8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72637026f73f4c311f23c1d0393050a7aefd9117 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d484eb4182ac9190cd58b5ee7c219289132374c502440426084a7c5d3e45b507 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57993c4e44633a233c36a6f27b6e8a51295fce51 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5bea578ee2c4e623a0263196bbb79f0c2efcfbc0fd27615103d6f7529f5cac1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f06afd30e0cc7ed9277a0e0ef9693ced542e8442 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2fa78ee69fb45e12a951de807f2b89260e4070058dd7cda66dbf17b23e33061 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee8118c07d120478b3d57980ff615178fd8bd968 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f41bdce1f971447e6b99ab154bc1130ff27208e32cd75025be50a69527caf0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31caf5d16228d05d684c48aaf4412098b14b49ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca64cca0cce8e75cf56dc47cbb467df0b10783583e4191dd6cb2876fbe5d5c4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fb87631faee81cc4a8034059784ebec18fb7ca4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf0c88d9d12bb9196e9068584423ed6a18b39c142584a462eacc8cc03fb49426 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2590e623ed701ee8a943385c51d42906ef4aeff6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:832fffa100449669b52c30f945cf56be76ed078e79c708a1c502ef911df7109f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63dd8cbd80739c2a056f9bea14381c90925938dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b01b475f029a65e549a18271934cb656726ff575083dfdf7d60f52bf5dfe2da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f82487b072074ee3f70a209661b1f9d640da298a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6277e591623c3bffe636f0fbaf7464e9bf9c29a6af9f1c87d8047885070762db +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08e5f8757559055e85495cc5b32f30970414a793 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab094131d6d7f68a688b2cd731dd052f8faf00b08a6be0062daf4c9e44e5827 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed1ce221afc91734402a696593c26a370ebb37f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61e5f1d6e8dabf04d97fffe42f941d02c62cde1e9931a123e8546c0565563dd2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3351be758f51743e2a94186ee269ba86088ef875 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb66de17b5c1415521de013e3a5976e077ee2118f31693a65e2da8540c780dcd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fb746d214cbc9009116ae45ab52361f36db6b18 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd78283c210e1a432559fda77f6437f9d2b0af397921d68c3736613bfe47d7ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea22a6fa4c8d4b0030c53a7a4e3984f7403961f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34212767da04af121664961cc4e6483e281b5a3f443b56b0fb5fd75776cb9c07 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c296c7b3ec64a4349508d855ba6d6e823eeb788c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2abb5dfecdb24b66085929f9b278297245ee831f1007188da768c751256e544 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd45d1d6b55a1bcaf8dcc1b0edca2851987e1f46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4dd9e6ed0053c0caa3b18358432ab8ec929bb8ee9fc0258c3b0b0a8fef3bde5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06e37c10862c951f80ace05de42e4f15bb37d82f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961c562741b16ce33248ee015b99b0e9b03e8ebfa16bed08e1315ffcead4b445 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d08790a85bde42cc2b354c3a56399182e2c6d5b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef10345ae34152babfbd25d370eac4011c528f8919d65e76afa3cf34ea8ec63a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a0f8f8d02cebf157e83cddf45771baee480c6f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2620f60933ab204eb299ba1ba39f61d38c06d914197f10448d90d879dbc97066 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e87db25b7de87fec77aeb484c49204982bff026 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:867306527c4fadd417be2bae944648fe276cf3222a8785db5397fcc06dcb042b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9548cbcb257e6383cd5d490c303b7efce6998b3c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b47b4a87f01ec907040f3ed4ee2ed3761d89c1cc2fed521cb6b5d236966a2bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7bb7518b29116055a023ebfc9346815feca1556 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0317540fe414c5765329492ca2b5c1d52be159cb4da60da443dece851336f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7444e199793adf500bb0d263cc2ce61a2974175 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62b71533763e800b0b8fb6539211ce277292543aeff3a28022b9ac922cea46e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..10b4e85f07c2c6a53cdd5c5d44f1e04bf2fb6a83 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8394097cf827c347cf448cb8c3af9f2b82a98f794572accbcb74bc23be0d2994 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0e4dcf5d6898fbc905965332c5741dae19e65d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb9378e93d28aa003e84ca673699a61717648c2c77026c280d3c572fe617e4c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1097c6c9e5039371401972b66d114c9f7e6569de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5012e566d2ab1c188e4f8200bcbdfb3625e92400d2e3a6f462a1b5b9d66162b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3c6e9e022271168f1e4ca80ccd5c9730782811b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d03862aff923a92ab204435c8e034e34d198f1da8736028b712d85b1b07c648 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf5ec921412bd2fe7222285a499fbfde046fbe7a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7757f2ea9c91b9f4f01e8d512ba459ef3c3f83c7ea2ddc5d8be38966263aaf2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c29cda78e82126bca23dbe9c4ba5593a1026234 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1652fe5ea105045142ff7a9d8e3937a77719cbfb3f9da4dacbe3840138e10f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65898114b636c306562e78a45a5ec4467ef26a4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46825ceb4be1a345a1dfe5f671dd2b6476ceda38c17b478756f701f433c491ca +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d43e34d4214a92134fa637beccb7f38261f3d8fd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f3d2e58d0e23cdc3783f57831b77551a44876bfdc0c64e10208446af81b914 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db270086aebc1a86e1d6870bc43084db2ed2845 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e501cb01a75aa21b17c5a33840e3986905c495eee907068d5043eae8dda3b83 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a571e98b137c44bf851eb4ad4a15e460368b4209 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c3095f1849e6570e8920899639b7a5bc4cf6b9c3ecca8c1c79c95fab2efa600 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..158c08d035c56a4fab0a37f53933d93db9596e1f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70d5e4061feeb6f50ea9c2c5d30ab5e9e5c6f3c19bdbd17348c50699b2663f3d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb59df41eefea45f5af3139fba26186b91a9b0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a26a865b260c891bb51cb4baa60e81f7b74fb679efe96bc5072b629f443de3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5f3f5dd54891f5708909f23f7589ad2a77e829f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52ecb424ceab015b1be97afa366a3581e6fe661237e936174540b04f3d8db882 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3574790a903eb2ac5e4ab7c69640b3867f260e7d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a159491b4002c02503b76cc124e762dc13c82baf324b9fc6858ba5d745a489c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d31238e98186a8ac1f22929548d7b95b912a50 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12bce2864697006780343fa416dffc1572fdd74c9630467aaf4d82a2a2b9f769 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23aeb112366cf4c828951490e6a65ecd833710d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf98ef2a5c2ecd98b44ed6f7f238da0b98337006cc2b9478d7b9fbaac9bc9c10 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9642ee0af257392aded7423a31e30b95641a456e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6099107371c986c7ac6db66da45cfcf59178678798e94ca69af953648c6a51b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae81b6018fb1bfbdf0bea4b9b396e6c5cd7f7692 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98c190353b56de80055506c02b45fb84951e4b63d7e1b3cb4095c974832e320 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bebe35896ed5e5ce45ee6c3acf84008ec71c0eab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f4626a1fd021ccd564d8f637a45d1ad5f29bcad0cc05cf17286df50bc73c78 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59554081d859b1ab02d4cae32bf7913f5ce185ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c654504d1e7b76fc40cbd2a9a6fe00bfd6b85606b40bd2be8ff882345d3c38ae +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3038a77f5291ddce2532a84982b2911f45bcf506 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05acce9a70c08b1945a7b655ccf4bb39eecb3db86dbe9331e9c40d7d0fd439a9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..287f5b94cbf2e145ff249e52166beedcb6f57415 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b55162375b643ffa0463ec7ef17a98001c8b7927650eb6aef2598ab2c90fa43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..066997262b958f3a4ac6eaeefcdba652795a2f26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe9640a240b21de39afbf37470353f984022db6693e6b383c27512babde02f3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d21abf7a5bb8d6762c84a0698885a71b2d216f01 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ffd5fe29ef355fc9d55d3e3f590c3ea1f618df1c4de468c72568fa8f81b6a38 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73ce0aace9f0c35ee4f04ec699e88bff5251bd2b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76491eb55161f20e30038340aef138c92f0be86f7f53e56480d676e9de5a563 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c8bfa54b9f866252bd7fa0e6bf1aeff51e55ab3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182c134a5347c41cd483cf5a4c1e9f7d69cdc9214e2dafce3302dc6b8f4734bd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..334f41664cb7efb70070caa59cae1154d4736808 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057f0b2518a269e9ae13ccf0458976ba804a5a344dfaf90a261947d6261e37e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15703722b3865b4c94d7adfc41f0dc237e41942c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077daa47a6d5da07c834d0f1cbc01d073ddae2deb1131ec41f3fbca1a00f261b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d6afae1304c6f8a578820e5656b1e34dcdeac18 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:099b4578fdd99465bd7209b3994729c8cadeb14d025622830c5fb666c261a5d9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b7cca851513b82847a695fd1efe629a36712a0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddcc7c32771b9b1cbaac9b081217facfdbf76021b307a3d18c27a671d1271d76 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e00bdeaa984da94bc3372466abe8e87e0c740981 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5eea7add0244d5e23ba9281c3605280438cbbe75ec1799bd1eaa9e1b8d96755 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6a9d29fdcce4dd76fd619abfa471451fae17545 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96b9ca87bbbc72828ca8258d9ede2f58f454a225de015114424e77ce3e7dcef5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ea93da6f12312d57cae045d337771136e3974ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3240091092bbbe4929ca876048e4766f0f320f07c094cc52926fc534ce7854b4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..373e932069cc5630fee2f58cfcefa5f3be1af7ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e3cecab98fede291fc4553f5a5d0601ab1662968a2f653e6d5aab5aec85fe2f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74d5fef4d33649703eaaab3567357b56e93ce4ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cb5eb7f09992b54c1320d4524339ade0ff3d87a5200304d9d5f506a866ae3ae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..797fb86f028133210a54dffabcf12f7795000a9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb35d985e7497a356503169b9f92d141b8ce4b67556b855a813212d3580542fa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5781dc3b287b58130683b9770492dc0fa91e6846 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c30e28d9f0b6e9168f67bd688bd8be7afb6eb235f2e62de56759af7dd71c914 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7360c07f6e05c31af7842206a1c6c798bf8dae8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff68c6e1bb0ba0ca87bb73cd5d6e95ffe413105eb3745677a472500aeca19aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dced0d531b3dc58fdcfd8563176018bafdd0e900 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a952129226fd18fafc68a32dcaf129491d13eb27223cbdbd2249833d6dab452 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f82c45c2dea6bea10f2542f6e0d5830a4e61a817 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4ec612e0b01fa3224600f0c9c027505c56093e1b1cf3f2414d573d62309d0a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca83e7e196b0e74bd8e96f89334102e179ca80ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0458c16398db7762fe3ec7f94de5d9b5b653afd89f213fd5f47d154c273fe39f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fbce22a88f87b05a895fc73417c63170c8dd44b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd6144ea397206c192cd517f8335af632ee899055583098ac6cab4701d17be1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..863d63469fd6fb70e79fd6758d348792ab626838 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb31463755d573d37e6ac7f8d5ef6b98b1930f4fe89f0e396d2126e84fad6541 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..270e31c22f4ecf55751ffa098e3e6af2926fbbdc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52dd9a05d09507aaba15882fd9c19c2041ea551b0d9c7889f7e9b92e82399545 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..706c6bbbb2d187b8d3e9981d3b3d833a224e555a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:757677ba20296ee544bc09064eb28e89b24dc8552d5935abe7fc40cbf511b877 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fed79838a9ae697d7f6c11acbeb3b0787864cc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d3925d4a45456a8318ba12ca34baedaa6e04da197e6b722847ae19c9ff79611 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ace6f881ef7f762fd77cc90b9b9bdaf88764820 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b066b513393e8d5599c7cf9eeb28892b5cfba53dee7ec9ea72f74cbaf909e795 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..411d92c55150f627d7be9e11f9e470f88ea74619 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:199bccdb5b0729895012d037e220bb5d1782f835df630fcb728641bb9ea99a97 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0f14bda0dc01967419957b01b15520c2bbc0d4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:646bce81c1d8b0d9351ee23fc3cf1dd9725d357ada3fdafa32d88b4672471c3c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1320bba7a8e0f9a94437129b52b4a2646af44040 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:709c0b014d3da4839e4832d744eecbbee2b263dccf4444583d8ef9f40bc61964 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c8a2f9ae722acf18e1a5c4f54b51e92b8dc2ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf03d56e6a5bf27e34d01ea587d6c5f39e6a888bcacb50acd678ab05e0b5105f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e76d6c6a5e2e334f938c33571fb4510209fe81 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd5bf9bb186370bd84e3448efa59199f6c27cb158bbf887575d03da3138ac64 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f99f9d4f3b7b9195fb6213dbea398ed7a985be26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f48d70502f91f3c9de82101b2b6ae80ca8680f2bbf0dc95bd0e27b9b6502b15 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5bf100889c69af132e61289ed910da8d4359f6a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8b998277d7a50c11acaad9390e99b3bea322f461836f18f2f62e68b79b2c2ea +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81a667b278321830dcf5b71b4379efece6d277d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f44625c01d9d3a5438256afbb4bdceeb8e6c45cd65658ec95b61119afda456b2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..125c67f9d0d32de81e2755230972fc4f27f11e3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de0594f446d0366fe4786a178cffb5e5947fa81230c5fb85d0dac117720cdc6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee6a3ecf5a2713095c6bddab9e721313e64ed6b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700de9f477a289e5eb93cdc12db0c87c8be7d3d12a80fcd2882af0f2c03bdf5d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6527f968fb2911995734ffa50b9419fab6d2411 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a9225c1811ef1e10f4298b5af81ee3ea5d2c2450486065fd28a53c39169cf6a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fabe01f85cd8cb714a4715cc2727f366991dbc35 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0eb09421eff4a967afcfb792e017e2aff7bde1de83e08bb297f7759dc050cdc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4e0d7da31b8edaaccad30f4dcade1358cb0194d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a05c88c672a41be635d2c4cf0cd8cbe0eeddd76e3f7b5f68acbb06f53b352de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08e0952f47f195a139bb76dcac2796166a6b56a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eadc843bc701b4f1ecc4a4cdcaa9a0d250e078a67dfa61317a375a186d3652bd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..485fa9c8be18ef33f511ac0a0e9e34c5bf461015 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79275462221bc2eb5f5fabeac76937e7c62fb3c0d886e08e5876d3bfafb919c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07a1debef216ad3a2c05741bf6bc3d65cf837f5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99c355af6b17c551447f1f57ec2179c5225ebc73c280c82bb06e8065fe29d0c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a18a1ca02f606cb1e5fd88f348fa2fb98d8e7fe2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284e32de776d493fd2022e5e6ea82e884280abf62d72d59db36f1d43c0cb36e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84a3fa1cebee9a27a64408bdd5b6355b69d5c34 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63117f6f5d3f38590ad23188717ef976813a273fff909eac88d58b626c1c1d71 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..533adccc325b4b7dc12c7107e1b3c80d3b9c5851 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21915f679d470be45de9413fa9a7f0b6088f615277f67f10c9e5a5b6344d4696 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a905351a029860cffd7140694331a30060f79e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd92f0ad67dbc107a1089d9a9dc309cbda46535c465ba38050529d10d3eae691 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c7fe4431d78ea91c456904ee3ab4b24474d27e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b003247693e23c2240ac9dd551a1e6ecd018b014b17cc370acf45c48938bbfe +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d11c82806fe168d3bec41943b165164631ba59cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b50cd625e011c2e25c3e56de6124d7b7dc40f6ab5ecf8779d4dc653d21f54c52 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17e771bbdb408f6aad520db67518c886d9530f33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e9b8f32f5fed006fa7529fb03d2f934d47a5a253f0271274f9e99b3619ff02e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bc943d2639f5e409e0388675235069d9d57c1c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c17dfc3577213eec275e5d2d27245805197166c15d91026158208e82355c6b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4b446373e2eac0d1a626854adcd833bf03191d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc98978e97e204559a2841a135699cc0ff9599182bb862a9161de7895ef8b2ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc97571acbd323f20846aca86bef6b684cfbc225 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:280e6154ab55d17c066e24cb273f648515e3ea05808b515b1f8471bbcf5b295d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b961728ea1d09f7ab0cbd9522ccc05d18c9d033 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e734b5a768f23e04ccae31ba39534c638c4147b48064c508b67c9372a7b9344 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..401f5130384c319ba7ac913807a961b766226efd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b002fa8e19e0d31e55654427af33f83932249cf5c94e7f293aab52da187411c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8f6942fbe57ce3dcb66a91fe76139db0f067518 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3974edead1e56aa314bb8f83b3b378539ba00f4e19f9a1586b8de04c7c173095 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a104625dfad7ea9d775a5f419e0114947f4e2ece --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef2aa39c809aa71018ce86ad3a1de565b431b7e6cf88938a542c6336d68d647 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9091859f31fbda1c3d6897cddbb0ae43eeba8ae3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2d58d2028ff538835faf80ef3d8e2a371d82b511e6d9c8b293bc05b1176927 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e30afa03f16ce9bc41e7e42790ef4442ae20a53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed118c31c09e5ed47a4583dc35ed33252c157e7deb3604fdd3061bd62b7ed27e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce18ed024a075af98e58aebf313526d06b68e3a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a1f1d07ede209e88deb40e1c8cadc1d85dfe1cbcefc840b8a2b8009e0af548 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f032ac9f16d1cf5e106e507e8b40590230afe53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f155ad6bd2bd90e0935b19b639252d682dd516207c6aa31e90af9287f0ddf055 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aedd20ad07dd617e8ad74fc8b997a9b72e24efac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19dfc02ad8ab163983342d0a53199cf6d839db5af746d7a86462989abb85f3c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0377d8213627c326ca001eeda661ac0c56fb2300 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:985223cb987e2ea0c30b72cb073f8af70787a1f04e81f8d822d4a23eaa37c005 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ded30374aace9127b3174a92457e98c67c549385 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b92b0f1ce20f118ea5f441cb51b2eb987fe66eff37ea5fc5d68f22044d3218e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a4a09357c743fb99968cc490a76be4462c80400 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:127c4df604f0cdac0ee8fa62b33d2abec94aadd38c54f6fcd60fdf191e1e453a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9afeb8fd9b8915c7acdb7d8d95de47781966d91 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb897c12ea22dcf706b9ba8854d0c950c2c3f51f92817e2e74e703ea5dee2898 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9e97d6d42458dd0b327af983c62aaf9c63df092 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3c0b5777f18e56dbfe44135b33a8b28a4ed033556d465c99f4742c3eebcc012 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7325cc81a013dafe7a4af61f50c57d76e1f1513 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45cd93a4bdd94289cc1cdbb45c7d21762edd9bd45561f6d4ed90637007d14c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e109dd423793461a3e9800d592fbe4f2e935a997 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e914ceb476a802b64623db1cb5b2e67491b68e1ec24824fc424e95a47beac120 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ecb2e2e81fea6a84628c8882ae09326acc1face --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7675231ff95ddce646684d95160cd864d5a6d91e058b4b1fe6cbad516ee28f12 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdaf81ddf6f4582eebc4f5ef584acc0bbb6b68ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980c24b8d8e845c4f25753e93628ba6cd0f0fd47b7495b7dbdf9459948671a22 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bea68bdc8e6e9e1785bb2daf378902e36764d10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff687e2404c5a760443b690db37fb0afaf81ca3463df51f182050903b6ad5551 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4e78e6c1ae8e30d9bf7eef02fe09ec0d070307 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:384fd275831e005e3e17a5b83d1ec3c9736d9fafee18f8a4513891c152cfec45 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faf6645b866e6f8e8e9236cd64d83cdfab8b6804 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603cb50b4afe4d36e684c70e0476cc35369f6e1dc248c62a898dbdb396bb6438 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c279aec439cf77cee21043908eb0ef32dd9650a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cc9de790eee9b7966cb004fd8cf42d74ebec70807ea9226f9d701dc44dca91 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7952bcee5ffb0eaeffec293c99070472da0c394a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd4f2de4631c5934eb0c923e12bba9e1e73f253fd3cb5cb38f8bd1c6c90faf8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd16a99582176e9efc034fb4d99deb8b331a2a38 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9beaa41594b070c0bdb68806bec0421231b57bf3f5431ba71684db9fd481cc9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f575649c03bfab6515d3f0894a2691d71a9a4555 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e3a9c3c4c97c5682c807404e13928fae9a2c7be3c4f37c0dd4432a31d6bd66 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..760741134dd857bbcbfe6d73b3a5940210db0e0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6263c292526ac8613e9a464c1c0c738072ac872a7c6223d0be04d9a132ac4468 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e68eb703a955276fdad2ff390244b2fc142b1014 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4844fe81cfe4198e98bf283be6f173dcdb58ff6c5e46ce703e3a470535a868 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbad2909458c1277199fbef84215a6461d916e3b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7851ae58752092b9a6b1529773d7e1032f20c76993c0ee39b8005024e16db7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbac88885a75031922693822ee0a03b8e012f2bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09971f5c0bfc3b7ee7c007d5ffdf50d04e3bcbd9233fc03670b540dcc81bca96 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4771e8690ece2dafe79a5a4cc306e6bcee1a4196 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721d6716b02e898a24544cc2827dfba1d0b80ffc179f76347d970016f6da04cb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3ff71e69375ae6e53fbf76666a4b21c91d22a29 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b45b399e92150fed0b85b941543653498e3fd8c140744342bef86fd587fece3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b61952e30a46eb0ddcc4f333280ef41b213fb24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be6b0fd5e46cc008fd5fe0d6a840c1a9a20c6f96086b2d01e5a0bc2328b11e7a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e742f52af9d26c5f9e29ae4ea02cdd6debe9cc08 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8241f54b1baea43233a7e364f9862a47f77fcf416d3c0676c8e3dcd6ddb81fcf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc75ecb0375508191d777396d59166a0875a9928 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2d54a6b496d2d4d392fdad389b4eac651976e204fb33630831a455587cab0a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d07e79dccca166601323cf495d644fb2dc58708e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9455f567d0deae3befd33d17594c3600951009779c111e04e2d3a10352c3a324 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88ef1a9a27b382b3cf6c6ca0406b7e82c44beabd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e18cd0342ec25d24796dbd3b409592c15f61fd820f3a04372d8230d9ccb27c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..206b593c6ebe567e504a286bce06791a04db2fd9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c959f6c73551c16ea12484987f7a288cc8189a8d8a5dd094d24c1a9453276712 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..029ec1f4c890baf30e9c965b9bdc95c2911d1014 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c3d8774186dcb52567b0f1892621a962a595f935f2de189ea2a7932fd459762 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca796a2a812f5d320de559e18eeca7138816dd8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a3d4b3b82c1eecaccc9059e09d42f068641b0bd3a7e9a9f9f05929e4478775 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84d4e5cd66f03586550a4f43f492b906a3d988b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a674f98a07a119a864a0da82a02271de08a84b05b3c8f568b9d6b979a1b33b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f02e20a7be44a155d03ca1d39969b58db801942e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ffeaf2eae2ba3294339fe428c22797ca39c5853f7943f37cbe15462363992a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..342f725fddc1b401207b22a000821df847d977d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b48c61b45b73c2ee44c01788d3f3951ac47d8bc5acf06ee469001bb941016bfc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4d536fd9731fb3387d7e6666aac7e4d40f73fb3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c592d2a9fcefc094447794fd556309ac116c3f3080ed5a88bb991fc22d87048f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b88e44b547b9e0eba5cafb2eb66e1df4bb712fdb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8aa77cb8f5fa7b34d3bd70d413d0e7a250265ed28325900a7b2eb20a12e0a39 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0f923f08b34118bd7cd09906fd388bfde42ef34 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8edfb4b00a13ec97665e8e1badeab006f531787973ae9f85e417a5bd24ff0e1e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23a981b0487ca353d584ba43e6924087063c7708 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04380793f85d90562290aede59afc6c8991acb2668a3cb3b0ae302f6478dfed3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..323eccaf8a2f8b78daffcef1ffb88c1f3cbdbeb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb1b2bb208c31ce08253c63545d890692a3cd61487f30ee6954b9c9d8752941 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b2923ed10351643f9638ab8673e8df8c9a40d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bdddbbf7aba5a7e8f9895c99180f5d0bc9c1988fbadd3d0988bbb590b28e1a7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6891a5d0f07dca7f915b533468559e1ec8e63d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ab9200a99831a92b3da275127c820a4f2b90bca2126f580257ba22304a732e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db2808144e7c28cafd7c64f2d8031d71b8863ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9655489d54217b51f1b1e9cf3d9bb6390868b395e50ae822529ba66dfd77d6ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..209de2d2fa9d5fd599160ba1b76d93be23bb2538 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31800f3c145651e0db41cf5f85013052a16812cdb16715b8775c88a1c390da42 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97894f937a3a6f015ff416b6a223bc1c61e4ea9b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de2fe3f43326231090dc7468a6cb82865a9fd3db490e3b6f937d3c97febe1e23 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eae8fa922968027041bd39d810d0dc69d989c597 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78fe239f28c2a33d85c24163df404efc8328f18831da4b9e7dfd2b7e543ceb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9e3879da1761c4734da102dd9c619b1da5d394d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cdd159a35268b9d7e6b669f2818b198817b2d9e3cc064d807296684d82a21e6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7133d384064f2e14332fb3fb9863ae2dd311b63e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea8238f257b67079e466a2aa5a12618169cb66d34a04f6896b8f2d37d856d3a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cb105f055395c49a7ad2996c2900bef87fe1aee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76609c6ae05a36c2e84c33e2307cddd7afad6419f905e8b65059a7743776023f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c81a4d4d4e9feb8d8424fa2ab94f49d7f419dd6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ea4fcce511ba207993b900be7c5aa1c5f73651b0329bfad888193e5a7f8db5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9368589c8cd045cc14765f50c725a5d2e0edb0f4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60869894495dee3909cdeca056f60464cf963c1e589318ff71f3d443b7c6914d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ece31e91d2f39c33b21363c38b48dc4cd87ac478 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e706545707d7b2463dd90263111ff09d7716492a3c6aa04a3e420c1e1bc7d62 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce656c8788cd590b0114d62e2909270d006d83a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c5bc31b4dd1f8a24382e0c18658ccbabac8530e569fbd7abd64f9b2db618b88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..611f596ec580c67126f3e84fbbf1f74dd59ba24b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c718f9fc1b05eb8811030625192ab3d164659fe56822b77a87dd1b6191b83072 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a6ef00d42cacf7533ed96368ec4ea965bd7490b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9d5d85f310233ceb8856b757cf1f3046fe4dea429038629e420098d0c4fec4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8c15fb0a762246acf018b5efa128cd560180e2d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:125fcc2b1d684a7f48b565c37ef75165ccc9ec97cffa99c0958890209a4c9d5d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae43ed6f7a24a7010109a60ed3ba06b9b4330af9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2be2a154a537ad48af9635e7ad4a5c50a8509fbb6c438e8c6a3d29008a680c5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff4946c7da4444947099e55620bd0c5f45f0d71a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b9abed76e763a0fe5b6e81b1d519f01f54e4d2481b721032a779e560d13dcc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e838a7f462773f3f5c24cccce7070bffb13dced --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a842b86ce0932a447f8351955b6b9882f315263137f786e5cf14d3158a00d3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6649f9332ccb4c701cc172c79653d46b732ec6aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4690bf7ccf90810c9574209ba46e561dff9a52c38aafdd8682c8404acedeea0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5f508df12900d092c836435b1a1cb291054bcbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3fec275c28de65b9223bc67c46c9845b2c7387a559cbd84532221f159a2ee33 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b214ca5d76360965d36839dce4bb3e5a845e59de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4172cd596568dea95c88f18d6d3abea40b2ae9272b6c7ca11f5465f4792db892 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c014d9dda6a67c9b8c6bcc44652ba1b4a971bc4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eba5569be2eda6f8b3f7e6ff5a3d5b752b2e9d4cf6d2d53f5ae3f66d1711888c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fceabbb6e204025f1871f41a6a6b5e8c0902394c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea8727ecfcf0c0cc6ae3a1da99921a7c7f3cf108602c99be5ae163b243fa222 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1689b8944ad2e11ac3509fee5e584bc077906aa6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b71b404ced1173b8957810827760e109f6248da86324a18a241be01cd3e1f64c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b9308b11e182c80b1e3b89f7499e11fcb4f897c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c134313f8d41d31ba5c4649ca8d0e141575201b65e6c43dc1b43673b906275 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfe3297ada9b50cc3c5f1d7b54e14d9a1982ddde --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8be708a24452a2acb6c6ce1e2fa11e2fdd688914042224cb68a90250479cc03 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..41a0c1c1506376386f9de8eda76249eb63139c3a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3bf9dbe39c09a653b380fe8bcad982ff4697afd8f151eb281787f9efd148259 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..902ecedca59724f2825d498db99b42265d57bdcc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8c90047fb6b8a092eb59968e8f8a6d9dc620d3d11eec1936a68a2d6f57cd5fc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6da369d94d3780705cbef7e71df5d4cee713059 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_14/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a03453908637ef5b8f76310fea4f25c710bf096bc134430e7daf6ccc3e311cee +size 11395