diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a70dffe0b0056b5edb756c03b1475f21c632fcbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d35167f2489863fa4b6f2268b5b3ccc9de25065dc3286fcd21e6a62d2fb71e +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..defd54456f974b90fe6d384ed0cacfa989503d3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5269cc232f1cf4b9aabf99918dcb87ea5772c2b4cd4f584518b14c7c43132146 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6b6f2435f8ff976dc728d264f6dc8a40c1b29eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b699b6bb4054e82d81b1a1efec7c7f404abfb630175e00a618cd40d8fc0febb5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..622c42ef6e3c10699fa1969b6876b72228e24c09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31eb3a88ef9069cca54c4c4626fe8d1f337aadbe1f9a8a62f412291bfa9c005a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1d31c7ea85cbe1ea709c403936d5a7fd261f127 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c50f8f1a7b72f224694b5b6abb7cc28ec478116d77d3bc5ad10364033a13b48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5b8de4d307b887b519ec87bce052b11dacc69c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ff80d45e3bbca40d8d1e645b2d852eebde22012e1794568d244d5aa6357349 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3482e05d5192deabb15b0f15ca631c7df3ee131d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3925caaff701cd815b47b317a362db5e27150f4e9e8f7f1fabbd71a03f24b05a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..379b6b1cda2e31a9bcf4f4d86b4cdeecee416833 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164f357fe20afecb0315bcd5a8a6635f8b67b843b99b80eb02810d148a03077e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4d7e9217b59d541553a6b63b9ee37f307dc6275 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d318d7194edd37b93f5e88bfbe1ad4fdbdb6d2cdfabc03059dc3588da60af59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbbc5784c8d97d0b5d9acd54ee5cdab1b78a5d24 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246b3f6ebe7c495ab85401fdd5b026e88cbfdbf449dd3f22788a21de9639f174 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd053cbd40a36fc012ca1ca3a3778b700af3912e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb1e84f7e1188691bf4e2e7af79429ee255b089033188fd1739f6d742c0109d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f627659ed4e0c67c8ec381e15e30d6003735dec2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:845ad30f8c8d0401c4670ee86f5e1839a6f2a12754193f689885574c1ca36147 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7770db64cb367128c8c97240e5818a5eaa7043b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c13aa27ee5ba1f85ae0035f4961918ddc2810f9f52943520d4746ac98fab2b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d025f7f231bb5bd38a716af44fc1c55024d69937 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68e81f7d972c9e51368be212642d4ba96d23c4730e15ddf2dbc9690bbd7c747 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2197b32dd2f473be1713168c6f8b1a8f7d0dad2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589fcc105bcf5ef790a61585b74496398a9ef718fc175e087de1da545aeba6cc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94440fee96083c07772d07e6494eeb880558a087 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cee091ba655c50aee42f4913ceb21f3f7540cf335287d2a05a984a6f124f38e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d064bb681d6b4207d56a18353b7dd00e52d455a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:873aa1f7e317e7cdcb423c55483b4e37b9c319ac7c5166f38fa83465443e6ddc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9060eb71bdbc74d21e2d4ddd93f63ec1517bd2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf21a68594833f74f9681b1fb24f641409d7c4efb1f74570825c006d52011551 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5124704d5bc03b76ef95e48a7e729e208e61f3fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ab3237f8354e881ab5de4e4b732cfd2675e02929c61abbfedfb746e1bb83bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..386371f9cb955ccb83d78bd8afb66e0f863e4ad7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d22994e846c392ee876dcd402fed8a0888c778c7d1a38e14fd3f3d180cceb3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e60973683b3245383e2acd162639a42a70727a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1774f599ff954ac1bd7ee2ca0b84a2679493c1815d1b2cb66c1285afcae3aa0a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c107b67c66053e92fd0dc41810fe8e70699ab421 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1694a821a1c4867e4f10a4bdf10d61f491e7879f799e2fe002ea5fd1e16b4a3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf1a3b5ca5ad6b5bbbca82094b678895e41f803 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b8dfc925bdcf50c2e0e704cd80d7ddc5d981f3a27a75987f135c2e3b1f6da3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f267f7f98c062df6c2e96d457097a04e1923083d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afdbc1d3105181fd1f6b5121ca2de2e3594423d4d818a6cba93da32c556e0fb5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b840cc6327dc0ee921b24189fdb9a75908437867 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ecc022725e8988ec0cd45904a57f4885660b8c8d512a41fa278cf7ab2bec48 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8cb2949b05b249e22d3109b1e44c3123105f32e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b88bbd952e0c8eb7235a33f373428dba6102468b7e85f64a05f6e0f3bf574b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1026a37e5a3a31a7701f8eed2f5f3579e3864e92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:508849a5691c557a455c573fd555776538824f644b018556cdc2b49f57c16bf9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0f1fd16b1f8850efe215c047a7faadd43e7171d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6795cbd56b06b9b93c4e2df395ea5ac3f693a972d48aeb57dd48a0d7a13f9b6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..687e2fdefd7efb285f622dde1ad80007fac3836a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3be8b8c44dab8553b6a17db1e5b3e64fcddbb1df7b56cd8783d369cd06c86a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00cfe503772682ef1ec48a0074593fa11e7179dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:076daa3b80f4fabb7c370ba2b2c039e9819cd3216ac1072cb32ef0f651e7ce8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ffcd2bf2946a7aa6ea7d87863222ec86f3ecdaf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5192f2baa582ead79bac35b31a56b99d25c909c2257c28a9a6dd011ef1cc8e9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..135b4a851139ad57dc6e3dc89c8bc55c45672903 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df65a38d501c5674a4b6ba1524bfd39c95d3b050a2d9a444d60d023b207e4fd0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee32462a8a00d7e0547a6638969c3e0cad362530 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c81763ee6fc0a3d8346dfac40a0747de993bf167cb825102b26754ef624712 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed6dbe5530f61176b59e0afba8569d1aeefce3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9a6c07daa6d90a2ba29651d57783238b67acd245ba24299c9ad938420b09cd4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1710605bc31ccd5294395ad08bec8884f2ae6c83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893c39bfe7a1a2bab195237381106eb97b4ba469b612598cf6ae6d7f9d84e0c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29034422b825965807e962e4ad8203f2d61ce1de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d648286b2a4b11ce38fd3a435c17cf1253327b99ceb6f8f6b76b8267e8b0e424 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d41b44a7d958eba3b612e67e38f6e41560ec00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5025ea7f8dc2c912b407137423de5341b03859cab77839be9e555a124066bb94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c7722e0d7e988a27827b321c18b78b930fd399c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de51704ba4a55b25d1354d9062caa6177961e5a57c3aad2ebc954a8df02ebaa4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83b476e395a4a0de2f274abbaf3edaacbe7b4599 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e83ad091c7c774de71c54ae3608b72bd8144d550d5b8abb2bb62d826735fe31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc06e2e04558212b17ccc722e9379b83aed9aa98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d38ab951c5c02a5e53a11fd6f200b16eebe0009aca914a0a0f4bc4fe6873857b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1be873afdffd72779b5100320ca0ac729c50fd60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:220ccf93816cec7a36051febff57ab57fe0dc8bcd426f5e2a6cad372fa635263 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f9dfa1be69d04424b7d5acfd3c8edac5fa7c358 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4077607b20ea69e80b54e7bad94d3af058875e2f338b41ff2a7eb1360ea8c94e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2c132d4b1f28cbc22f3390da27f51ff6de41fd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46861a26c252ea788b4a7a723553e129f4b8b58ce0f699cf53ff82bb5f974584 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf5313f7ca513af17f79e25b0a93a1ecf2498ad0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63b4acdfa5d792c7c1cf3386c562b8763ae795745ff4a1a2eeeb59ae7fc9025e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c68a575886d0e4a3bdb6570edf5c7a969c169f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e688b4b539966b7c68a1e7b925c1edb8b4031a3e89d4aa5b32073b7d7e3ffb26 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47b842a0e97bbd87543ce080be24f6c7a6543e23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac56b4d8c0330327566ded35b93c668722a6fb10e181be9b7d1f05fb6e0e25c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6042e22f65706f5ea53143568caf3b5b81ebe273 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f0d2f320cf64abe8ed968af31df26181f3e11134dcb4fdde3739d829c8c5c25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f988e5c0b1ed61397097506b300b24855629714b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d19a4520ba92f2eeebe53383073c141e027a490104f2b9d1e3e52aea0217f4fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1b462781b0deca8573ad8fafff62f162d0d3b17 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b18f65e9174fecb848e9211d24ab3d8522e9ea77092878fe9f2ce37955ed8aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ae4bc3d0cdce4c285469c3f6761f878e882222 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fdfc62703cde8c343f44c39566325bd501606f0704238c23cafd3ec5f3ac373 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..843cf1984e2b913cd6a2f19d9bb27b95d0a84014 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a13fd99f719b20af948e12307214bd73c601ce11657c0bb11290952ff86f4db7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06568ea2d0910f849bc210b0d770625a78e2f730 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ce99b6585b70f9187e6389c4f5feaeb6b78f26c8d234763fd35687b1f477e4d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4dc9cb54e2db4f51f044f969fd16973c5d5f18d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e870a7759990bd189227ff2dda9731f6c8b93ac89a11aa3fdcbefe2244814ae7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61180aa663f389e080ee191c51f5a3e990bac657 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26042f772a9f0d028ff08c65f9f8852f98c84f626b4bba7c8fd09f43566f33c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e8b6bc7909287971f59adc97f64027ca112180 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eac15ad3c46590a43fe8865b028b4f28a8158c7978143af5ebc5c829a194f38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a9f87fd788db4d915b2677a0843f2cb2ec74db8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20395142ff218989019d7e1114b6e5519603816af4599606e93be739ada13f89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57bc6111e2c56b06dd8b862ab6fb02bac88d2a3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a730453a39a5037d8a2d32e870c1c49676da557d4211f1dc767a41735e2cef99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9685670262c4018020f41a8c1747b9b188c26db9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28a1c327a97303c29b93277d91599f59ae17a0f7900d80d024c64ddea53f7f54 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1a4f15282a3fc95c05b7f591c5f918c38e29719 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f8da503d45758be2b3de0de7c878cdee905ce50de9b50eb545d87305c664f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebd3d021942067adb386fad097d3630e25de43d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b3b130da3a89418e9bcea53d6d4e8bb92e15162697c0c8cfffdafe04c19cd52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4812bfefe1d038df750c2e9b869ad3a44279f451 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b13b985ccd98b67ceb41eb3da0f13e274d8db15e680cddc2bf8d9691da06f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd99b347b94661a7e7d1fff6919d57a8175f3331 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9adbecea6ab8c12b2406e9989dfeee1c972fa2f901f0da9e890da28367f7bc3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3eb188d8c5c81ecf251e7978b813f61b0282dc8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a67211aab7c35836b3a05fd1358b719679a93775d9492faef91cb212fb652c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..945405d4a6bb55688323485672b13437728d62b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c180a99b6e5638f33d7b0c6b9c66ab176c5bdbf7632b60af94d1504b46e1356 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86063558a62e7c4f2fd97c1b81bdf5e1576c29fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:193976a588bd342ed3d4dae7cdd01b6e8b9c418562aa6a66190a038ea575424e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7df2ee09d0a2385fc2648b5d5588fe7ca5f896f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfda1b98c248e2ebd5a4892bfd56d8516e616f1507608da6b04159f67d978859 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..287bffa34e735bb9646997152a6cebde3bd5d97d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dbf6e3372684960f9c8629d09b17a6f99298469363b0cd0dfc8d6d5d8989662 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2602aaef8357399eba492cf1ff97191725f5f704 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c089410d46d57ac6a80201b2a920eb728911a0d0561c18cfaa62297087fdebb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b19f735c5a039bd4cb9556e937dacfbfaa4104d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37398c0c7c339ee4bc9107e66febebce8715124b061df15a45a2b5815eb23759 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f9ab57ac5a284604a0e5f956b18c0521f5478a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4a427903e816aac1a6af8fb6ca5e63dd06ac42df5823266a843e2395933b87 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43e3bc8ec40a4059196f73a3fbf94b13ddfe574 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4be0f79ca41c662b3cf0875b3712feba8aa0f1bda1412a30d4d20ce624f18b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fe008acd091245ff89a16909b420297ca8c505f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6dfe7b76404720c70a101a4fde97c1a38abcd0a88d678c2062eab11f8b982a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f3a118aa5d8fec1a3444b778e4e6712ecff5ac7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a4bc8d682342317e2e3e0357dcb5938f4f7e04bfd23c73815cbd09cd8569e8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a518eea2d0c22e8e5dd4576abf725b521678c5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8437cafbd04b3f19f0a3ad6edfa6fb66e514bcfcdf6e067fc29e2239d3fdc0ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aecc532960e773f8811dba5f82920ccf9dd60b7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2cf221cd4ecfe479051790c3c9836f1ff9d48a60b7e140144239a98c4267b24 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..613e659ccc82df39f2f4456b2ddc7e1d133e1cd3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82be26e3924e293362ad6b404e6c1a1614ed5c50252f8feb9f972ffb1663ad94 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88ccbd26ff02c0f816b266bbea3051a16909d32f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf064d16058e73d073d0ac5e45fafdf69c8bf90c4d440c28bb5c6fa300b9ea50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23a88b34dc3b1607c52a6d3309815525d946ca9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebbe27a88661e4f37be24d54ce9dda1d3ac56ff91d75c78b1952c4d2ca38d13c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..402671bcdabf81183b8421a79a5c54c4ee338e55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15adb1b6f149033ceb4405d9ce18033b709936d9df314e089da2e529411744cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..128bbc7d4a314bb8f60dd7475ec6f15e8ebaaaf3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b890fb86c264c982c037f7297cd5ef60c58809301b381691624d32b2489b5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c32ab74e37552f4dce99f1e9775d27c0f4a0b0ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37c8e07ea16af262b760f4ab8a9ced527fae50b3efa7650b66c826acafb6f288 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b849cf6e962681fff2e2beed691e5b522feaf8ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:876dd783ce499c03db3c7f3032d1bcb501e76c2ba3a75b05b891b94f296ad738 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..124e43253c59c6fb5bfc4cc3e5ba3a5d2e89d294 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d55c9b82a5ef2c77f5f556d2af790a67daaa416298894591ca15ee0209d16e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83d715eb8480295f66147771700512a8b6ce3b94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d9464f5ef40bb421be3d176db9ddcd9ececb60a960a0623a63086e9b001991 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68daae1c73fc9bc3038857438b23497456dfddb7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae5d4601cf3274dadf438f84894ed4e959c0cbf2810bd8b346cdcfa1a4480df8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b5b4bceaa17c515989aa01f083fe0bfef6f8f06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f71f8a512847392d7300d23f9f55a190325b7aa03a38f6a04fa4b2e2c466388 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94e4f4cbf07983d48688e1d66cf770e5c6cab37b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edcddf0450c3e7e86573be6b96977b22d92783024d3d0280fe4a08f1f8197192 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..870e95207ed93dbdf6fe69289b5cfd774e0e9573 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e76a4f46fa3ab24e27362b8da1efb88a99403b60fa8ad26727242ec09d7539 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a826d38435b3b389ba3f823be007f02b5119312 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3cb2cd43d20a07e0a7dbbd7bb8d9d0689548e4e28bfe97326b1fed3c67b2121 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d5cf723045c85c442eb90432c69873cfd30a151 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28990950919913431348f02bace242c398b6a4434bc2681dcf23bd6cc0ad188 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a2005b898e54e9d03fa76da09c07a3480fa25ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51c7ab98b01556091706a4ee0ae57c885353c8651c4dbb64a1516cdd032c09d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4fb33cfaab6da54d400aa950a88be5e382a89f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d796c555bdcfa0891daa11112c48251fcb2831fb1ff56499189c4041a2cf8b3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0c1693c52a01bc4ec166824a216826e71d5a2ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11a5441897bc86777350f7524eef5c6fadd6b1daab5de63f825f0e0cb0a64026 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96060be7e073642913126ff86b511f13eb09a01f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621633e7b4802ad066c08c73b2d1edf6955199ea248529348588948c354ed18a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4feadf9b42a8f63a4015cbd2116a13f1c2d0ac7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d019a07da8d9d7784564d2bab02869961a6201881f772c68ec2b301a24de201 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..733dcc1cc50c8d25254b9961a8f27baef641e976 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab9e7fc71af27e3b58941fbe53f56687503a2e9e2adb3929a14d9ebcff704146 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5344b48b6c75d1ac850110a614eeea721cdca37b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f53e4a5df1536993049a9ee05f085b9e6e5f999976edb6909cac4fca8e5e1b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11dbdc6a8ecf04553c4ac13ad1e85afa6091c586 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfac744a56a8cfd70c4444aa04d2287ea613fe68aa0a9ad0d09416e8c525654a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39d8fd8ebf76bccc4c3db0846e398c27cd00eb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd3da70ff4135f19260ed5cadf795bba26d2450e4b7de0a43acb76a2cadfaeff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb1b27c7ab7c47d31ec6440318010cf79ea50176 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c76f129b644ccee54e97ed4bf4cda390f5969f3f173d1ba9568b6e84e79c53 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9249972fd7df337172b99f033e43c237ba4d27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44005f9fb5fdf73e9483f101294483acb6abae94c2712d5098b4af8f8461b269 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f2e38adc9b52e0c243899bcd9ea85a9b7d696a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0775845375965b5069e8acf8d6b5ab3c54cdef6984088368c2b02b944300b85c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b9db0ed7e000ee6573aa49d681cbd32094e156 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577e9e582fbeca5fd4d516a94a651f621600bae72536625261edf9a5381ded3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffb3d4cac1e5e47830b1856e9c7d303dd0029d03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9afdde34b62cea1b11c40849ba2b7cd4c1ae9306138f1d7449fee687f46a1899 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d90eac86156d56db3dba8aac8a15533c54f9c0f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6808e4065986c85ca4e65ebffe32a8c690172286378ecbf27dec908380a478e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24617362d22d565b5a604d264872524325cb877a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:805f35ff044c6ee562f5c6a66252670cda5c5529b3245ae0b6bba7766a269092 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d8aa3cf81c9b08fa23ac33349c4cdc5d2192748 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b2bde19c82fc0bfb1772cf2d94d71edd3e2137358087c9011f128eed2847bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea7050da5947cdcca5edbb34023eea86e5dff19d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6753bdc2847ba0c834084c6ff73876ed568144cd28b7e7917368d15364dbaacd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8ee396a5db03565415bf5c3f93b9be55e6c8c13 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0619ac49fe8bd250ac9a1fb99ea42803723227ee174bc24b96ef251c14be4a80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9a05c21162e6fa2e6675116a0ed152c927fa480 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ada7f05350f8499a49d4e380cc76fcf928484370fcf98d5d62361ba0348b487 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88faa1d309ee0b4bb4d19d75002a622830e5fd2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:903ca33578f8fe6d751fe7ab902ab14e04891d43dc6eaf59c950edd8160d7b65 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc50b519a9d92cbc34e961f71d0b75247c0bdfd8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b526ed2aa27733e620b6c3afdea9e784e235836ffa7a0e0722be6d6c2d01b088 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e57f86ed153950d6f50875f68a4cb624340b573 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd9efcb8e5ddc6ca8d0298d144d0cced3ca32674081c777ddcfb15c975891a45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75fa6ef6b5b9cd99d9263289ae5972f6b7e7d4fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b004a8fcecc5a2741d2e8d16e8073ef2201af43574d8541e91b70fa9f3f0ea71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ec6a72b1c0efbbea0ef6f11c00f54293296f310 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ba543d6d301616f4cff4e1e6824856179010bd4c2668b2628540c35dc886c4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..118c31a0e7cf24c8b91f9a9e783b456637eda202 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b2822f4e354ec9c6bfed42f9ee62c5d3d05001e5364caf994cd397f7fabd64e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3877495cf361947f53922775ffd5e33410095b8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50562aa999cdbe573596a8526fcd9d949dd67c778bd4b2654b3d6be3b4296978 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d489f171742ee8730af2afa4a0796e2aa5f50240 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050b49b40c28a280354ae77fecce612ea18b18975e980db82128e6f82f8d2ddc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ceb485ac4a4aa89827dc314ba3b2a3c951b84f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9046a48a9e13152f40dca78cdc15d715afac9a7af6a53d6780768377e479578b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7840d91167a53d165883bb9122274a62c455cf8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd17ef30633c36fa8b6bc025e9c6f2502552d213b08c48c197e95e021183da01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad392684147c07152954e9007ffb47083dc4a3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd195ef31c51a33012a8cc5892c77078ec140d5caceaaf89da8ced62d0b58ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49af0c5b9c45333698fec7cf273c1b0854cb09d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186adb96756601773e84205ac3bb02fd9bd466ecce79b86b942ab731f3bd5a6e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..de5dc6f69c955fce4c1e3fa03d52e81a1691ebf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf9ea3eb91144e43c44a61ee3ed75cc6c79daf7d69a980faca4bf1be97a5278 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c416af4286864f8c88e1ee74089af28e04fcc50d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e4b031da68b7ce32b3017f0f6c95d2c4009dda7feae9f77e77f14972651ab50 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9cf0d8c41ddba6146e4a6540d4e163d918f9f87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24955e43b674ab91e90b9652c0c294f93ed215052d69623325b2ef6e2b6a540b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc6ce8f0fdd515d262e3e0aad340d544950ad1eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015e6d2084adc8f7fc16f3777c7ba104a99406f1f68fd3585acaf831b8b5b1d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf5a9f62001d5897c92793665dcf7538799fb4e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790f224a44414e51539b655cfc2a1a825a05d65bd9dbab0bb9ae00cc6bb57248 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb7b6dd04755592b83e19c0225d12ac6760ed303 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0554f3f81f0f5aa7876d64f67741d2aa46e9ac6bfc521537c1a7f4b918bdce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fcdacda2e7578865ab48b19baffec6d9597eb5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18c13fe465f0b091749d1b148a006a63a3fb1c7c4f49f4ce7a4c429ae1fc0c4f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0203b5ac3b4580d3450c47e881c060b6b67dde --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f947bea76bb384f9ee1bb474cc47d9ccf2dc241a652c720dfb8c4804b669867a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..844522aeb394b95f47a5ec4648acbc14a5fec010 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11ffc55aeb114fb0873db1961e8f5a93a4b01e2d6e808f1f0a23fbe2b0de3b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca4fd8cbaca6f25cf9bfc65d2a28df12fd0e555 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e10ebe55143629888063bf6229e1705e0da8e6b460703f9d3a7bbeabe98100 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..803635a0d400ba8823d9e1225627369627a93d25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1343bf9075d14e1e0facb889fa5bdf2f7e92ddae9be4540d9dbce22a8a277c7c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5beefd1732f864e710b24aa158b9a1c1b4240a08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fac2c918b224f7e9206e43a436535e301587deed77a40b7dcdde25fee6d990f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a3aef59777567b533c3046b8bacd569cba926d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ccd6d516c1f0bbe951a48c4111a4cdfa1e6929c78fe54aba7a277a43749600f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72694ac2d3e7d9e680634b929ecce049efd6d80d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1cf1ec1364a351cab6db629068994d9db036feea960c7ffee054f25b197df1a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a963b8af528eca2d3bdeed6d91134341e6cbbf6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c44bf7310e7d9d7f5d5ee320ed8765ff97597f9661a9e8678f44eb7b3be182 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a79ef94dc2cd0f811c13b670db19667bda8358 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458fc496993b9ead64e8d47139a4a8875988507d1147630f1ddc3329722c67a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a401162d30499fb4564c88a63f0105bb23d53a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cd9e2931df35a603c315ed899f7b967a16075a6797f625430134908884bcd51 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30df3ffc3e0b5ac0a04df4402177e368cf3fd083 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f12cd45cf0c26636c19f8a6b3fb7eaa1d0e02603660bbdc78a5b2974bd977fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1489700b6a9919a58f536493e0537f9fb9c96915 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af25ecfd042adbfd5c525c08ecfec7f5f686e0b0beaabe93035df4f57f82d002 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c52d53efb5e366221c79b16f19c6a1c4accca5b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48d85f06c4b3aebe0b00cb17c6887157c043c540744babf0bf0560992460589 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed2fa60468abcd983cba7036050a7c59189a9e2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adebb244080a65602478346951bda09d18a9835acf65b9bf792e75ccc07c5c10 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67f4783003fe49a6329074aa41bcdee151718552 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f58b4aeb455644f1c8026adc1f385217679b1c0e9e22986d2d4bc5e25e5883f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb5bb9cb72ca60b3ce08b2f3602153a62812cadc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1cca7a38d27682b7a2fdd255bf3a8a6035cd753fac307e051c0e21f2c5c4c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6834acf168c797a486c1f0bdb5ac68ac5f098fe5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3a3998e941cf473692ce5c081b7b136669cc1863a30dfdecf364f42f22813e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5140a810f21d0a7acd67c4a723e3aa62c44d61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93a746b5e7f0d07036afb77ddbc9fc12144f3203159f03db0ffa9668fef87b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c33b588b67e15f07ffad89a2962ad8ad3055d308 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3deb74dd7c7d82da7d3be0c7d37f113c65838690f5163d06abf2acda74720b61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92243d870526c2cf1dfdcfdcfe04617941c8ca5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff2bf55ffed5c3fd8f2aa66849769eef615ceb93a2f223eb28bc2b66f42796b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba469c2e29c6c967c0a6fe8080d2a9ad3e91e23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea83755027ea0ddb11432dff0669def0f70d6dfff0b2edebf4542d99422079b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b566660a12a0834cf18738da09b65e49c1feb3c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c557bae60e7124de0a2afe5629d14bf2d9f59a2138968c1ef6b5af4dbeacdd48 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8da45acfc3ef52d1532c91b17c304adcf2a32d6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be5c974193be636d1dddbff78610500347602d5fbb07a0bd682dcad6d6260ebe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32d061891499aa42faad2d107add7629babea278 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6771d84340250b7cb49ba7d1c8f0d985efa23f94772f64063b33de7aa29099 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38a40977918203898785caddfc3a800adb97e91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af571552d1d1c73a091a81e10024c50b8d482790f5211d7bfe7a8e759d75f5ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c270c9b617829ef15b3e9cf21b9d257482326f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20980a87d1687c0fc0b8c2e7b23f40743d41f7c616572b91614ef0295dfb5faf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fafb80d3cb68a1b7acde139de2a0f0801bd7062 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:993498f7b5fd733b8ef4e2b9357f8c25538c47fb42d42432e418efdf7ae12a5c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..898230f595e84e1757bca43395c4324a9cc467a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1268faf06026c77c1732a47357586409ef4064d67dbef8817883e8d44d5f7fff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf315a25fea11da28de0b612a2bec263d146bbb3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c8a463c71a6daab9ea7e0848ee60ed1fb1e62aafac510424236c569c1ee757 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..314f5ed40332da9a84d345475cdcb71417731d80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e9420049f307b9783921afaac29b042d9f858f5ce0488e426eccab0966406e0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70d6cb204fb6f7d4a32be918322fe7f4ea690b6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df9ce15f1117ee05b175bee400cd2a5c1bf7b245b8ab5556703794744f10d65 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..099f51a7b9d1cf853eaca0e04d701ba851aecac5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c441cbfcc9e40281edd05c07e2b712437eede422007226022b43d70881453f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dfe3d58320f7db7ec79d1b24cb1c947cd95a0f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21de31df549ba7cb878408c9f30ea2e5ab06734e6b7e4e2a96efa7a721aceaec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eadb6bed8c82ebc24f1e09c75ca34a498c52da3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb4d19fe2c807ed495adab1126fa961226348079053ae93d736097cd0ded6c1b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c33c11f5ef0437fc721bf07058961d1a93093216 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf49e1b1f864bcb06a475514cd654eb09ab5eb1fac70fdad715e6768b429e45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..022a74fa78363830de3720fbc68a78db284a9a29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:481c56e2b157498b7ead30a55002d371e2998010193bc4f6af4032ffbc184a8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dffa7674f1fc2b01c9354019e2ad430493d8fd6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db0908d86af18846ed6a04e8fea6c16b0441095fbd3717a240b384a7bf87c02b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67e62883206c1fc4d671df783db3ca3ed5caaafc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5abe39159d2b9e6e5e0b1d093072814e48bc87ec8b85d7cb2d174a3933bd5514 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6806577e59ff061986e77fcda30c78edddca1ef7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c711890dce59f30f710f25389bdfae56a93ba8be77ec3bf885da47a5a20e68c3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be534c450e9eee2c6b6c4669c815a8fd27ba1b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11bc64e62e28037df22910bd0ce49ec947fc2296d8b3d8cbbb2de96fb3a14c4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b93aaff114ac8c6fe1f4de9aacdebe24c42ee58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49baaeed31a87eaa4a6b2845baccc3c6fb6774e25cef4187da7ac97895ea8fe0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33603f0f0af8350a37daae0828889bd81fb7a99b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0dada96c241a11430f9d643a442e229df062f256b3ab1252d9b6fc0ceb90fa5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..962fecd8eb9c92736513f7dd1aa2b9c27ea2bfc1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e932b023c5dd2be07484b5aafbf278f3df3ec8ac69d6b384a8aff1fcc8653a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..22aaaec81c27782259b293cf944bc9e2138cd2f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:595919b50265e2c59db9539c53deaabaa8b7c88b43ecbad2f3b2a2d00a7073f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b48c9d3227cc6cbbf0c6eddf76b77a061d61428a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff4f4d5c51ca1c7bbf12b1cac09894153be398498e8d38a37cb1f46e5a11929 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c020bbb78481b913580d68593d066948ab643d7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ab16ffc64edafc2e233932ebd40b775f630529c1d31366bfd6ecef7777c71c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b93bc9ad51a9ca12a6e7e0277d80b86c2d95bc8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae22a843b9e86b4bae6c820b5f7f0970cc797cc961a823938eb605b6e4aa8e5e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fae3c30e7ba6ad6f5eccdf2b17e0dd0ebd4bdef1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a6c53ea4809fa8f919236ab8356aa10f7c0dd9264c5f6cb2ca8e00c3e44334b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80fac005a425a33f8fea3bf0846618de5c856a41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0600060481ad25fce3e715e8e7a0f0fc3c45fc95ba28315419ecd63cf99ffb64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5315376777e938ac93926f48398ee8d46489cfe5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f51ec628b6bfd5ba04b023b4f2a9b0e845893ecace069c3ac2b8dcaaa5e73a2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..455dc3f4095124f2169adfd566d6fc0a311809a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6537578dba36f874c694b435c885f644850883dc65e0507449af44b513f231c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e2676118f54fe342aac718603db2c0726b176d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cb6c4d1c5b81ea9977972fa01fc754e4fc6f576e482d222dba8dd9f96719599 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3898f7c5c9f6936e57040f3c52a89bdd612c3431 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8dce7fff487dc137ab5ae708b4d6e53966f9e1bf2ac35737cced743a656897 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9430e1e1864e4e1f49467ed5026d976116a527 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b7ef8ae784e46795755966433406155f4f9ac394b5bb9ed98b31fd3d7e12271 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..25bc94cf6ebb3b4ee34b1479dc43c526cdc1be9c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663d08909abd623120e9495033470fa46ca6b3505a7e76dcc2131b62bab97d6a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf6013ac7a4683482def49c3a635d4080106c47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe6ea05d91faadfa4a3bf298d873a534f79ffcdba0ffffb332b1f9a02c5f6b1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ace75d2c4dfbd538dcf82f1c862ace1d9a8d429 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf5343aff0d00fa6e6dfbca40bbfc061d65a139683025b32d1418d72a681930 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06d9345ec8a12eb123d137f488f1c644712ab4c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae80ba1e8ea1628dbadfec25361028c419c8df1a6f678e508d522055198c9d11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf4e5b1c3dc1db2d0d96e66de0fd25067bcbe109 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5885d2a142b49baa7de0dd7b8c64644886c1545041a8b1d1bec2f81ee43da6f9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eded38fa9be6e2f5e203cd2cf77411563809bb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72991e5f4870077b94be311c29f1f9c41f2ea62bf45d57e131d6243070cd913d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c47e48f1d90833e96b5e847c798762aa62ec390 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa29355d8229084b24824a7597d2d0b1fa087c6b43ddd703d49845ca6282f3e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1be9fdf5284ed595e4267be8038fe03dcbcdaf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ffb32fe6ba67246fba09dbe462a5037588699d864a8530411a572ce0929ee3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a1f949fb9c98c55d8b0dd1ea220fa53e63b0c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbf3a27eb39841a5370b04e7c4bd6306118ce8b0120df9c82ddf3b41d439141e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53ecedb192b97326a99a2cd8a0cac790f51054ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35c55c4ccdb3815fb1f79b48d82147d7ec8f590483925de33511f69cbea1df8d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6bdd919283f503a5660b06e7333775f816e69d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122e6b54883a2e58d8259a450a396a9bb6070c12155e4d41d14bf54abc568e8e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c4cd7ff71ba45c936a952cd4908cb10f2670e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73512e58d838f186cf5332f05b8992cc92724c0a04246609052a98b9933fa0df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2b61196791a5b756c2227edccabfacf8799d325 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b0fcd1c3e29d79d0f444127e0f5050aacd0a6319ab509c7d3f4e00400fba73 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..041ed52b4f12cab87906932f3fc2ab466088cefb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939440f177449871aa1c2911f198f974ccca6f8c418a887af415d8997fa15bcc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64900c9409c2eb6b60871bc1f216d4c1bbceffdc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31019b737e99dd4f92df9bfb9508d02ebb240ae1fc72fbbb5fe818e535a545ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..31ba7deade7a531dbe4df74a552c77f7a70ce21d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a813bd1337589cab9c9b191860e99c5d62c3aee54345c8b8842d6a854ecc89 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..059bb2aadb0a09ae653c7f961d718b87de8c4aae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79eb4e03e9d60a8b8bcff3ba3c9d040e64a7fe971a9de48c6fdd19e9e05e37fb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23fc67f68eca9343a636680e381b1a9744e41c25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9097cca802f7846ff7735ae087d5bdd72879b3d7063dd19d5cae0290a97d0fa0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..900bea75c5acce8102351784814fbc4b7e05fce0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0040b0a30c9a11f063f34b34e0200523ccab23fd70d7b924631eedb9de71af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed47b147552bef07130be0e96b1a74006e9c3e47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d13d89633d6f04c183d2130406b54ce93854d64c2e1b2f2b4a8991c2c5e94df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e75d56d5cfbca882f7a5c57410bc85f1f2f8eab4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be3a79b9879e4e94648bd7c0b923349e092c1728607e1b7b422b3f43057ae3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..663f13e640370e15cff871a8776f4fc010b51266 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06792affba24e91e2800e7a7e81179483269fd762833eeb31bbaf1580a2a02a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c49501116ac62b48d06ba9c799775bba7f4a94b4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:007cdba0071d9db64cbf3599b067150abe6f58cb15c2c99f9c0816e322facd61 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..516bd489ce0deed245313ac6f6a811994ab73c00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43cb63a4046bb036d669949d8dec7a13ffeeadab54b0a9486935988ff6fb5492 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0e07236459bd20a37221c72ae37e379861493e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:259624749a32000718ccb4d50452592e77fffad73b5042d66031fe915c4ecae1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59df70825d82ebfcc0a0b4fe3bfa6e69c9f08fee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f678ac9cccbd8b6a866253f9aebeb2ab0a254737bf317a5802f4572908583bd9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97f93f25edd15a611443bea5f5b99a9accbfb103 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:318a688b3208eede67fab45734648852d301f0fb8504df2cfba9fb7bac5e2f01 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a375009ce33e47d40ff8e2f35338ff051039253 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:758ec5d5125b0a6d05371a77832eb44de4351d17a0fb2828f3eadb6410d229c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16ba465a65c980baa495b6bd84fee1ec4e009d19 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b9762d82178a35bb07af4a4a3a2d49a9ef3adbd7231562b13540249641b5c84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e464c51ad0968ed5c9587331339281241dcd9272 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:682ebcbfbd087a316c740dba2da4dc74e654720fa7e5ead9bc2a09fec611815d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9345472492649c3408d45463a1aed4eac5418773 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9332f5a668d9ac6f7484f6eaa0a1b307a80f2088bf4b77316522c5fdafb8380 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a28b987c623f2d5b45befc95e4376b5721187373 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e75f5b1a9f6b64e361b67a1ec147d23610eae7e03604553b0196e633078c5b2d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83642e29d0cc134aaf36ac3382836fa570f4afca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a7ec8df625c5c6ac4ef0869ce4bea03d3478f2bca4aaf54e099a42a526ad1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f094986fdd513c78ad3255e91fb9396201db0966 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8376db2abe7af97f69f79e00e2956d77161c24a40557179a72d09cbacbb249cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69dcb3050044e128dbd31e13ff85722876221dcc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3a19328bfa676fd9dde4196e9838e78c2a3db534613f649ea80076aa986cf23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2e7366a1482fe357f1ce01cccdf51c3daa0a437 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe203a69699fcb96b80609118f8bfb1c4d9cde9e3ce2deefe3ad3f26f0279bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8af37928b519e61f59e2a968508d0efe8f8f8292 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2029a4df4970f2b2d269ce6c34a31760e410609390bc63f84910a06f52ecdbec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f323035459840e72eff0906256e7949a12520753 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e836b89db0b721f6d2ef8d738c7be9bf278f7f23eeba802feaf8fdc7947681d3 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd858359652d99e312ea62e789d538dafaf11a4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd2d7d0dc9d891fd3e3c096abe7959b107befa5399581b9be70a1dc44bc82d58 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..424275443c2e7bea03f00d3cad5719f6ccdb0ea3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44a24c841bd522912d03b255c423628656bee469b321e0f78c286ccc276a9d9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6832096da2341f4531c19d65c90f9f19af3cbc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:528cfdc128e01d9113c4bf62d6df269acce8ae98e119545d62d99806fd050a82 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6baf69d299e69ab0d7e6771dd748e87ab82c5371 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71d5d842a7fe32af427fdd13d21c4c19288c520de498d6c2d38b00f91e9aebf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd261813e62fe267cfa51d28158e1e112f600e7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86bf39e4d3589f22032d62426995765c832ab02462c54826a29e0fd63c42cca0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..419da0e613cc3f852cb9b1a492a61d2e21849700 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d0c560326eacf352ab1fe65f761497cd37346ae5bb85ada2ff670bf90578951 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4e5cef5dbf924fb9c29eb36eca4263b8c0faad8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192ea7eeb05759133499ef447f91b75113762cce1f1dee757f6b045dd56e85d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c1deb383868b9bafd98a7def8aca366ac5d8681 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd5921bc2a0ec347331394919b2bc0c6be93cd81dde78608e4a4b3fc22fe6b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90548a806fb3348239d817e5b68dfd0de94bfbbf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e205f8fd2850bd8b94c93e30e841581527b65a65c2c2aa25385b1e0fbe3228b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..22894cbca8ecaa258418d465f247a41d87edc053 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f44b2d6bd07d91a2ec1a0edbc91c6984c4babc5f1cef652b501dd5856f4ad5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1821033627eac25453fc320855eccea89851b8d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef51b1ad64bb1ca31cf0b417d0d7b0b499eb916f8401928e6f8003cd34bd2e03 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50523b70798ed27e971d596f8b380162b630796a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49c09fdc82967e1f7536b89c9c279b5a8c3e36d62da03dfe5ead779108e9a9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a4e222085fc4d06bb98c6302efcbfed9cf7f3d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f8c34f4bdbd793876ceefa7a5b9e31a623eceb4317b70a3417c426d34a361b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6aa3e1638244b4966e7f498b8bd98cdbfaacefc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d26520c3f89d77c50f7999f4834b0052a30eef62cd2bd5b153229d37a2f50de +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04fc71854535de9a391cdb1a6a2b000d06c4ca4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:700ab1cb54c92acb8cb4651686ea44e6bf9976751bdc5d49f7b45a4b2cdb8975 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f62ae7241b560f64a7db9da0afef14e25102889b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc8e4314f2cae2adc4c457b893fb9f7b38e364efd4f012f5e9f62b441b471c5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c404f5bd9abe7b9590b802eb2c7b255d87d1a776 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9a8f2fe6e46b5082de148b84397b5cda597b5cb06239964799cb4fd9f3ec2b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..397e5d33f7c4698f40932b376092a432a7ee90ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800245b68d76fe4622fac8b41f2ad1f23b71171cc7291e92166eaf558d630900 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74adf9c7a7c80f7ea4fcde5d460a2a14038b47a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceb402693448bb90c6caeb26d0d608f370fb9609c71bf6b1972e4f8f4b01b7fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9964b6445502b61d5ea8206146e96dd1e0401183 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c119e241422e8f41bd54200f1f7b177c2629091a959b7f9d446b0af0f758be94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6e61023d9c9da0cadb61f2c2f7203344c02006 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa13ed01174f1d9a6482fea29b3add541c3a43148169a2b5fb23114a701fd3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..361b0136c205118a9fb982036be9220d8f826fac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482b20620ae4bba0bbf71b1b2e98c26b97369f4f80a949f336c9f5ee0f0874dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c324cc2f4fca32c72660246ef280b9db13df400 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e67fca0860907118776b21054194ec1728094a16ff48c631001b7b4d8ff24ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7fc4ac7782ef4639c072f5018562260ce0a5bb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a64e2dc833b77b72ef5a5f58c51bb52113d69c9a2cfd2a58f6d1c1489ba8506 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0763eda06d4e9d639d2b8875586a2d61f4bca75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd92d15dffdd3240a6fbeec5194d31eccf66fbdcfebd65cb3d3cfce8ac885ef4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e060cdd4522161d02b33a2316a0be518b4ea02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844800777a1ec3a3a4eec76f0c7d4f4d88db3b3d975da0133b98277adb9eb40d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29766a779b48b896360c8677da84a4a9a90fd8b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a11c05c3840d4009741c01dbee7f2c341c1191d77745716c2f0572b0d4e9d4ce +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0664669c983009e9844baaec2c86f8558d61e1c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f148c90c6ff8d9d48f373963fb5487d5b0fe65c1729b0e31e507e96134eb785 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae49c091ad0ffd1fa9267ad890bc30939b5fd4b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b78812dfb3d121075b6addb22660137ce3a2c48cecc418229c9533f4a448f52 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48d419e75e559f932df229c088873448e1382648 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3919a32f04535798a0c27c1c08da7cef95618acbda2b6a8ff16b0ed5b9432a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e73dfa68c19c28447d113d6b5cdfcc470e8a722f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da71cff1415023b5903ad4efe903b15aca3070f50e6dfee9ea1771ffa8b2980c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb01216b68840b56a4fef0e496e7add995bdda73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cfab9a815a374ef41328ec0f8a5b3bf4ad2b103bdb740b4dc5120cf5ec2ee3e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4206f567d0ecd96617cc863b4647b5fab4f783c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cddc3bb27363be6bca2f17c7dec991a031d4d48119c7e15c57c7c40484feaaa2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c975ff44ea2a06bddc10f3373ae34b8e8adb9552 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2878590cbe965545ffa627e3f9690cd990ba678508357609828612fc84ac83a9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3484cbd3a2baf48b472e72108b8fb1b1617ecd6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675b451c9de8db03e01b547c7f525bc8d6d91891f82413cc78c8da51d8fbbe30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e14bb588e42e58a981f3364c32e9a623cf9e08a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17042af125f5628480fa3313cd109be656f07c602ce017eee32836891d607c42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..787c0b799810fbcf94d488ef6e94caf8f1af2cda --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44d41ac563251f6ac293bf168414789697f583f0e08ad7e2cf7ff99a6258712 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a18b40050932a1034a6c92d2f315f262e0f7fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53fc4072dad6a843f1d169b150656a1ef015f50cc899fbb3af2d4b9a954307d5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e7431bb432f490c7520a436903b3995992148b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee68800b208c449c78a10c84da8e17c74aa480b23b92876863bd1cca67272dfc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95aaf7e69e83329cc37084fff1c60239290cee26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc129f3e6f5ac4700927c0aca9896e4e567196bfde9f3245912173412dd34464 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a0fe7b4a10d3cb75ce632cb892d06715fcc08d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ece5926a4d7590887dd0f1dcd04de6e0681123f2ff482c9904e9bf6b49c0e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7704600d481bc9a0b3e3e655fa48f39b26029795 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a9e27c5ebaad1496c48dd45639fa81620e66ad8dfe32ff8c8cb9f8514a169f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37797155c00ebadac38ad2e30625c52484122247 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b9e7f8ea55318583b518953848b26412025ce29b098970055e5349169312d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32fa5c5b00e029ef4d3218b42d8a18567a559af8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cdc8cb96d774e987a7332d746ad0f5ba94d673eab974ff07ada563cb13fcb0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cecc337ae1a9dbef9f8334289fa8273c824975c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90119aea199340415c54fd83e3028fe4e54609e229ddbd9c5f75bfb4b4e92fcd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7529fbbb35473316be4e4e833b298e46f2e03c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423ac68ed594e2acbab1cefef8f79d02f8ebce726cdf34ce5234596509f76712 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f622b27a4406d00d711fe6f3c67cfd6f658c7f1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0f4298c59d3f53c2427b2f2e54d62c7fadb1d639eee2a0a165f072cdce1364 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2e58cc602c3bb59bc69d08edd1aca95e610f5c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41d838f035838746e5b51d29560ab226294f2a28b200395b5bd9d13376611306 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea5fd5efcd8183bdbee1d7fc34e11824acc85a32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aeba286d8dc5a58a334e2ad1400d45c1cc1c1558601414b40186a7ea6c2dca4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c124c1a9b10022e48d34ae67536a5f20d566ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0585e0bdc0bdf578e1c48bb821a2b3af635e7dfb16f69aa2bdaf11c98c70307f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b82e3102e2f6a6d1adf02d3b8a056bbf7e622d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4434b295415d12fdadbfc10a2b882600b5ae443d12db12993f7ed89f2082504 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a29b6aeff978e5888d04f6c38c916888a3c96e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c09174040edbbc0009c21be5de278fc543a513b07018b99944587b65b029c93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba58fdc732da30b3b1893b34ba5f538cbfa8d84b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eca9313d4e5ee8a978ca8f60f32bfa811ebafd42cdb284e7d6e0a7618644d97e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0724dee1c63782a5579c836abe9cff0b376e3061 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d472dcbf783e82a2ad2fd419acc91750f5801d7fc95671b45bee86c7bdafaf33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a414acff5512788f377e2b24b5b2136e173b79c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:791084451428f485be2e3b210504b477c92b5f81fcaeefb796ad719513a56f4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..602eafae235ed94efe3116d4a2f0443fb8828500 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:863da37dd359adeb50e60d735de018ea7d473dcb088214852b9ea6c9e8ff574a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5af92acc1e0b28da9742d847b7ab450e02f3f6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131311175ff04c5a3efb3e069273880177f7195cb74688512fec503900798524 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd6bac945c8b54a277126534f55a9a442b389118 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7720ce01e08dcbcc03991960818b973e98d0b9aa57fa021498cb7bef04b709e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9b34aa398818122c6e48adefaffc50371580bac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5029071ae42d8e72b3baca56d52b4b6b27ca955b355e3d9ae28c1f9798c38a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c2e818308165734c8c1a3f5dfdaa18b043eb348 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db179aac5d5235998e3b15edbb30d53a3f0480dda83ff2fd4082a57e956e5197 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecfe60627150bcba911aa73e6943ff56f4b67dce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4911ba1c0e659be47c48c87acd20d8f03c17c471cfd6bc63313e66f2e870b940 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5d26f0f3abf421a13cf7b0a8132f3894f0210b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c184ee01e8890c99d24711a900a5e6994a3700b7883e3ea5c5b14279902c2c9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb2a64b7e4c643025b32184bd22d25c4d7829fa4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb71e995b15087f09b7b8b9479efc4832e34617ac848d1e641a0e9303046c3f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5a043c011b05f6a1640c345ae4a9945dc517bef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb23325b0b333ab4cae3095be5ece590c5cf513732db503eaf3deb172fc8a78e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..518012089192b0c05d9eaba92dc91ba340b2c2b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f062f1c094086cb064ffecfe2d50920e644ba43fd68ffa1e76288bf1a2248d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ce90e497d07b44b8b443b8fdfca7882610ecf36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420f4482794e673feeb03d1dafcbb44052b546d98764d110965e87806403ec7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02ff37c6133c8a46c21fa9782e13baba64fa18e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87090f17c3ac834b7c3dda79aafe781a71603257d41680e5a9c2860f93a22470 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..970298782f080747c8166f7b7c0d0567c13e5575 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b46e7594b0a17a9caebf41bad1a9665b93675bea4df127936c9aa4a2e56f5dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad872fec08bf13f4095845e80756e02a5e631277 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a748cb2fbc978266708b40cccf190779b702b6bb26bfb0ad9948d34bf59d4b33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c03a2817eca796cfc32965183b34206c6818c5d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e27f1cc1e3a3f745d0444bac41b164505a2bc1b67a2178109d30b2f11ce5429 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3024666e635ac6b70b91eb91246495851dce90d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce6c075e388ab79394f91dcbd8fb8845b23be34d92a6e03a90c1167f2315d9e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..318f9dbda2bda70feac25f18299f3d56342782e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45f9ab1ddf943ae4d0636ed6faf338dbb70f51064e80fddaee315d6ae29ac1f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a0551d51d9ec9793f42fec67204f23b948599a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef866e4660df1b1e1cc0261013b9b0bffcb333952ff6a282d6357d61561a7664 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87aa38fab30d3bdf26ce1eec697b33d5ddaf6d83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0c9536117f99370aec1cf42699d31d13614654a496ee45a28767a8b141b966f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf5a175c4d0b1ec98ec327e09675b6f3605996f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4213e51f186f1824cf28b806bb5023c8a1b91d0688cd14e3a2987ab93e3d0e9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bed4a8f33b10306188a48a9a89be60fe388a8b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611a2b6de61f5bbd02e74049101916c52568619e5f404f5a4bbb0abe63319450 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f23063012a5edebf671b436f6cb91740b687162c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d38bf0b9cbe78d1fc965d9f7846d1d1b2735481c4e1e51ef6cff99969eb090 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77aa168bd6ca480b29b951ab59ded2c9fea5e6aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5805ab9d30b7de3d3094143b1d2b71c261b0578403f9cab40fcfc09048f7ef00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc57dfa38e32385f87f2b56b58dd5582e6c726a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5752dc96b2b4858e6f47158bfd8d3cf53aa8e1c88f92db67064389feb8bc90cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8bc51d96eed52fa48744c372fc6031ba09b095 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f04b1d8b1c85a8be337819c551369f49cc476b8dfc5101605a5852736aa2d33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e533f549529614913aa49f3c047f45f255117f1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4beb0a6ef9c597025a17e27c59eb5243a7a68fc7400e4ccc9d93a6ab48da9ef9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6517e30adb2dbd86109f5f9efaa5f8d4f2d6b5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47195e2633408fba43baf86fe95581814809dba8e9389b685e3491a4d5df8763 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f6cc07c46be5d67a9020499f5131fd475405030 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f48f01a8ee538bbbf4d2ae2eaddd94a8f1ee3bfd8f6718916ca8b700b4785e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b093b71d48e825e24205a58066478caf0cb65e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1c625eac37dacd0f3bcfe45cba1458d37ef004865c760a56be85921c17eb190 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02b811338857eaaceb19c60669ccd2d0045ec494 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e6ab3219929ee58694c237131f332bfb013cdf2fe60140f556010c217a2ef9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fc8ebccea950874b621236f02a57428b20232a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9d55a414562201703fb68cda4cfab6ffa9f6be2b1c10513c00835804c74c66 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6081df82c8e1374874da11a0995e00e66214595 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5ea8d9f18545ea0904dd13aa3429e99054b791f228da6634c8a3f38ac14e0c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f22db6d7c0a09ca7f7e7d91794a5227f76464bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c65c8cea1cbfc53e929ef2dc9c915e9b56bcaef1756fa679c57fdd024672069e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..410e61269785c18c256157f9656552466f25a74f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d3a679e648aefcec66a55756542c2e6b080b3c52d95dee6424418785ca3a55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7615dc203f8ac279bbbf8fc2bd6620fbd97e93a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd509fa0ac49e7b4f7362803ec8dffeaa4ba11d715244b1979f05bfb2ac91d99 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c99af794d4ef0acdd512c34edbc8f2ee7b32e58f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f6fdabbdaf82932774410738cf0b9b2923b6ab1b5e901886608f583702b9a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a2e37f20a37466dde207fa836ed6b96f49996e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1455f790cc2730acdc16330a23340b834f4a21fde4c9d47776d8df2e2676834 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53604bb89202843ebb4aabaf2524fa504a3b10ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e3cf1db982be33a223b7739746d0bf56248b13650f199e8fdfc4c3045d7a5a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7753efaceecc6b7dea78904372fdeb38c890eac8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72751b3ef8493d49f882aa2696db6ef21aa3d5868d0e1fced2d278559ed2706a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e774cea96cd30622494f925e365d931a6b192b1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6163889118500eb268915b38effe3e85f73a323093c2904200cf050e43886d78 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf5874187722c4f4ae6247ff38a9c71d846936a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16ac70a0a2c57ae5f0a65b34c5d5928036391aea635996ac1637ed9fe0776b25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..324b3c16dc3fb47d2db48c8eec516f29f6a0654c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e89e226058ce8bcd2a14d838da12b600e26686a66c8a0e54773acd85330e7f54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87a1b272628604cf855ee85a67f8e61f466993a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20cb474bccd8cb814e8d5dc1b3439da55344213f4c5ba2051db3fc6fba8c1cb3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07daade6b9379b1397c01acbbb7bcf07201e1ed7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c854b28e2e77fd14b85927379833dc8745206890c62879d2a9ddc9fee7b75731 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a534a9e84a88f5a41f7c2d736e3dd95486d8e67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8a039fed60c92b05862f93bf1851c2fb43bd934f8ed270dc312742dfac153ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..899d14848785a22ef9f1b0287627dccd797f1b75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2410a399c1b38897d8e1c459ff4a76d29487ab2eb7dae68603865e504809e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbd31a9baab1da457b879497770c7e4a531d22a6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16e2aaaa3559d60574f65adab0766f767bbec88fcb38f18e3daafff9913ea722 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..246d37c5a7f11b1b0e802f9f94cfa7577555ae67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9bda2a12ca191c5772de9d914c23dabdbceb4d7e5a042116a980fceb299ff7c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55b9337decb737a268d4e4a9a9dcc4312a8e9ee0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6badef56cbcd8457599e02b0ebaac0a777535f94e19660a2b3a7a59c7cf0adae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b710f0f0cc668052055cc0379b90a6b214331f34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb350599f3216a2a977a4899228eab2fab56af1c5675ef522377ceadacdb6140 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c805435fb3350d7c0e846f41a92528a6a48bbc0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ad6f9d4202630edb25877e67e39d51cccf2a5290513ec0a99b63fd1c68b9ad5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7709bb357b3ce61d80547b51c02611c2bb73cd5d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b4b6ef8492575ad363724a8d8d0d738517da3a83ccb65a1fd3e1ae4a513fce5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f9aac188bb73a5f48640d9745bfd82a2804b2fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e9bed534c4ce8c58aacee45c49122a38f23926573b106ee9a85d34a0ac8482b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2977f7327420194f2fced054761d7bbd3440626c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81d2be2833a452ed6aa865a683450c1c42ff406282def6a121f08d69c39bec91 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5eec79f8afd182d45d964d9b08fca8bfcd7d214 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0d09f49af87590e27646ec7cb08e578c4ca8dd79c7cceeb6c2613e9f80daeb6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f5e5a26028c58206d04b7380f5e7118674a9f0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b7cb420a12d5f457ef8f165a13bdc5a9ec7c46f85cb7ee889e6d1c56b7a665 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..472730e6f1a15779d753805bbc622cccd6427d7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:591e9d01bb2f4375f27e22ab206e068194a5aefdcf523cff59500b412b49c57d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01f1e8bb9112c009cc3f79d9b0d832dd058faf70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3128bf3a73c7f5e1fc98634048e70fab9dc67b2457ac8c9be1dd40f0e6749153 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73b4e3145cdc928e175db033c55b7f162c553d14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3117a8f13ea880985d3595d689de7d9849b4d1a86b3aaefb3403feb82833cbf4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d2349f74011a5423c574978c9b7379caef9f70e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b453b696110a563d16c53e71d73e2a289c49c70172d6eace41b959ba8bb9fe63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69ec77034fb9d4883aff889885435f960e9b7bf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec159b6402d33f9244b959df6ff5ba5459cd01d4f0a12e4a481157e9ede543f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bbfaee5017d2400507ff39244b92ab707b9ef9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9697653f037fc94f6456a40835f0caefee839e7727bf1c94b5b42bc5e0ddc593 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..652736a09cf0e35895a76b6cfa3c7c9e6938fcd8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0381e7b6478ba461e204feefa0ebb216b4f118640fa639d94cf0144ec359362 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45d16a58e1cbb40d5c8ef220bece9ef5a933ac6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d3513ec9d9e0e894c03675d2066ceddcbf8e1a65a21588ac2e531a27b9af502 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ebe96419da7bef9b51c203378e28a358464677 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4df3a042bb8fc56f0882d2eedebaa00462149828b575a577a7229cc8ac26f7a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38e5fb6fc5f2619932dcda337645cc9866db3e67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75274c1216f0a255f632abf2e935b4bb0dde6ae180cbf0dd0b4562f8d5c1bc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefa99fe4486b34aca7b132cbbc0a1d86c47b284 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7252dc122ac94545b7a44043579c8d4790dcd7129ac189c02dda322e78663c4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef44d375a6d842bd8b502742d4e9c69095b855d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea715ca5c56de5e671dbaa7575c91f7c6141a62c08585a8ba0c7fb9c7d0cf64 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4888880dc5a8a9d5e28d7b34bd78b54aa017ccf0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c7b32edc61180666f370596868197ffec2356a1b14a8ef68e8bb9bc1ec1571b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..254531057398742a6cb8207653dca0c6c713c1c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba4f4fa5551d42c44efa8b5380e761a71a61708dc676056369bcb1c6f26f93b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4138244f1939f38dab3397aa07177e0ecb96b9a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045f23d45c732eb106709827050a9c181b258a8334fe067b4e1eb8178774d5fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52cf901bb71970f03881a5bf22221085563cb809 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c15a7b49e21fe0ad82a2a20ad3d6ff2361afe9d1d4c63b517ae124d279d242f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83acb7d6ff9dc152ff6398ea7790a96a3af5e41c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a212e7cd8dd5a798e5e4665c8bf24d6411a4bf0d3e76b2c40a8791e67fb567 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9a22fc54bbbcb0669cc6aef7bfe9e04fd8a64ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:018fd52822a1153eaebec033ea396e0bd6b09f12547920c5afb743b26378bdee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5565c3516f1d2bd90fd3e65ae08f962c14ef09d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84dee6894f6b7677e86784f147ea39b2037457b6421971baebed8fa1f5c9b504 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ffe552f5bb2427bba894c1ec4348f5051f3e4e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6943973fc3ed483091ae3f4c6899357828bd73d21b29c04de5fea06ca6dd02 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53676df9d395c04b192df1422a5dc0b1e020539b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769fc2068832fb2331a184d6208eeeae6d6af01a7239846f2fdc32c11a90e5c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7acc1ccf67a65c09caf884cd42e7940c3133a8ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6450411cda6f503cf5d5da73f073c5facecaad23c3884468147067a692abbce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac34d9cf347ca4c6609124dc7226f7a6ab2c1be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c09c5ffdf98caabf0c078a17af42a43fe6b3ce11b5c8eb2f6e7b2a212acfc1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..933e580f0fc6996beb13a5925b64521be7e85cf2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be81578ab76366e0bc3daf2b898596e037a1414c8af1cebeb34da7b33a5dc2c5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2eeaf42260c421d99f8feaa6a8d725939c5a9a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134c45f37b6220ebd1b7ed433d7d0aa8788cf68e68b0c3fbcd1813c749477922 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7de6c8cc96fdf33c2cbc7b802d5d6c0f230999e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:668ebfc9afc94671f7a80a11ab9ff29c89b328443bb627163069462ef16a26b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f81d79b55ca117ae44adfe49e2de84083b990af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0e49e120cc956b18673a7f7e914074e2163c2ff0a8afcdc173d3ff0157602c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cb9320bd1ea7fc3f39b652bc9dfe420db55df35 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c240286b8d909a7fea091ac37c755ab943591ae48c40fe75b68e4181063ded02 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07797355881bbe69fb33492203bfa24699cf5ca7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c603ffe3065b1725a6c2c86ba2543f32777080138a715124ed045e2aa2612be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8e6414d68f06a42621fd14fed178d326fda21ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7f3e35bfdb8bd42498309bbb0afebcc472708ef342e63902f3921b606c244e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b21d227037dec93385bea776620c88fd1700bf95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de4734b4f19cb11fab5e00708688d8d0eb5dd2701e3588d1435b92e462fcd9b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cf99cc759f1e1b4a00621f45400a55eb97d9df2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dc53a857875fa682e29657b8aa1ccf6b2e17834513b32b0285451c8c68ad77c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11f661e3048966030cfec2e5fb394efd74467850 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf3bbcff91e39f39f8e0c602a6350da5323347e1939c3589c4d1cde5715831d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3218bf91aa0b554bb8066e79eeb3cc268f2833da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77aa14ecc84c5283f315f1d4a87c1a76a2b9e8d046a9dc1a22558644e39ae651 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73717ee7ff167e4dfd02221ddd3c27970cf3a35a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2911cffcace5d75692663b7d1daff43dff89173f821a707b04af5de6f1b0283c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1678b61932f79d8e3eefc0f15a9c8ed221e0b2ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3436c01637fc5a07bd38932d37d6068c5f6e91715c8ca3fad05d8f3dd45819e3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..733079c3b0fa5e4d7722bc5fada1a0260cb1763c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820b09831845026fe4eefb32b02f3d5611b3bc5543921e5e39559f2837fc3d16 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab1c870595ba3a41c16fb621f3d887a5431219d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ef6675ee77a30411a201132f1c5259c3b08181b42256d7211b72b5de21f4d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45c07791fbd696809e7b8b74b2e0911a0198b45d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6adaa3ac83b90ef2b40e8edfc8f4efeed5aca5d1f9fdcc72d3837678e383d23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff33dd4c738bbda3dcce838aafdf23d52385944c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1245f854253d330b336c80a1417838ce77d8281620734ddc6e041dd99a933b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e82c57e78bbd4141243710b6656e3cdf6ca865d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b97d79b4bc1b37d70857e2969f06012c54d68ca385e86439b609a35e766fbce7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..61fb65af069e0192d6e1d342985786f722bfaea8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33df918661e70641b8d2ba1fd0a152271465d537a420bd8e13fb62abafdc27da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..807dc83f27a86fd1022366bcf8c0ebe1afd995d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ceadea2ac78dd19a4d525f67d56ecf757666c800e08659e4099be1de3797382 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09cde42866be527cdb71586f73d6d64796b7630b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fc57ceb58e2a379f69a99463bf321f79e891d9c64ebd6b715de44ad0f16de37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8ddbbf4a49c626640dd5e0f8c7a717fb83d5e00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c06ee629e1c5d83cffdd34ed1dc79ecd121affe2e5f4f932cadf593e11d53cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0caf53605bcb2e374e80098f10bc86a1f32ba721 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e06fa9e7da17f5bbc7aa9f5805abcb15375e3dcd3cba88127ca9002228e578da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90eb3175666f2e3b2db0d5cb9008b1581a3e162f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff49b113959f86c1472d7e990eafdc8dd345ff594b2250e50aaae9144f5e484 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6455085f0f2e809e58bd333d5378bd0baf74085 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200d93900a4c493f88213085baaf14b84e865c060c08ddd72b6159245091f43e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbe4548cbe8eef2a91e2721dc634ad2a53e6953 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f5284e76d5341debd80ca828274d71a706fa5c1799514839ef80534e9e271b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b325fcb6542a6b26c49fc180e616eafe01aa9f29 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c302c6f818144686ca65db997cd47c3b98d822267b04ccb2dc2c0d2ec06358 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a99798d570028dfc86fa273875bc96f91119adaa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8503aa7e5dcab7973527e4ef8d6c2794fbf19baa135b5d01e096a6b5474a1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11666824f7584268baf668339ed6860a240d9adb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9008cf8f9021d06824665abdd433bcbc7378c5ece3b124befde078321aba555c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e655e46222710f430757ad1b2d3eb93145aad46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3cfae6de75433544b5259c6cf1009753726f6722e95cd0fa45a65abd1787a13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee29b5c2e0b30992d95b156c652b0c8cf5ee9e3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256151ca26b91354d14500c5a35aeb4e95d6ee04068a2edffd5feb41df8d96b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e48808d7c952b22f78637a76d3a4af32838f86a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1192e94ad32a45bf93cc72fb8db5b30368db93c66d6f4cd97be8bc2de6ff6f4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1af5feb24188adef664c02ad17c4bca15fe0393c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:441ba75d27f3d11407dfddd49774bacfe146261fe988a10fba9a967a58102df4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a4db6775839d488f9f5520e0f179e391c73a79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:330b4f4cda7ba1f46a183210d05ce9665f2f3f107b2a116539ae2af8d663c1de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78fb75cd48835d930074acc91dd121363bb1aab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d1530c2fb61eeb5d6ae47404d4efb753826308f28bcc0a9fb3725c1d7b66665 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea330c8fbb67b7fee74d5d8f18c2b11936b2f71c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5747f35d32f60879243d9fa0ab6bf6f321fef3dcbdf4a4d7235f0e58cfb13077 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..149e49d34b879336fc51aab5cd1f464c9fd68aa8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5eb1a1cd75059844694ed83b1aec97959c0b2b8a4dafa8f842d052e28fb8631 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37f71ad061587b70f1a69e62ab5814871b5059b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e87900d404eb258f234573446b6022c63f32461d6f7e6d135fbbdfd2bda7ddf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a03502d72fe6fd6fb9f43e54c22ff389d4e48bf3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1ac6e96e18811a464a1e6421de4bb5b9339c6f7553104750b6e804d0acd6ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e6e1bc264c8a9afff5f5f8561cabcedc9f4187 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b03213954a594440df7824ec536a074d96d0a7ce85bd64448e73194ba0619c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b843e14b74e8d5a11ffc6756f78ad6bfcd9fa01 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdacf497b6ab2d3aba158e55acbcf0764067003ca6028f5ddff13c383f4dc4e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81b6faa95b7b484fb62ce98e1c4a324c0fdd0407 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fede878e4a08edc7caf5dcd1a069fb3b872e2844d771867bbebbcb8a56e987cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13187ab632f62f8f3d3b58748247731ef79bc733 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da0f950a507bd7f3b39dced021210fba83f4ab67ba8a1e1246556a47b69a608b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b12cb4858d020f6cdb76eace51f8f9f162fa7812 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be78bcb8e0062288f9916412b491690107f184dd79b532533deace0fbb797885 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3b490e555bd1524e4c71e0d0847c759981ddbd7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:412ac30c09696f66f3f9d694a9fb563346523fd4a23272c252c9d67b1f22870a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ca67b10c5ee8eed91de9f317fa89db54d564d8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a2025baf3365817b267e9b7815cc3ed4b86b907a55dd69d6c34b7f4beaf9e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d73e93af4bbe3333035a69c20e04c8632dea0249 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c079edc544c48bc9384c20d052a101e7528c51e827672a2d3377c0aee9cde8ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdecb919cc2125b79f9be44c49e5e435efcd8637 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01a20a924296b792f952822fe9cb7a9069e01802812ee4bc541328e7d164d13d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec1820280b12d6d084c68507c39b25196d682c45 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080e8c0179fbf9beae144470995e163c28a73d61a7db031e0587d4eeb84a4ea2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2d6321096dde515faaffffd22d3dc757eb7ce93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bd7884b3f07348d30d42cbb999e5a6f8121b4df97fc688faa2fa1f58ba2b4b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a8a1c5bd32847e9b71b0fa3095871ccb7a3328b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8945c9bc3048b8a6aafffc282fb2a1d9ea5fca5545f60daf08c6b7df88279ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3239e4b5ad89699fdf9c7b3ea8bac60f49225b12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126d9c6a940b23f1637f6759898097d20c84eac4b13d983244b3356110538c1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..004900802f3b497a178c17f91dd0e54f7585d068 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d805dad6bed0cf81b668eb82dac5b3fa5701b3fb5b626f426de64f7e1539ca47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f363a6ee4349da43c17f9ba14fc0112bd96e145e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f7046e7b40ca7916d63826e972f9a23583fc5542bfdfab2b724a7e47e6ac90d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b655b2b5a3d144c715d4963ea476167966a57cfe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c0b0c379c7978a124278f2ce1538b138d8faa20c0694900127bd316ec374150 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d72ed70e1394c7875fd594579be433bef803ef0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6532057d09546ddca32bf8d98e8c8cae7e38868be182502c16b2b0def85b3f37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d467a1fc12dd36b0476108fde1cf9c2e38c384fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b1f4237fb637d6a468571e91bd3e57dafb4265b02015a9ca14728d990b173d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39340326cc702c41876902b439e08ca8271edb28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a6b40c7bea4cfef7efbbae4e698200a7793aa4d81e68672723d22baf53961f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cb9f2fe30e87732692babff590333f40c5c48e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b78c70d519176f4f4da4a4b8553605dafbb11a6c487fcf8771f8633a4344a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1881cdce6706a94e46782ddfa9b534d0e82ce098 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb5596d9aa18b81cf18e1b4d8b6b20b6eb20ac078cff32b192380726ffc70e43 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ce5739c0ddc1647e76a89e71bd27eeb9ef6f2b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55bdb8f5900295722e5e24c273774a275ce084e271d2e123002e41606f9b53e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c3539145881ed0ee7c3aa4df981a610d52d21c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06b05bd14a43226bb5326654c0595cc74a223589512bb4848c68563cf685d220 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5447f5ac1c411146efe6ebf65ec4754407c9220b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33dd03a9ba7edada724fb78a42259057036e1e9966222706c8f6242d626556b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13dfe7650b0749f783928d7cfffbdbb85eb2a907 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:570a1f2f7e042ccdddcb4a46067e384578c42038830a94eabb7d6f8f83037b3f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de3f3e79b32483065ca929a4a11d2f4e0be54516 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb86bf04a3307a546e6e18ebf4aa2928a1e2db7e39573e18977c4d5e95e9b94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e251590fd5740058ab102a3a3e7869283925976 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee0444d3b7d29e7f25173931b23c46664eebf167b1e0b330de470a9245812fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14e6efc47b3962227e418a3a00d81410b7d2f717 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c93657d857d6f6589a229e509b79f57071897ec11467c22787a92d1efed58d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b06e7ec16becff04a4ff6a85db0c07e17211145 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e97f0c94a3efb81f8a879f0d88cc3cbe6a61e6ba5ba212794dff36688abd45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59fe38fc8543a3fd59d32ee50a0eb53d6e9b578d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f719cc8b6d253e38d0412168c53eb40ff4d6fb78a07aa975ad95546b48218f23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7669165feafdfc29fa3f372f52519e91cb69a3e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a44921ac52f3829bde3c4567210e8512a324e182640b40708a1bc3377952c031 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af0d394d056224d6391ababc4aae43406d64c186 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fdb46bd9229910461b68c9225d7fd6eaa0490f91e9aebbb37611ed003aaf22c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..302f79475b7fd0ca22d1d66b354ae4fa3727c208 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cac406b7a80ac0930d0688be3e8f915790c6e400e7f62f2dd200d59ea551f4b8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2ef6cb5545b159e6d19ab1cb0375fb01dba25ed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12697e843e076b7e9153bc1f8b00a1f753f93bc81e9c46aacfa4b0247868d892 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8f0fc737ad1b04273ccb783f5755639566d2076 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e23c4b0abc192b53dee503591becbfc51738ccbf4a8ab51c13b667f87df64d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba66b993311bd082c7e7682c9381298fcb67541a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d47faee765722931009c1977e628bc2586f8396c9f6fc07bafb9f4f3bf93cab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d47e555efe87abc0377e6fee123918644156a275 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5741356092513ce0dc12213a8b04e9aff77edf8ef5a86be981736f5a846a68ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c261dd4364c4fa4cb4f23c259107e6ab8ce8577f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8470e25b03fc36a237bd58ace9b0d11a5b0fb3699af03e18a6f32575448c9897 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a38c2cd67bc8cc8fb23ec7197fbf17d764759470 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00cdc6ce07e7925b4c4c8099712b128abfa7359264614a89fb353a2fbbd6a32a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a9f81a877804bd2edaf31afe984fe0276ef968c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573b86847840c3c1d3a4c6756b9f4359e42b425896418a105e87bf2c3c90aa66 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc677ea8c7746137cbef8cee26454b306f0d8f96 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d935e884d96eaa4092bfc98d24c84dabdfbf34f608e941c97cae47910d977051 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..206469e74116bc03f576556b63f43b229104e557 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ade24be60e3538db12618ef43ad78573966df13ca710929a23c1d4482c760a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4012fc59a027d915e7fdac0d36d077d47924be41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:597edd2bd62959702d6092c4f36973973f3a203615558daa7e3a324a3bdf6e4a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..440ec9836c7b4a580ba899d996fbd12e3e701e62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8343b6f242902a008cc2d7aa0723b10632f2c642427da105acfaa316c16ef8a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd8847071d5d849182b5ea484e313da7e26772f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8a02d871c61985f9c3df97ba05d8af828d00e3307ce41aec928b1fdf9b0f718 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..605127e459143208c25873aab8b7dae62f467698 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fbeff34ea089f22ad0e515275856c5fdaaa1fa33531e4098433ac1956cd5dec +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3efc34a5e269a65ef958b518f7a7d571380ef99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b56e56f7b63d820d9138eeb856426b8fc2699b3e33fc19d4eacca93c0b26522c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d182ced0d95efaefc027af8b28a1e0b01807120 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ccefb4e3325e81522ff689e4db8289c5a7eead84c129c81d1628811ab254c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..255e4c43865cac59e7fa190942ef62f24bde9e79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303391e1d1909bf63a05d0ef9caf98bf144e443716726d0c62938394f1ab4de3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9b4bd60d6ec381c85d2b5d15460f4352012645 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9ad82a2f449a26e67ba5893c809c23de50aa0e22ce1bf4034b2faa839046f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5d647be8d6ec6b40aa46dccdac32333bb0ea2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf37d7ca6c6bd109d4207e1555de80298d8c571f071f8bbd49fec5e8919bfd4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e62c21d1fbd5ab19c0938ab3ca8de659127152a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d630777cc7ebd59605e30ac7c1cccdf8a293537eda7e9fd3a9fa3bc447efe93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fb18b7ffb6df9fe3ced85c13437891bee3ad993 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754fc51068d55569955b94edef443ef329196e149e4ad6b7941394029d7d6fd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d6b6bbc97a6e4ee2cc438a40910f37c4a3688df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a246315d868320962a3f00295ed0a0cf06d68ae184f9b17808d7941c920c962 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1fe45d0651ef79da679a19d84e2b7a48ec35bc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee6173cff18ad93704db12789bab0242d78f784031a5ae83cc39ef6cee57614 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56494273460887c2a26ddf2f7f8a3aea7b52a725 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a6ac0c08605aba9eddd37b6c7db8ebfc5981924d9c06faa64f1b0d44b83400 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..42fd3750792c52e8adaa864801e979faa4936bf6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e03991dd1c8f660b38ac3fcdfd2b416b98524fa1ab5c266e6470f661dbed34f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d1f9aa91a7587a72028711f6d10dfc25f6d2a5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de972db3f724319b731095920ec7c029fda556f6e06926ca040cdf55b29fa410 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab48e2eb5cb66a041f4229b4461cc3c6024c4775 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50326295205e74fe084f7261ca50bf8b9540caa27ca2923caf9e6d0b6e02925 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c67a64e25a1175a265a9b788ff0e298d22ace583 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e411dd300bba7dbedf699b0589b9bc8897757ad6b67215f143e66d0fce0f099 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..591b83ff8dbeb2d622d21fab7237e1872d97dbf1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5080296bcc2d2dc110ceee7ad4bcd603b26f2337c17f7da6dc42344cd3bb1712 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0ecb7c8690823ebc587434f538dcae61e4c75c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405c9ac16b546dfc941c921c104132f3d3c3dc7807fac966900e3b6d2b5f8dfe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4b4c525732d4809868f5509175cfa624cd462f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:821ef62bc7ff61d47a1d11f71dc29abf7d66d27caf9f73068b4869cf735097d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14f829338475e0ed13e74507ecb415f5ce47202c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8f4798aec8fdf39f7cbdfff2229c0b84360eea22d1b76463537f8da2756254 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..15932744a07379b2e7182e85ea4039e4271e26b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a31232c3bd0c4e08deb7dbd8338e7c2364ac83d0226928269bf73690d6ddccdc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62393c500cca9d2e842fbf2db29a9f7fab30e0c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45036a69499f1cddfecc78590444a420f5bc8f030a3d23447342fad7771114b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..958c903116f2b89dd9664600bbc0bb5f961df196 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d88782ee326cca2e7823f2b2e2ca63e23d15aead1d9fffdad2a6afd24615d8fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cacf0c4251fa6fed884fe76d649f08a30e925614 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab19bbb11313bb35f04fc96efdbde1c3d6c7171ef2fbe4cab65b46972569fb2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0f4ed7fcb9fbdd5632461368c157cc9c7f9dff6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f0e5c32149a06eaf6f2727a9ace045400a875a8e83a2d31e945f5792a7b825c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f7ca23e9d92b61837c19176c6a415f7f072c679 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2509d3461ac756dbaa8704674a79ce5451c9db44d7577fd24d8c835c8d349a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2c0e0c08edf7a487f8600e4a909deca34905013 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c27b47ebd40c550fb800c74b599586f9b224350c0c3614c9a3f42c52920df45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..042acdc570a8cebf06ea19e5912d1d31140e35bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21d482940fa74ac4c131f534adda06d46a67227f3b49a5ac7469268442d50b71 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb876a0a18d1e0d70eb11154bc41e0061975aae6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc734ad1e95e7a60090d37adb85e2fac18dd1cbbbad260192d4e0501fda35e07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3af8986c2464d05bc23f404341f161ff2ba27782 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8239eb6e11055353e6fe0d234572f79ea63f298065fae999a55c5dd88387fa21 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c792b6b7a19ac5bdebfeac3995dfbfd430af7837 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24523af44f3ddfba010affb3a1b747786699869a95aac80ac057fec28cd4e2a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b4c99e1ecbd34525e81e459405e4132cced1a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be8bbbd620c66227af5f75b65caf49b69be60a7568a54a5b2caa3bbb30a5680 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98ca2da9cf1d83482aa68bdce30528fa9d115bec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214630f4b759979f02c4cd13737fa80bb78ad44b97cb896a5e0b93fb12ac49b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1ae6352b944abb62dfe4bf1a757f16084de224c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed639d11e315f116b0084917ad886af6e23fb056288e4d420ec65a61f76a86eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b76c5f9bc4be31bce6a44c6b123893af76631352 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4f5e5bb40aa61f0b3e5462d26f2bccc8f30cce3b74e5efe0ddbd697f27a3e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f78d95bb6712a5682d2d13d4fee1fbff285d4aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fb5158a9012db6bf2706c74b0dcafea9774db09897f61e7a9ee82139df18da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ff450c03f982290f481395a2c2a3cf90edc9b06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7115feef419a9365f2e4d23a0c9d82f9e706ce9076d959c14abce7849c1ed2d7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc157c474e59bd2777fe3acbd26d072dc722025d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d1480ccf6b0f0701b19de2dc8386a1bd405ea09ed7921ff0705a38592b7aff +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4abc5b82ab1566f671920d337ccde2053d187b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5501b41fa108a4caa01b645e805c11c9d1dfeec5ab0e0cf4e84609154f4e10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0943f9c1653f9d94685d5377284ce825190a56b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ea5a56097720f3990902b0a9bfb354c7fa2a3ed98b18503f97da71c350d21b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3dc46a43b9ee431b0d5b0dbab02e3446c05a693 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e286cd8bd2ec4800f642d0507418edbfa23bdd6e32bfec551912cf35d3ebce89 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53d011c1d6b455538820998a1753e252ddcd8157 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:885afc785aa8d9d3942a46c2f4ca4ce16fdc6c69be38bf093d952147ea9a574f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..062aa7a7c9d4d01957e71212d090880bc2934c7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd1bb9e3c8fd8efaba36749c916cb139e73a93669b95341d36332e0afca5881 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e37a8b7ad1fe7ced5137959524981fe4a45d631 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a62728a13cebd26e90275e8e053170cc12a2385a8e10ed7f466c3a28afc8806 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..034a75cc9bc6671057f14472d8d41f7701ceb9be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f52275a2b3e0384d2e720094c618fb5c9b3deb9dd92fd404344389a54303e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d7e7b00236e6e02cea4b5beab683cd8263d5b7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ddbc410c980ad9d3fe6c62c1e181671737159bf0df9f1ac99f28e991af2454e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..192f0305a0cf2180caf1c594711496941431b6d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adb81e770e95505b0e996d143caff576b4955cd03acb5f2a8116f61633b7a98b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cba8758fb7e92f4e88a106daf8050fbd9314046 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d73838a552d9e5f66a25ce6920b512d442247b58bd1373254e5d7ab149e9d11 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e759d86f48f7fff3b580a6571aa8e6056b5d04a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c0c1355fd429981ce3425c966301951c3e99ad808b63cb10f1b3bfa6fa5868 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18b3406cb85e52af825b680a486612d8499f8a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd78365d1e679e93e8c84881d159ae94eb9a84b07368f46ee6f28694c86517b3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..754afae7760b9890a0daa5b3bbde813604ab8130 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20a1eb960c10206f4632a5766d81a5059ce0bd196b8086cbef87d689cc38ded1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a6a3d8dc853388b76b3e1cab993b6e2c0d56217 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d1b42e48e4f2c759ee012eaf494f3752bed9ad4ebff2ff661c502f4ee0e2ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71ce0b939eac868c276392c2fd3acaa90b787902 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b100bc8788699a07a35ba3639c311f4a64320b49444badfec02dc5177d5b67 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1ab97707d684452ac2675e4f3455e7968ec3020 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dafacab78a0f79712d37fc1a622de49f626c56f7394579a900ea7adaeebdd29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e88c0e770c4962c31dcb9197fb9510483645903 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820d49e81849c7cb9af4c819e62ea0b0bbb352ef91095dff587e1adeb20da654 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8125dee93a27ec2b6ba958d91b704ffe226180b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75aaa38c321e7fc1cea6d6ed0ffc320cc243912eb8b0a3026d4a900d5986869c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0505136e93fd0b6ee6d3bc96d3af224fafaeb15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca26a1cec23334cb7ab9ec56d592e39ec0ed54777c873e61254b6dbe78a85d40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..805161213302842a4c75866fda6498c2d1f3e455 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:030b5bd8274c3ffe6ea970be05e9e83e0520eb2e6411b0e6a9e11345a1dfcd0f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ba5902ad386ac165941fc254cbcab56a6014d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21e362bace7241e71fb47af39124d85e30c34909b94c927d176240b5c0cc623 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fa0f428fe183d8a55584eb1f128303fbda248c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feeaf69439c3cfefbdfea7f408465f75542842dabccb28116c2fe295a7138d60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3faa4cc22f615649758d637bf773caf0e825aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b147dfc70aea1a659d9bd3e1d9c672ebf2c066d49d5cb1a41d5e6d6e2ed0e09 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84d516a0102683953cba041d1510e2670971895 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30920736a1eb8c78d3a0823c7fdce1ecf304b1c9f7d1230ca5fc219c4317d3f4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0f78f62ac86f42f3ef4e77879bcc72dfc173e3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff37c6f109f657ee57b9772cdb6f14ab7d16c5b2f25329aec2f8a4e0eeac6bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed57fb600df1e95b8c1beec761f675163f0a4f31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc7554dbf3facd9b3df36ae3c142b8e2c2a03c5c8debd3ebb68bf88a40631f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1937ca605aa86de28a62153ad69dcd013467d36b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a2b1a7235adfc5a8f51d8d10a56179dcfc3ba1c1f9b312f2ac8a964bc3acac3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2082d3fb20a7f63cb64c2aed49f80ae76c172ec5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e6ee69f0962e3e4b19dd6c15f2d73b587a8be4c6d1ffec010df4403252cc41e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a540a97a8c4c3c98da14654b9072335ab74db7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0619adcada143083cbb2a02f1203e96bbdfb9990846b91b99eca163e48dd14 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da706f26eb660f151eb9a83fbb393d8835895b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1167a1a4dfa929cbd164814f78ecf5f1024402b5d603c685156c9ac2ecb7383 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee366b8df396abb2d9d6a91bb41a2d39b0390dc4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d10efb97593fa6b250e6621d10c14b4da27eae2c9945b9dd55283feddaea1cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ba9b4f4b8777ec46ff02e36b07e70f3ba845a70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56dfd7791202324b4effd97032d1ee174e650bdc5578ce5c9c683588a915ae88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a1ce6121c167b376e188899aa1f1c101b9270bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6351f3f6b27f9b23d5522c66c6418d210eae479e3e8e7d4d6bd79f9be9438cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9957f50b3fc2797b826b1afb63cab4adeade7b9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf9d63cae3ee13f9a15c7aa22969c67a3737569886df16f8b2f174c2ea4a1589 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c769b67d315871f6097aa4d02b9755ec9e919f74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9eda9a243223bc759151e9e4af80eedb77e3b81581fcad95edd844eb212fcdd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d9d6e57d2d5e4170ebff5351b58e8982aece9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080b6c29f2717a75ca3f0df7671df390f5ac5bc2deef7bfde49691507f617f6f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d023f2c3361e3f5df54380cc6087403d9fbb878d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e8b31e1b0610a4f1081ca289a6683b551eecd79c711002755c9d68ca0939cfb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eebf9af402add5d060f15c6507619cd98219542 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70d516082eabe61e05b13f56fb849db8d5765be3f997857f50278ef5f796d434 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08575fc7ff301f72592a0bf78691cf284333c712 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b40d0d5bdacdfa28e888571d00861eccf1c112bc7caa11b9b814eab1946d31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3b8f5599cd672c25086f8c9e2b0e9573c3584ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2969f34d199910fe7611202477191d686288b926195aad60f62381a9a15dc55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5d04ac685e0b6eb335fbc4082f7add0e79cf4c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e351a7e1fc2a59cd3f443a5ae5c38cb8e7ad66a4d43254db235d19072396b463 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..360dee623f1ecdaf299e2d34855bebdf2664ed64 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f64b78d58b3b973a2d9abef9b1d0dce8bf5c67db72750345c2290cf208bfd64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5685da6b79adc587645e97e595cd4303ce8f61e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d675870f37fd939036d68cbcb34be4a4aa5fec8c9b95e2ae06cbebca4d574e1d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32c279e23b5d71d95eebfc13f8f2f7b482702ea8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced8eeec290a74c1892b0132c83eeacd405eef3e9587fa2fbbaf9845e007362d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3a9cf2dbe1ae2b0d19eb2cf05f4204c8d9fa8e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554791200799f01668b457670770e6a7aafa5cb3cd1555f4f434b4afa4660395 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3009b14524715118dbce0e94c6861441832da9df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a43c81e1e26a064f1ffe3df1c4630d7ee76ee0b8f2bf9a6829de2d54b5d0342 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e937f3651d3df96a8387b91c4029e8315d10389 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574cb8069e71bf889480dad683c8149b718a5c03219b2bf81e8eb5bd5692b4e9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d16fcdb5b5fc66579a0f7d2d42eb6fa2ec3c818 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cbe2d5e85121eebea37aadbbfa869ae8e975a9d7e010a632585a62931d9a824 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dfe2da4189cfe3247cc815f80f2f14fda2cb362 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b9abcebdd9a5e7458b482627ab217176fac81cf141024c3b59d63b5e00fd3d6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f021c034bdb4b57ec7d8678aaca383479aa321 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f675a911ba3b1186788602b64a8c75d0635dfb375bd5f63c40c7563119cf96 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad40f33cc84c5f5f3bc96222a56d80368ef89a83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86db4db6d11c0a2a8ff8e366691618e9713ee901e25876e0f8bd7ad68841e677 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b6aed8b969d968b401113fa11dd9026cbaa1d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d232feeea38d9fcf13dde82236857b58a6542bd927e01b706d5b939b4d91933b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad34316bfbe39dca16de9e9b52e1a3d62d501533 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcec4d46daea3012cbaecac744de5546013fbc3e0b37e30c1ae83c2d205efef2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..723af41f3da1137420a8e5cdc1764946355db2eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792b8469859865f90d41e7bcd6a78aeceac63b64a4d846140c2d1e46cf040fe1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a59448c1a0ff9f6a2e42dd9451852475e1bd73d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543d3372c8671f6e7e3a19364205239a47d8a746ba4e07831ccce915e5ec0fad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ff786ff0747a506b595402e6f133b1eb012872 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e106cd02b2b5340f5f4d72a1550044af60ea9b0ebbfa67a8312d5b8993e6df41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e48cde37f77117614d45b7152988432d19ced9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a5b34dc3f6d2a76427577699b2e40faf2a62269e96f7a34eac7563c67023da0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af0167281f5e86521c52dd627be277cef0275fa7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5002122caccde02cd6405c60f101cad70cdab3caa685cd94dc1cfcef87b0d4f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6c590cc81f1efc60675866035501a07aa8979c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33635bc7d988d5e559e5a3fdd47a6bff4b77687a481e2ea0b7aa73bbe3f18353 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f009aac18a445eea0d0a1c6af13b72d0dfbf3cc0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a233e40e71c00e62976b6ceca3381bd594af955277aa5dbd080d5a37bb505e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5faf1a15c3c085465ec5503e41169ecc2cab9be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bff1053174a942d1b4c5f1f0600309462fc282072c84376e8f4e3686200028ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99cd69bf8832e699da7459a69467b931ad6c4b10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b648b6d3191ed4425b5fb392f397c8448ffd5a8462123b4427d0cb17b63973b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87b1e28e450a1406330f0c302aa415875ee3563e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c386d08872ab1ff98f3e72b095e716e69ea925b5ae502bb20bc15a88e0e4d4fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a065b42ae62b36b52c53436de2c6c0c697a3110 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ece4ba65f4e2e26ed21dc55691af4abfc246a54049525e1b672fd6396f845b02 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e06802005aff3cf75033df470e5192f0057a7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f5ae212f6f71e64aab7bbe48ccfc004392b13375e543da357c88c9d34f8c5a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a539fb6785d7f9f0a42098a44f1070ff567fbd74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ff8599fbffbc9a6f4ed2c01553d2adcbf025dbcee00f0cbbc61e590e5f4695 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0056ee8c393d9e83d0bc9f904bac6b9ae0bb0e02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8749659e23667846209f6f033bba53e5790af44d439f0fcf17475f3a096f3de9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d942f4b0da1486bdb3cc1ee25ff5016a41f1a08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b00f242cc372b9b44c88ee470a437d064fd687f840952d26ab8e30a233119005 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fd8e8bc5216345dc765845fa30adfff96ca36df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1460edd87dd25b3599fa7fc4b5f1e90515168146c04866c5aa96e57eebb8707 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ed6ae4e021f3da2da99e54eda161a58d000e1f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3629c2d83c1a143ca300d1b788f091296c00e0a16ade4a4705855ea5a8e2778c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a73700c3df3a492e48af2307579862b64a93a292 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b821e65a8f1a9408874669e195d8446a1c5fc1d1ff42d629ba083309c27af32f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba6d03ad491da8b7a9a45983902e5be0211728b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c9d2a2be6ab30fde753cffdfbefbec3a7e0fc080d31e8506911b233b1c0dfb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39e04db4055ac9a96b8af52469d96f533330a89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38c6aee21b696c57197239822351f4d93a31126428da15d4082a00c23fb9d4bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17796e272a9ea08d62dd41307d98ca9869067f3c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9ff519da87d330ea1dfc5c24578d643119748f9e8228a91bf00c622b001a34 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4982ae929cc288f0cee4b297fe6ac17df59d8c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505c0d751cd7a8256b83e60bfca4fef9e548438220a624d5200f6fdf58764477 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd031ade5bb35bae1d25ffc1a4ba51b123143621 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6dfd01c36e6cb83c9662a109bb309bec1c0b5767637ac7f440a0f07762db3f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b00a23425be70725de54afbd6fe79f6adcff895 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a952b2ad3f3e77c786dd5b6170bb4c2b63115a604ebbeaf20075a38e7333835 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa37a2cfe60d3139e871ad2567357d77706321ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2aa7a9386ba69dc9cc6259a973e85ee3c5b3592215e55287dde584f7a907c56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f18fc4dbf973fa582c4c8fa9eede2f11c3a06c1c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e67dcd1d15350640458fea01c394e4d30a3a12584d7f9d44b7f7e20a261484 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c433b2f299b8b1110307cb83ec582c6f9f450ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb332ed1260e26e45956bfe765e1697ce69c8bf0d214af067cea125d75e549a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a7be9f5be94f0b7ff3781eb20da69e5a43bdde4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbbbd765141692478fe17dd4c1e10f365a8f42b1ee4e04416015a99d14c455b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a97434b5ec0ea2e3611e5860ede1f5abffd84d24 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1ac2848692a026ee762a09a93e6fad55d64b7ccbfc3898ee9185e3637bc28d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a85bf27ebcbf65e80078394a9d5bde98430a2f39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e15cbf227049815053c1b71cc0de43a4bfde6edfa196d227bf534a3b6dfdd00 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c66d86a2b45e27c9e1398d535b6e8caf4bbf7dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:649a9aaf26ffb702686da5b91315061db3ff8e495622917eff07cfd20cb57236 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a77511bb0dc096946051e2108583fb4800ef8ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d83a889eed04c4f04043f911f9f424b8280ef9012961be7e21bfdc65bc7d06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f47d950185585dda1855f98c19f905af8a1523a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b9dad05fe330bd52ac69beae35a80bc5f5c56f623f3c4a78c545b845d18887 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4064e311783edd31f8eef80072597310b57e5f62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e90183632b3b14c34da97d6940a4081e5ee65d8b2e2760f09235071fe2726cec +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..596fe32dfea78c2cea728e96caaa0b00d2742650 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4f04818c80f950c57010b61815d7484b241ccb67d1ea8dde3c529d5fcaa804b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66e3767e6f69a94b842958697035e17f5e76edef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08089925572356bf2185363d30b804d40657d537dab92053724e203640c80a27 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1a23163069f87cf3a27c2534aad019ea9e1349 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7b2d47dcb03e2021dc553a6502e95bbc603f9f17528621629c979a2cc2ac1af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d8c5f83c28e882b5701565263717c9b54753575 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a28b918937613391e188299ed79d82b35fbf72567b49ff914f4834be37f7ebe8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22a2f6bee54dba49bfe73ccb27d13fa8413e8205 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dcadea25f7aa0816cb018cc430529280919fecb1be3b8fe3f0f26cdf5e1cca7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a415e11d5c3698dc34b2f2634e61f8a61fe7607c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc9f9ce346e198c5be4c67284c71116732721f2fadaa0c5fac578b9f90928773 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb39ceeb187223359052b40739ca63a0e3c8400 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:622a3d1d6b9a607accdee3b60a0a34964089f20934b4a2e06d9903722cdd7b68 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4066359c879146416ce31d95f66e195cc4f6b0da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d541f6f7770500524a12aa88a3139b4334fac61e082d040a3ffb530875231d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c25968a3e9b213d075182d312c6a5d0f192c86 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda0582f86afe955e7a1cdc8a5d4988fb0e81a6c5587b1c0d896764be2d2c797 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..18b5745f18efa79829cb7a6f510869ad50ea288f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:838c727c9e7bb4f6baccab46bca951e2050496598121f1a9d885f7c24052d9ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78aa3ce576c4c80bbc530838c317d4841f781a26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee24c9191077473cf4d727a0774b6252798f646f8c37d0065775d890b7ee7dde +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2288e17f5d0d24bb652946c0be20147242db5bdb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ac5039f409d18b8568ec2c39f467b01ee83938eb70372d1d45662c2f92908b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd015653685002f565ace0c98a474604248915b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c14b8c03732b0d746375b15d42c7b18bdef2dfaf2c4fba707bdd20703a61904 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..12648245ea7dae558fe26c7e05b59aaf5e5127eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb4d7c5705db6eeef3b2df909cc291ccb408452a67a32b2e2fb788769656020 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..531a3d2e8503f676c26f6de9efbe40764b840a08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ad11bc7ea3c4b2a9fc1e2ad9022ec4030b1a99ad76d8745cee3b1291cea765 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32a4b6ca051a32ab442ff2a88639ab3253eec4d8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910110e45543b36d36239ed9f76b8b518deb1b748c1af2c6c8af59b8f810731e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..14671502ebe9fb4f39d059f6e4f8aff0b4403dac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d201d498462e03b9faa4a3a0337d23adae3a881f131fd2edb6c530e6860395f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae231bb4e9acc8576f8c46218336e03efa04ccb3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da49c08584c31386521a9f0999c1a428310b22949159963d266368e27c5c02cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6480e24e03d60003544cf2ff9575c06577e7b51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:502769d781b3c2cbff669a80174434c06fe1473ccd997cb3076e3071c6c30054 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8a87ca9a215338315932e096c20b02bca4ede09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58ffb2750ceaae7274d2076577adfd463c2009b11e1c378778d7bfae8b910ef2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b320839e00cd54c4820696d6f4e3ecdc4c320997 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a04637be05ed801bbead6c5e984a71f1d1657b721d6a4a7790895b6e267bb38 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0ba0fb64f8fdc89b4aeef6c3a2b1f4c5b36e7ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23e990d7f74155ee54ceee94e58424a95c41cf98c7c8085cb44bc079aed9b396 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a39042b59fddbd53afb799457a19b3882827a21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2ff2fbd6b439053f885fa4e41b95f6b0f500ef8f045539965b57fdeef9167c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb4208687f53b1f612837a71736fd309775f31b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd5b5980bb740e0c2fcd11120e2f074c76a6a2fb3ef9cfcda1a4f0075386678a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c857d0c0dee0863888675d05a4bd8266c96021d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d6d9d35da7ebfaa34ad1c852ed92ee1fb3500d0bc30d8ab2aa503910ef23c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edd2d13e2e8e332121318009b230f8007c5c360f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6634b93cc923531adbe8e40623d47113ebfbb742c6895f58605809fd557882d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc54ed176264bb7ce3bb3ab3581fc647d7b70e22 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1ae71e6a9735e9293efbb83eb99ea66f3816bfeab9213b12cbe05d05f3d36a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba6c203d60f4005fd0ff9f5ee2aa10d149311dd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a434d64c8ec5dd079a37c42e7210dd9ab0401d4904cfeaedf27934b753e063 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..618ce0e86d20867f9c882a5dee941a7a9820ff4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5185c441c1e8d3561f15852511a0c1fd4b481028fe22f10cd10487cf0fe078b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd7762319734a95c608f0370c45b65f3cad64ca7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4b0710d0ead78527f20624e10001c142257698bfb5906b2d587cb5ff3f44ac3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44a6f938014e30d11f0dd18dc0aac21c3241b327 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f2d8262c3bb440684a169ba369d1fd7af84ef801518fd9a568a3840be2361e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f922c79a1ff962fcb2fa69c237cd4478a61b59d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daa4241082a4759e56cda9a7c071bf4f2f6b1fd9718fce3bb0f0865627d6d9df +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80fe5212d9986465500b4cfcda6d42919f0a8f6c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4cc78699184c5ecda4a371e6b9a6e8092325045aaef58ccfe78585adc26acf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53b38183348243839364ce443bbf6f5078de4868 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:155c069dba5984dfe3d0780882cd4ae7b4f8b5ef06f165744205ed296c2287f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75048cb80d056e898c9624cd497d8e1b22f0453a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b656a5fe38e6ec2899ae3cb551c15b91a375616acd9dd6f36b44bee89fad3e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d103b4bf2a6b9083f1ffbe20e26d1691e7dcadb3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74edb79a6ed7187da75e6c1b4f128d5075be5515b71e054b26ada6b577223cbd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..712e45cb76ec34dc05878ed477b19610bf07c110 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a318acb7ff6b21c20900f4f8161b0680b53bc8234f5d9d2178d164ab958725f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f236cf7778942b6ffba1dbebe47d12680734796 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b99811b61a71c34d8f55a0f05ce472d959a77a272dbdb3cb5903cb36f221f4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f698b6eb634705a0da7b5a5065ba112db8151903 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7c845c208a33de002a992c3cef1a8b72b6cbd45cca2e74b2d5ef71973dc668 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b22145e42985b18d58619a04f06ff4b52fc5054 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea7fffebe160fda069c0edf179273bf18e8466fb6eeff20e50005b36a2e286b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88bb525881050fe849b2007d350af3700697613d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90cde46a3e9f9c9003866f9aff235062745253515a5a4d6369412511a55025e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fb559b03b3943aced08cc2110cb2be64f822436 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa3bb6d988a3c53219b657774bf53442b55cb73402eb18aa9ceb1508935f7fb0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f851c955d340082be9d60097d843397fe240879 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_10/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93381c8820811c9f825c3433dc0731185550275984c886d7f268696e7243772 +size 11395