diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3925481e0fcbbbc8c871ab5c4d45eb96887d7aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b087e7e2bc6dd436f2ab8f995c498e33dddd72798e9e7cd561d27252538adff9 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb895cbde7d07a51e736dc7f4d1aa370aca1cc86 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978d5fe4c7e6db72667a8a849dcab3227809febdaeadd087b768dfc48b130854 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..170b9d50af0fa9bccbe22972544bb20597e8ef28 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e1526623c769a1149bb29bc8b26b02217529c1dbff64962955534f9bdb1646 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08dec4ce2d7739d37e5f3d2973d180101d357982 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:936cb15561a76e0ccbd18b2b51e1a0b1162f0a271eb4c7191b6b1ae36065e2f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39b95dbb63bf210fbe602e24d806c45da712682a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5476b9febeb4a6c02c2ddccbc8715221c65cede89a24b79d674ac8613ecef38e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc51cb0f022ba42ebaa1ac2ba372a2966cdb90c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaee1a529490351ddc268f3e3739c1285bc1f40725500b63a311191c17c6b8de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..845716bebf4cecab221e7adda60b6246e3ce12c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2efaf369759598188b2d27ad3ca9e8b91593deb21001167e743a4e5e59aef45 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aaf8d336e5b287396808007defe9f8cf874a88b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba758f3e82f52a07ecc5082f2aaf154de1d4117bbf30d658697be2d98c2523f6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86d2e39fe496b25227a2b3f931ab598c23a20191 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe50e8c3c8e49666a3467d0badd88a4f264563aa4ab72f6b9881b296fc305e3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b3a253edbe8d2c9439bf17045eb2a38270ab2b7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31119f23b991bbfff4b5076f304227938716159d6d160284c9ba9a8d9e0d7e80 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9f2c1de486b8f1addecc7ca2610a291e9c58248 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91eef6b3dee3adebe7c27deb47819e83aa2e7978d4971a886975dea32196fa98 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa681618e522ed68682a10e780b42aa3fa78cb4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2689c25b92f3acbe58aa05c6d753b71086b93d749cfad683064a4bb81c43c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..853e30170d83c5399d09193603f5e52e06226e04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601fc382b4fbf0f61753f6294eb4d7343060513974a6a49376a071acf2a3a3f2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1a852340b8307329de984c527fbcfdd13e0091d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67013a3a235b0b9e73a885982bfdcd0a0f4067b66277133d2f9c185f2de25f7a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d4369c94244bc6157388c677023ba81833d3d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faece96bed785f2ae7e47e0c83e1320045534eac970afbe5661f7f0e3ee2e390 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f52cce4e04e0dcd1fd84bb0a29eece7c33bf6826 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31188e68de624a57926b95e2f56cb2c47673adf6dd4673e8c9db337d401b9bf8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e592e3e9a45261dfab0c7ea446afc7aefeaf00 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517ed040c7175cea619728ec7c8d89eedfc42765bd0f6a7cb29eaf0e97223aed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b8b34d25a7785970e15595f8f1c25199bc0e48 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c8a1dfe13340cba7590cc1fbf7b59eb3d85a8a60dcc4baac9de9d1440d8cb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9246762bb7fc9a65b65e345ca4acd1705371deba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630977a4947dc00056c271a1c9c7658ab5403586a5e384248c0bf0c007b4cfc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ded08091c3cba53cf89e9468b558efbf6fea419 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b65ccd046990822d6772afd1d8c66c27f4806dec7d08303a644accad8e7d8fb0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..782d4b453262de9f6824a1ab85d51be81c9e5ab7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b711607cb02f3673887183cd35b21e5eca1b95734da908685954480beadc0d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d510c168aa8e9908f92b2ab957637ec64f3f46c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd462035eaf9824122d4d6d97e6eafa351fd828ebd2caa2b77afb8143860f46 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3781adb4fe4eb6a09755a06460153b58821420 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85dcab8dfd15ac3b2ef926384f7a6a287933f33500d0ed35220ffa7d4df88bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23be2792540692f7f5d6c779b38c273e6c65f4c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d02de1c32a6aa3346ad2c95421275bec56ee75e97b5dc3ed3679734522bbcd8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe3fb825d00487be9c043b94a28ee0044d399bd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ee6d55e964301d4a148b5e029659d38661514dd1ee6a40c1609bbe5b63110b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d71a9d8be3286450ea72034d16c4f0ffb9fc7c0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a50ffb18f42d595f0aeb781898054564a7f1c64bb7e6768fdc9d33546716587 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..afcb7ddd5cf5e9a1f1958da3874a88513e583aed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ddf1cd289f53cfcb198e5dff61296a48d7591fa996a3084952924db5bf0141 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce9f99ed6dc9b920d71a876267286aa7bab08a0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4108e8e6fd6fd5265a53c533ca28ca0b5afe77ae45ff43962c75af1c3043e183 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..008d98f8b2e0729abcbcc62d26109ead1a9caa02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc1d2e6088410b7391439a58667c6db50f0058c2a7f08b52c2e8876d31440e2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c6ceeeb051ba2119d4f0d8fbebe61d952e9b58 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7c1c20413ee7fff732f5c9b148612f530f9af0e7e364b772d5f0b6be5438e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c58e9e980254357a77f909af6375e7feba429222 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42629aa2fa50304fdd0a90e5ace599a7188ce886ec8ca256029e83a773068bfd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d575791731ecbd87cfbe77deb66bd3a5e9286920 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92254ec3a38a08eee2a9edffda4b462b33b699903371d249660af85ad1b5eaf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a859cc5a18c4e64d848a773f0760e95301b0d0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86baf93b55326286a0da0dfc60f6066811050e38622eccb080628a707008e04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b469a0a1589ea43e9293e92780a7c9c37cf9c23c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9534e530eeb4443e86b0ec240fd13fb61e39119c61b6ef4d586ba9d222c7962 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe9f3d0d9b6f0de14351a85bbfe3628ea9bba621 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2965a2e68e832d9e1d51fcfee58905d3d42ba3077d90154dce34bb1b04b6aee7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71e3f7b519ef6b6c1cec753c76cf66efe9227509 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:731f5a93c6b74babd5bf7b08dec50ceed40440f92f045f476ceb7d9eb5d925e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9599cd14ced6281c5036193a7cdce6ae5ae2a9d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bec30ba921bc3e92060e248e56fd1e1ab828aac2317d22c70fb7a24aac8a04e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d99463892b46079a6092e9b99081dacc40501b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff2ff4b2688c281ceb06706b4297583ceaeaa6f80bb3c4caf16bbd4f3f79d390 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2661c7069e5baeff67d9a7bb742087562430b948 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf4fbb1ccaa38ca41b538350c872d8617354d7c0142d3a56f96f595494a244f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a300da7591fe337e927f66753b970f21ae3dc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12564c015b4b536958b0a4c4b514b1128225630fabf003b0e1c04bfbf1bb9c3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a7ad3a2e78c7046ae12a414de9fbbb3000ca5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a21f28ea80efe0dcd6d44c125785ff98e8f2a2104e0d8867b6a26567c8278d7f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35d6b2560af811ee38b321e0015b134a6342653e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c7e6f74bde863c4361b88fe179c8e44dd5ad4dc68826a826cb01070d7cbaaa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4d69f945dcd317d5340ff2ca0117c5221c2827 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51be50a6814e539fb78a2260fa71c8aed32a19a10b30c1442d624ff11ce546d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d4ba2c81b3e5d6aa1f8662dd9abd51c65e16e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea19087f3d71dbd6a915c544104a486376c986c62b4c207d8e4d9310a0524efb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..863813ab75b3af9f708ea3b7f39e91510c919642 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ebd5579d79ab5aa7d14474c750a04f0a345a33c8eb7dc771f3ff1301003450 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf7fadff6273dccd81a2b833e6381060969117b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e1dd54eaf8521663f05ba926f99f686c2e77111cb9b7c1022c7e38ff696ad7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb4d844e78b55a084a2b8d5c8976786ccbad1c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:919fb48b4f6ffc92689a25b4390de17669a72e111fe51d0fcdbddb0c12a9d10e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c33cdad151ce2a411e4e9919283186b9970cd1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458cfaa1d04abaced3f846bf8c064870f67767f24a59cf4a7f900abedac35678 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c96a398c6a15d14f1fa47b294105be91192cafc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a870cca6c368eb961f52924c148a9cc445cd65add22f7c7348de378dbaaa7d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85c0bfd94795a7bcdfca29424703a539a97c7e46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a505610757ad59c29817bffba0e2a4e2bd5d9596a974d517f795b299aa6c718 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7adf72f60902ef66b612b1d793d553f78d654bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46bbce0c3fe203b6535c044be68cd9905f30e0bff084f687e3fb157ba264f574 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d2da7513beeaa89e29915ad2c7f2c0629370daf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f67a4dde3571038a30a1b5685ba8881d428fcf755c2ffa7715dbc5662570777b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c623ce3e285c04ef3336d740c483f27054fb1035 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e803ffe9b11116820582efc8d29c13c79be9a3d7e2ec050cbb8b0e7aaa335c3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2179d01e4391bf833035f22e686217bc333d497 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df71f755a62c4090f71873e493cf8dfcbf2fa4d0166eeb55ee5d1bc5c804b208 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3ccbbebf18d5d80ff6d7685c3481faa56799ec4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d3ce1f7eee1cf8b015f28c6b3df5e043293e7343e56af4fc34f889f375eaa6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa5d824385ab7fe44b6be446f4185a2c6f4089e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8633780ba7bd5dad86f53e1cc3cb86169c72bca9c0d9dd0a417678f43d13167 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9e89e80c75891f159fda0cf4662c2a42ecfbe5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0a6a2eed5e6ee556f315a6fde7113da62619503cab98d778409481bc75b5e2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a95edf3c426a65476b1a46ebf44989950719592a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44905dee3db9106282ac4c7c10becc1614340f0072291496dacb7dbed9cdc5be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1472c48eb934f91461671c2bbbb14f95097fb87 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5215c01c6df3bc029a127900e2c479e3789610da0dbfda3eec3fa84a7660cd16 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2731d31348ce507a93830ebbbacabba3c8ad59 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1f28a9a0221b09ea344f0c5dd9aa07c1ed61c3325e7cf548019591d4f7379c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5eca95dc8accb761f5e71803de62e1e1a3603c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24152c03e5ffae9f97ed7c2fdd7d6d4b0ebe70f906b6e1280865b8a3cc0787ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d40dbebe5a97bb05b4f2be07be1e7c31dadecd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33abc562e7e53d78a73f8d8d9ac2764b218f9a83146abdca02d158edb8556884 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..584a92bcf74bc3f902b1202cf3c4d158568ecd54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b561e20d4133d395602d2750d65d47802ec5ac1c522851c5ea79517f61e100aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d29bd525556d955e35388cfeda6aef92a569e224 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8c344e37ba3a366ee3b07d65fdd33738362a2dcc563285be5282035f6a61bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aefd66becd2d3a2c9239c0ab94474e24ab81b681 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4295129b70a818b3cc7f2e0790ce04f18962982a6b1d7a41ad2072b96a7d508c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf1d7f0aa04eba51a73954752aad54c14357bafe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa125f07d0a1e463a4d5f05ac47726b295aeebf658fa5ce29efa3aa58ad41d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f3bc47e87b472ed91ece0f4329b40fd290e338b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0eb349c98fe50676eca9b1de219438f6d29704141f726b626df7e94cc26fe8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..230e954e5cdba88c952e1215753d13db0a46af88 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830ffa44c3061b4ef50abafcf6a3f8efa94e526d5350c3579843e6ff5b05c65a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c620deda4cb4af464c292eabd88dec7ef3d937ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb601119a31d44a1a3bc37183bed5dee93c4827d3dd57081ab983a2854d0ca2b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6b1af73d31a6fb998f1eb9a0a5bfd5af77e5c0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aecda3f82d55e6efdb6dc84dfb0121feec635ec03dbce83f924c0d9ca1c6950 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79693f507963554ac3c884ae5057873b625b299e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63636147734e251d2f5b8b64d2722a9c5e2134a44dc14bcf318f304daad73b0f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d01d98a03f4e1ed498fd55e7ef60a36fddb90928 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6f51405e5ce52cf799ad01d659ab7bd29582f1f6fa3e90cff40faba216d985 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bde199f019b83f837be4d43936acbcbee76cde3b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aaa0118489d73ba7dc90ac15b0bb68ee514c02b587345c024223808a7769c31 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa6c365cede51427d0e469acc992014ab4801111 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a364dc0a720fd09448bc30d3e57ec1ddc4b8ec365f2f4bdf8c3ef42947a8b5a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c9c29d521a23bedccb6918ecfec346ed182dc8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2245952c011ca550abe55600b0b8b2a497bcaf25c53042cc16d608a6332ac4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b8370d5c841567d43523f3eb5f094b32142942 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a508a7a746068ea1bc6e79446dedacab4d3902d64133fa93bd9bd7089472dbe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79ff3797710f3e44c1f47f2df3d4ec6aebe168e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2096b6499143a8c4eff9b43f158e6e5e88836cfe81035ae546d00e3757519e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df17b3f1632ca0978e08b98ceb11890839768216 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:990f643c5762ea714e7305d63896763e1596ccbf69fe7da6d7f81a9bbca9e6f9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d099fccb086910a94a46d26bdbc84a7f9881556a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e90b39ed94ad062597b6a57b57e1c4e902c68de3b0217d08e585e651f1530ab9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48014bdada572df4ed554b583466b58f84e909fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:566b29d0907b93946258273b292fc80a1633885078ce8d9b304a7aa849794f84 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e26ba0d3a47bc6dd3c40a416d1ca9f8142a02b8a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c085f8182ff35c36030ab6e453445629c7fc5355eaad46c67470aee5a56b097 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5596d0a0dd88a74379aede4640b7ec66ab344816 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96807be795c37540210f0f9e556271da2b04b45a4a664e24efa0a2dbb5499e05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbd93f260c74a04101ac585de0a0588e527d157 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5de096b4066213eb371e882c70c3a052f57a3ee6ebee4ea5e01bd47f7d79e6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9965a80b66edd956b0293e3b519b5311deb2e01a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6555922034b398922bd80828d85157c34d91aa4f1132bea458cc148e57bef1f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e1aa1dec663a38beda248bd3d6420197604e5b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080ef07dd4b82a5058087d46988464efae32c4d76192e528dfa0f0761483d023 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41dd30501a25b63d437feeb561ca3639be4934b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47c388ebc2e8cf35fa1966216dec0f029507cde44400e9213f754ce3f36ee16a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..237f80562066571125e8713f6560a452decdacff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9fb2d9556d5ad3e6f7f4873402d274b5ddeb3e16199f0c609eeaf037ad8b3e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f908eb70d7ebfd2d49993e2b4d6640d52c56b6c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89edf21a507f4e998e966249e53c8d65a1b0c87c479ae6a5633ad8854532b545 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33a8c8855903a1e21b776553b563b4c3438295e8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc186e07e7256b962f3dbda7baf62a2ca26c50da0c9eecb551080c6abf83492 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d48ebd48a91101d03aaf868092c5ad8667469d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665d5cfcd063f068d603e58914248885492e64e006d97bb19f7cb36b75adc73e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14633e09841eeccae2977d9bf07ec473b2af18ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e8741c5e60a0ba08b5ed061f925f63af1a60aaf9cb8dd91c747e079925e658 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..504fd8cad5b46c7c5710cfafc27ac5352ff58142 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18bc79dd9149ca06a3f04d6c4c154106c04cc633bbd4ffb23c921a768b2fac9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..812b04428d9aafd994566fdb2a9d20037307d6d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d29147a801f7f970b6490e798147001845b76de759fc9895bfa0064ebecfd670 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb8b183a9e3244efab40ab99aca7297325a91f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb77557055570845ac78296d8482a8a2654fa4b7f07b448550ea49ae94b313b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6642eacb8818505cc4415ba58265d6944def0ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c603c76f465f8a476ef122a083e121f68a079ac939eea6886cfd24b9101f6d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7460e4dbbc1c42b781f8cbc596b3e503d86fc9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d981d7ac996a47ea17e2acdb92057de71ed6a1d16d57b14cf88dc3acb34dd177 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6dd6d09d78340a8652bd60582b5898ca2d53b31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b521036a377e1a4bbdcec8cdf0817a7513f6ea6c4fb3b417d1f585f90af493 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae0cb487ef14d4e83203a2ce97efba4f586a4929 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c53c4e93ab1760ef74af20f0615f8176567682347e949ced6a2b2a8c7d089ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8c04ba292b8fb999334108c42a3215ee3d2207c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63ef2cfb4e8d40708aedd8fa9dfbfd524f75cd56c794fe2bedf24682de3a8f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9828eab582634f29b214c1cdc60c022f4020e3f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89b7c9ac89394cc3e50e885ade13c507c9c728f726bab8708b6e908f14c1152 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50c006876b3d41e6b87f6516e9e477a1ff2baa5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9520fafe51686e808277a851ac3fe4afdc96d64945f38ad6398a74124b4956f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bc04cc5a9858b1606394b3f50259145f03b8576 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4774db02342161c09d8bf6081482484ffb6cd8e1e189409ee64c8350820b6816 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc708dcd2772a850bd5554316b36b65b9b5a2950 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:055bcdf1fb8842a0f1f35a659a8f4168f3e8cb2a2fd848f2284e0dd622b56447 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a41178245e8920642baa0d008a72dd71a5330b14 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27332c44ae9cdec805ffda1f887a6bcc40ea3b25a88c3cd09605feaecdfbd5d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d964b9d81e16727a6ed21eabc71ea11574a0503 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc553cd897bf353e5d51c50476eb94a2e04d25bde41b32752c31f5df9b20a72 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a143a443ff43280db52c0db7a67b8209f163c5c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2a1dadffc63cd0d75c61665c3b38b23bca4102a3f4c60234ea7f43bdcbf16a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32e8d5228b9340babea6161252e711e0599012c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0bdc0f54bf74e34495b1f124269413c68dfc14ce966dd027d05858db73b5cf5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea7298610c2a6a3baa0eb40961e8c65fce436184 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98916f6f0a2a5ab7cbe459b4108562c814b07fe183de91c3a2491c80eda2f609 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03480e8a1ae77db90d641ec44974c90e7e9cc78a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c570f0f3ee8843812d9d0407d48a063bc344f5933c0dc707e231f1f404ba421 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db2a24072a6df5ca8ecf9983bbcb962f760cb6bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6dc070751c8537de9d54f790853264a8b031af8f6872c8603317a9e83f42efb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..726d295f0349743dbe0eb746955738f78f9b21ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5019aaf0e1aa36a9bef28e45c5ab8477a5c1a691d6c2ee47ed194437fc33d14 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92bcfd18a881659a9ed1fc35021b55ae3faf45c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4ad8abd957098031ab42667d87a11428b863d4ba4d09b7bc0ad0800a22ee345 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..034a666709d4006cd7b0b598d8e6189a09af0983 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8619b3d05195cd79d2dcc3fc0a9ae56edad9554922d12cfb44f3c93bce67ba +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9da70e613e82c1863a1b290c332359c0b26666 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9dfe066f757d624cd329e5f13f9b5cadab30907c461ad16597ad5ef28e5f76b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c69af98f3414a35e90ac8deed73c86f1af5ee329 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c60b68a04ae6669b9c62c1d42d40ca94d2ad02826cfe551e5597978a944c40 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c9b84dbe8436fed4ba883a0a5672f93579bb2e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd8e5768a2e092dac41659bb31671180682bfa618377903a04f39e21cf89013 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f469db9e82d9f057342e79527bc8c04b07dedd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd22795c1b8c4fe5745d40019a80cd7b450be20363126d573bdbe1cd5a01de8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf759dfe57aaf560b22ecd2c46b192b83a9cb2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e05023d1fd97ca3fcc2a0aae133d7c43320f5b2f5a2bc0982c8f4296ba3439d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..193a25137cf4c36a0c376809a1b2b6dde30c69e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025ef8a405144eda76973f3a17161e5710f2cd2911480b3be62d36f40a38ddef +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9587545954e0099f567679c98385786f526700bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23d5a5e26b359d6df143bd4aea26f62b49eec7ab5e2382d719efeccceb86d73 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..912562ce248bb11ae301ce640e39103d662b1025 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4581b9caab9218408a058f01408dd5867e4a36c7d36420d1d4f8101c7fd281 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77860c61a6200be4045bddc56d7cc5f402ef204c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a986143f47fbc524430bf79f47fd65abc751533d11faf4a6fda6295b834975b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce90413e52afae73085e6cc83ed28577459e287 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045482c25aa41e9cc7036476f24c07df2b415e40328ee146ca4a459cd77c0ed0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..575d0fa9438d98bd92a1963c56ed255c5d5c385a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db7847724068d9dcf2dcc48ad39468d0992ecdab2a80acb31c34131520d69e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..028e4c8d10f70665e1b8a734728f85531c650a5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80408b3fd655e95680c63ec2b23a172c491d3eef80b3ae8e63f3e08291f69339 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e710fb5c59447412ee1bf5cca1537735bb4982c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d4c5b8e177ec9d004484015e3bd6803c474da9843e2d1329d5aadc95bb5de5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0b6998b4617c96199336f6ffec1d1b053ad76b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4b087947dd89c365639f6b08a4cb190eca2992c1cbaa645323bd087d41c77b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c132237e01614e322d0484486827bb56a602353 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0033230b04b3d7e02528a15dfa64a9c66faa2293c5e8ef9e004dcfca033c95a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a654f6394b89132d27c2e1af4f08ad01d613fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad4e9510670e53b5ee9cb07f2d1a94eac3db4a31179addc2dedcc5e1eb9d359 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3eaa8853509c6821d9d753a8a6c6a2820b8fb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:684e3720bd564c0c131c1a5dc5ecfced0f53b00e4885cd7325d4fd92801ed532 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5072998165b27b06edec1d02a44721540458fd7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b276435c324d9719dab269230955581d21a4731113c43cf759ebba0343e085a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc38deaa3030048307d986ec375a8f352ff5f9dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91013ce11c003dd5adff98db88edc1789ea583be042e62376495f28f870689d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5215f42ca283d8ee940d51876010d3a733625b42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7d7dfe6bf58e1d49d7cb3a8dd8000d146a09c1929413b6bf2d4a039dc9b16ab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc0a869ca2a52946a6128a3ec264d435817c9e56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5b04bb16dc3fb38bcd4e7f2dff785cba115d92e70b45e5af1c434f957e31c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86ae222729e39c28e351fbc20ec9d268931fca80 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790ed2524595ccc208be2eb47af232b2ae42a93c0787e500023f3d4b1f521371 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..517ba87ce8153f9bfb797561fbeeaae9321a2010 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7a40a3b15d906c43fc89104cf93a4f66b850d77574a6cf1577535c2d00a6f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b00b991f5df358c8a407d00b8de618ee560973 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c5a8d26932c314b3832a5ea9d57aa203fbc00132a0d1c2879521b414130b75 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e95388ab6a97c03f1205a37d6d03ca68543613b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154457e9c60211002193ed8bbc19c7056e86ad2b2922ade1b11bdefa67957627 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d474e493ad037b86f2e4e081e3b389f708f6736f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a05ea9fea3802af0e59246bffcfba652945638e5865d3b6b74d82e3ea8cb15c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11c7e4a6ace255ec9f063f6311b2a672202f2f10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b0011f504019b103316f409467951cfc24fe8bae8ca7cb6b04a6d422767c0e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d290fae5760b777c91b52bd55984556f544d83 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b077bce21ff3449ff7ff5d392b1e5cccd8eb38ed1cbb6379eb0ad238151bc6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e735766e318cd10c87d0a92119785d5e94ef9eb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4c79c5dd25d069d5e9f0c316da794dd687a9c812bbde6979460961e3d08881 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4d4da6265bc079c3603236124ea6e537469070 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8ef5d7ff27e86f47584206f48ef4ecb85c04125d3ef06d9bebd5ca9ec2a4b4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93f0048e5be9455c02a82af116f139602e31889e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482ce65777a5b2b5f80ef0b5c1ae27dfa0f2b1e2b14259b440b3dd1fd38e81ce +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc7b4a1330df367e07a951b264bfeb476479b54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420623062af488125a20c314d77f8fa366674418ec6821693cdd96c052a28159 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a30f888a01d46400d0e582b41d254a6df28039 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d2064844778d6f4f63ffe80230fd77b99534759740054634371e57f3a567b7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..156cf8b502c8dfaef41d6b060c94180d47ace27a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c2985d895da013af5114933c04584ae5bf22e6398fd12be882d7c95f791ced +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45d39486f1e55ae58c47c0fe44c14d0aada68f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5e93c05039c90011e3c3c0f60cc6594cfc73520afd32f9e2aabbe0e307f801 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4b6601101aa4045973d4c7a595b11036d9d47d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc4f3771aadcd0966d017466b914a800e3fab487898f330cf9509655df1ce99 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7280cac6b5803e48f364011b3f7705686b573a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626f85f0538a6f5d8bff15ab1c0942611c263535256b10c416dcaa4f6a94b38d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d75bf4b1ed44dca85011ffbf8d39da552f83d78d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9adb6907b9030cebdb27f96e12eb875de8e17b9832bf68c6d880bec1eacc1b06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..893e12451f6b83e124f7183323cb7c63bd6ac919 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe599ea78cae71b58eb51008a2ca7514323d3a3b490171c86c1e4320597cb039 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d52bd562668851531c1882f6b5c2abdddfbfd04f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5963d7dc4834b757f92fe532e072671f3078086af902fd7825c7ebf4ca638a2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52da009cea8c5043ecc65e7f173d1aba3c90a6bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca92e2b9864e760a235008666bf8c1092efa2a13457a71a06a3e8ce2d86e7f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb328b21144fc317e63a92724745522b28bcc8c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd0d815762a8cdc4694f3fe457dcc0cc211c428452357262106bd9cad28bfc2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f87b4d166f5cd7d758f0a9c42c6a13f347957f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c464be6fb240c814210284010e68b8f4c24d0503783bd05237f975b50f98e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..770227b5523e22ce0d59e5ada27d43ad2608a32a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85319da1424105806c340d75953da2d92c58914659e607ce815d052c8a6bf97 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54500368afe1ce3c27a5f3bb3d556f59e30ab25b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68302279244c73cdac3f6fe523270e75bdc9ada828307522efe172428f9081a3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2442e1f59cbcf2c7b371a26e162001dab4498b9b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8829a2678c60bd87a42454fc06ecac202196bf579b2ba92d5748c165e470011b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e307cec1db8c9f0f0a0842c7d455189f59f778b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b549a0619bebc61bfd0627a95239d553af0ca3e29f66e7ad4f0b0b5385aece6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e03664d1b9bbf87cd033210b2d4dc19cbac9e816 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:455555ca6bba55a38e93187ed51ac067f0a73e0e8f2c779acd657c4ac58288b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed84b056662750474a5b723f95748fe39a045e24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce094fc791ae10a2d3f14d3ef1186cd5ba2ffd64834a982b01d1848b432b963 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b77be3af0eb60b481c873d2893bb2b64267a2e44 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed4e31b581912cc3a95369b1a99c08566d48901746afb9df495480981225e2e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49c019d3d2d931ec010a70e6ad93f158b61e136 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3241781cfd8a1043d50fa48d23340de438d4b43c5be3051c6d2ebe3dd8a2bfd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9bc0c2148a79153dd6aa000ba6dd8bbc0b94ea0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3140dd3c7a73202ecff8bee421b3eebd30ad6ea45b40b42f36b3f7493bd65fb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c358e7f9877547387531bbf5ffdc765c3c79617 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cbe42b9c1e0ea7e1f3b589f9d01cffdf0dbead998d36ca9b8d6055686a370f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b116a73c8db900d744edb1b879ba2da488eba10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd3c7f605b3cdd75c7d71a7c0637c99f162d7709ae99358f108f8e1c708e0b7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70daf88afc60221d1057b78a8fc0e4807b2e627e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d72f6a8897b208723c98ede1beae5dbe71903a16fb55b661c48746b967261d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eebbc5b34c7520a73280f02c3caa4e0dd23c1e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a31dbaa0da55ae487d09a50535dbe196c0bd815c1c3aeeb0b9c13b08b2b14fb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc8c1c80072cd886e4cae2de5b4d9543bb223152 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c75e78144430b9d14f076cf91a5c7e91be8b8fe5bf4c2e0e0e9dd348ad6bae3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90daebccdefef5c545193c23ec2b285e58d7e864 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161a9398d45d7e100b02a61723148dc0f0f2ef482b96337b3a02b1f70563537f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bee69c0322bb6ed0249e46e454e93d4ded38bbf8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff4cf3a13f1db6e0342cd2338a9c4edae75bb84bf349346d3d590ac42912dad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd1ae45fc49af6240a6e641a1f9ca041570bc9fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8802b9bc71964587832c9367db4f418ad49e7173130ffd0f5054fd6a33a2cb24 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb384964ce19d9d840a63aa84deda2edd1d56464 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b73fdfbef70855d270363313f48cb1f1bd08340642a8de778424fa8531afae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e769ce25ecb79b7718de1440a04668aaa9352258 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66b450f3931e545eacdd7cece482a42ce789fd6a698e4fb57e6af7cb7fce108 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71a95f58833227fcc6075080c38c953490f1cd90 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25fbdbcc7cf49f1e194d8e475b33e51a50024ef563e023383bfea1b6f4d165f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed96d0a2e77e8e08775417df5a0437b13eb45bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70d4085c8c6d5e0300a90c4c833aeeadb5b8f41bade9116d1f92dfb3828da7f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3d4459867dacf1b490b5f4ed7fd1d599667a866 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a212bdb8bd90de10b81f87084b7e177c0cc0ad89dd67afad99411582e3736b43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c19d151179d406a3b8850abb5f35f6738a1d389 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9a5d663babc0c1108ec783a1ac9929e673a72a069ac50e9f59926da36d6089 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe2a0f7d02cd18508d4c7135408ad0ee70f4b6e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aa79f73e161a3281d47e34d37a7b17f1fb71460292c5671e53c6c1734919ddb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae0a302d8f3aad5168a1ebe83a915bead32dc66e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b48aa0c024a92abc5afa64371a3f1c2293a42b33cac5fbd9d1e913acc45764e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83a51b62093c929c9d75d97ec34e4f2ebe5e098 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6fe71bc98917d3636612212c238dc700d3339a98205e2eee66c6efb0979e5c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0244f0a3261050da8277383cdbe0248771a1f0dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ecad4186cfe081a49a7fedef0f4f040841956a2a8120bb29b9d456c9013815a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d465eaa2432f3fe8033bb6e509209e191b8823 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec641ab8e740f1485a6292670dd7481499e5b3fca678be6725e87f8c731497f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4989cbd2ff068e992a2bdfa9a5e6c20521162365 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77edb407e0e17def3668c331306e79380a138a5f700ef1a382ac8e795cd29335 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91279edc3385e6757eef60292ab6493a0c9376aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc1bb853d9b8c3bba97467e5c06b2e6c541ba2c91b15f86ea8c5023bc7ab690 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f470dc9d27d91163ff3e0d90ac83847e9a6f3d5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5c2384430a172915fd77ff552e76d502ad2d8c25ce94b7e2e5e0a7e3cc627b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea2cbf6f5aff70744f8a8aa6d75ba29ce391fbed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68faee27a056dab3269ea49a396c3d4c1fea8eac53c18d0c9b4a514d209bccb2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c999920bf35c00dc879abe3a5dbe02ffa39c497 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1725aec5ff1d5bd385eeead18499064b253a4144c59e1b6640f55ba61b5b7e79 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db33da5e7c37ef79964c5dc655fc2558659dbe19 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a650bebaac481481a58be663c1ec8356897d7e2cac9c5c8aeeb4c9cea1341e7e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f02a2dd4fc71fc77b081b94aa9b9bee391093ca3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb51cd1764e959139f0b9fe9fb389d4653572ff9888b8d9aa6710054ffd489fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed4fea2fa60d3670c251eccc8e8595e4bd8f67d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f89a3eff7f2e8a9923f49892fd31ed5774f3e1e602d46b4e8b726952478c21d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfd60b8b8e4e4fab8bfa4998ede1091613ada17a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9951e6d9391d6f029cc95fb66f425c5168afda5f1ab687dfe4f47dac86a846e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0297c5f5807baf677eec36d8c197c863be10de0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6090c0c8bffead6c349c1485c8f8b093c160dd785971974b845ca8693210e9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d6f142a3a394d003542623846ffd66538d909f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c9bed88de84decd3aec49cdf1c345a1898332c8fddd61ebcec33221e5e0814e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..442b4755c72846a7b0f15b5e0a60b234fe7cea74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8adfe8c23cdc0669cbc0292462b2474720d979cce00306f9e607b3555291442e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..794381718127a7f3a3c406e240a6c78abeba7f95 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:168f576999d5c1c1e580737b2919be561f23830d599430aecdf0ac2fbed07ea4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0084b45545f31b0a1f25914252711b3cdf59551e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492115e5f8213dfb5b2824e3b0e595b51912f23dcca8601f926bd86c7d9e48f7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55af0538bcf7552865017ef5ece85a3a1cbf5d53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:722132ebd6a108daef1a815cd246c91fc6f711ffc21a156b7a52f7dd6db0ac73 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a84358c8f4bb4eb3d49a25bb6a1b4dc268d61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eccd58adf9bf2e24edea7156d6861af70f291c67220b2e08280c35ed1cd38bf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3925481e0fcbbbc8c871ab5c4d45eb96887d7aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b087e7e2bc6dd436f2ab8f995c498e33dddd72798e9e7cd561d27252538adff9 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86bbd94ba180e60000f82d44c11d4e7ac3b45004 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffc23b179c4b33de797931c1b00371c6baa00b25d50f41c7e6bc09ec06daf9f1 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..170b9d50af0fa9bccbe22972544bb20597e8ef28 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74e1526623c769a1149bb29bc8b26b02217529c1dbff64962955534f9bdb1646 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24111a1b3af4100fadfd7aa4343c8f8e5c2bc651 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1073ba5c9fba36d40bb0a8563dac315c4fe2b2e6ef049bdc6eb3a8e7a9269d21 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08dec4ce2d7739d37e5f3d2973d180101d357982 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:936cb15561a76e0ccbd18b2b51e1a0b1162f0a271eb4c7191b6b1ae36065e2f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..794625cc600977645cd959c0e33b337f9f14c4eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78ef142046c5b05bd997a995d3dc08fec3e375fb3620ccb7cef4306de61f20a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39b95dbb63bf210fbe602e24d806c45da712682a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5476b9febeb4a6c02c2ddccbc8715221c65cede89a24b79d674ac8613ecef38e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..437902cd711c0ba209c007e7d9690f22f5367e59 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b06a11f25c6986bffd2830b5692554d302cbe5241c2b8cf9a839d086ceb8aa2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a21dc1bd7d76294157078c36f85c768de4b25b3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:017a7e514f380f63018bc111c821eb09edddb48acfc1c8b6c55dbc8839fe8484 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a4c55f354e106c5424db6c228efa940322eb529 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d57b25df41ad55d56778e4a1b43280748e365c62b380c0cc388dc9ed2d2f585 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aafd58148691bea90579ea208f6e29122e6d8af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c637c5f05c60285fffaddccb80a92cfcff872cd8b34865db361c76dfc932554b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13b1def39b171fdd906636eaf3b436313462cacf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432c06707ee745286ec0040683f8ab71351e75d2e9abb0a3c8bfeebf2c475669 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aaf8d336e5b287396808007defe9f8cf874a88b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba758f3e82f52a07ecc5082f2aaf154de1d4117bbf30d658697be2d98c2523f6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c42aa3cbe003d437dab4030d327fe2c10f0d7ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa02dd537d00825f841e95f4cae12f5f6d77e70319c019cdc97c9b0e008bbf6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86d2e39fe496b25227a2b3f931ab598c23a20191 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe50e8c3c8e49666a3467d0badd88a4f264563aa4ab72f6b9881b296fc305e3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..240c7e8bccfd3ef054e324a49cfd63c6469dee92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23555e44d5cd44545d5331168abff77d81870f4c18d00d468dc7d5f76da04422 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bed834469a98402b541a469d17e92c3fa363b5f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92d2eb85b9f2abb5a7d830d54e2c6600576a1e68929647d45a8bef227c75355 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d912ba082d0c0ce5bd50f412686a27289881a3c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0f8a4e86121348874c0b5d41db7fcae6a3f83a4d15f348f0125138a14742a1d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa681618e522ed68682a10e780b42aa3fa78cb4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2689c25b92f3acbe58aa05c6d753b71086b93d749cfad683064a4bb81c43c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..127f769b5d9e6d17c172e1fbc11efa3edcb824b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3184aec0ce7d01e0c09a1d879db20eb214ae5e6a83ff72f7049ec1ae486d1951 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..853e30170d83c5399d09193603f5e52e06226e04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601fc382b4fbf0f61753f6294eb4d7343060513974a6a49376a071acf2a3a3f2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8b990225200ae658131d27552cb3f5c52996d15 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2d3e45f8ef9c190c80e1e00c955e622c11b80e8ea6b2388ef83bad589d68ea +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1a852340b8307329de984c527fbcfdd13e0091d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67013a3a235b0b9e73a885982bfdcd0a0f4067b66277133d2f9c185f2de25f7a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb2aef12821a0ad60cd03cfbb1a5758d2f10a8b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3579ee7a232700d8dc5041e4961705494636dc488de70f1e652472f9466df7e7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d4369c94244bc6157388c677023ba81833d3d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faece96bed785f2ae7e47e0c83e1320045534eac970afbe5661f7f0e3ee2e390 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e38aa0b6ae27d42080fb4615fb303fcb7c5d47a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8131c6c08131cbd8d53933be2a431a88b03cffb846e9b4212ada6462c74f01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f52cce4e04e0dcd1fd84bb0a29eece7c33bf6826 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31188e68de624a57926b95e2f56cb2c47673adf6dd4673e8c9db337d401b9bf8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..573d66d318ddb80d8e6d1f13935d3e836ffc8e9d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:111fa8ef76e63b573cb3c421c0177bc241231b89dba33364bcecad4b7bab1693 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e592e3e9a45261dfab0c7ea446afc7aefeaf00 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517ed040c7175cea619728ec7c8d89eedfc42765bd0f6a7cb29eaf0e97223aed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e0656ee5b6c9e4a06b55390474bddeefee560b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544b8f3b991d374f2948e75bf4c7cca3ffbe557068662c55c7d2535b058093ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b8b34d25a7785970e15595f8f1c25199bc0e48 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c8a1dfe13340cba7590cc1fbf7b59eb3d85a8a60dcc4baac9de9d1440d8cb7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f8369bf433cb56a4d07ca1a607dc455a6c1ad9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3633f68045b97101de2d364a59dc40ee8335de384da300a8ee911372d13f40ed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9246762bb7fc9a65b65e345ca4acd1705371deba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630977a4947dc00056c271a1c9c7658ab5403586a5e384248c0bf0c007b4cfc1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbd3d9bf8eddc43f0df1309bc6e77485c9fe55ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8893b9a6aeebfaf22a555e3f24b3e0496fa2663690a12e45e7a680f94f66ca10 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ded08091c3cba53cf89e9468b558efbf6fea419 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b65ccd046990822d6772afd1d8c66c27f4806dec7d08303a644accad8e7d8fb0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff6db2202804e162c605cb70e3fc1670573706da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2cc40dd81d3dcddf7c9999bd401d686fa9c77918d500dbb53de7d2af859908 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..782d4b453262de9f6824a1ab85d51be81c9e5ab7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b711607cb02f3673887183cd35b21e5eca1b95734da908685954480beadc0d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f436f5dcdb17aa9937906a9b627a55cdc5e3f8db --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5782f12ad528801929ab48f0590c651ad2804d13fbe4c7e781a03554b568f35a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d510c168aa8e9908f92b2ab957637ec64f3f46c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd462035eaf9824122d4d6d97e6eafa351fd828ebd2caa2b77afb8143860f46 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e69daa5a5160a4493a8bee8eb5c6096689feb916 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:440474cef91f96e7659fb59f0a6ca623b6b4321264ba09ad1e69ff0a2e6c184f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3781adb4fe4eb6a09755a06460153b58821420 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85dcab8dfd15ac3b2ef926384f7a6a287933f33500d0ed35220ffa7d4df88bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..160bb82c61fee2af99f2e8c32760c5c14957a830 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd8eaf6e4546eca031039c654f3f29244f58d0b124785f2f0df1930333d09b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..23be2792540692f7f5d6c779b38c273e6c65f4c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d02de1c32a6aa3346ad2c95421275bec56ee75e97b5dc3ed3679734522bbcd8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ce59c79adf09178cccfffc8d1ed838e7c4d339b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ecb087ed9838daf34b5a287ae7c80d83d18ab3e416769146234e2eb4d25aae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe3fb825d00487be9c043b94a28ee0044d399bd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ee6d55e964301d4a148b5e029659d38661514dd1ee6a40c1609bbe5b63110b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50fd7ce59fb97ca6b43dc3b340d1aa35c46eae3d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:824e5a0e8b380f3c8a7963a99014f5a1a8a585af03b51bab1b9cee2a3189f947 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d71a9d8be3286450ea72034d16c4f0ffb9fc7c0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a50ffb18f42d595f0aeb781898054564a7f1c64bb7e6768fdc9d33546716587 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0959a252b6df098f477cce12352de081b44249 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d26db3e8a0b4ed79fa01c9f95b1b08311b947105393a14dfeaddf28d0af17430 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..afcb7ddd5cf5e9a1f1958da3874a88513e583aed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ddf1cd289f53cfcb198e5dff61296a48d7591fa996a3084952924db5bf0141 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1286f9baade9452f3f32ddb9bec0ed80c7437a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15085699f4302937f7e8d5202cd4ebc36f3b2946c8c2967e1475e8eb86d8d83 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce9f99ed6dc9b920d71a876267286aa7bab08a0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4108e8e6fd6fd5265a53c533ca28ca0b5afe77ae45ff43962c75af1c3043e183 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..856ecbe50b662ef55b2469433ad7755d78cff7d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b0162ea9e44d55a99260cc30e4f2850c8cd7c498c33a4ef8ae0518f81f0709f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..008d98f8b2e0729abcbcc62d26109ead1a9caa02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc1d2e6088410b7391439a58667c6db50f0058c2a7f08b52c2e8876d31440e2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78ed1541229571015e7b2e44d73e3efbca97bc5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c66600ee817182577b3fd165ae64389a1345117f0855a77279f2c26b891a3510 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c6ceeeb051ba2119d4f0d8fbebe61d952e9b58 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7c1c20413ee7fff732f5c9b148612f530f9af0e7e364b772d5f0b6be5438e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47998820d363a2ad02da9a409d28c1c92d02ae27 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:351967956d9a4dea694ad69dd5af427ce5e530bc3c601e81fe8373e25034814d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c58e9e980254357a77f909af6375e7feba429222 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42629aa2fa50304fdd0a90e5ace599a7188ce886ec8ca256029e83a773068bfd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..173789272456f6806991e81f42c84dc4a660319c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11a57cc8be5e6a80fe7b63faaf88fb6dc1f6fbae48ed0888b6058ea65617456a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d575791731ecbd87cfbe77deb66bd3a5e9286920 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92254ec3a38a08eee2a9edffda4b462b33b699903371d249660af85ad1b5eaf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c449c733dbbc62c681b53f56aa0ca2108d4d6a89 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e90ffce916f793216d3c5f2c00c8ef958b9d5c5890300f6a8831dcfd52be4de3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a859cc5a18c4e64d848a773f0760e95301b0d0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86baf93b55326286a0da0dfc60f6066811050e38622eccb080628a707008e04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc9a6f13e872ea512cf815856fac7a979fbe2a91 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:245bda25e99da75256d9c4f815590237951744a4311e134fad92bcd16a37b3e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b469a0a1589ea43e9293e92780a7c9c37cf9c23c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9534e530eeb4443e86b0ec240fd13fb61e39119c61b6ef4d586ba9d222c7962 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bf09a567ffdd58146b3289002e0cfa781284538 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e92e147af05f29cbd66adcfc79e90ed65ad4e16fd2fad73f6bc1a182917ecc8a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe9f3d0d9b6f0de14351a85bbfe3628ea9bba621 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2965a2e68e832d9e1d51fcfee58905d3d42ba3077d90154dce34bb1b04b6aee7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c36138e323a138056bc5fb6673139e355f56adbc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e9c309c62296d6bc3cf45e53990b0157caf0422bdbb2cef49414b5b6d8ed91 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71e3f7b519ef6b6c1cec753c76cf66efe9227509 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:731f5a93c6b74babd5bf7b08dec50ceed40440f92f045f476ceb7d9eb5d925e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b140ae4a50823b771a77e3ef4bf2c0563c29546 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921d373cd2edfc5f815a49151c367b23da8e7c89b76462e74104901bea8da554 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a50b61dd63a66f78f65a6d328bf669fbae474cc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8327466ef2f8eaed9be6ecadcb7edb03fad3a9d7c82052a850355ddf06f336d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c60b52ae590138b9dd9d6dd9aead21293388e173 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ff7689f8bddbc10f57601a4a33d0ab44b7b2b9f129ef76bced1b9a8d1f5314 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2661c7069e5baeff67d9a7bb742087562430b948 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf4fbb1ccaa38ca41b538350c872d8617354d7c0142d3a56f96f595494a244f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..025ea80fa2f7596fefc53c4989007c0c0ba2e606 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603aee2bde425a9dd0bbe4db91c44d40a153f765ab54f818fef19cfbdaa5c3dd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a300da7591fe337e927f66753b970f21ae3dc2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12564c015b4b536958b0a4c4b514b1128225630fabf003b0e1c04bfbf1bb9c3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aca0932a52606f208003a6c603e0182d2bae07a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef8654036a7a032c756b1f07ce2d36538a46e2cac30abe8ee844e4fe821465c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a7ad3a2e78c7046ae12a414de9fbbb3000ca5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a21f28ea80efe0dcd6d44c125785ff98e8f2a2104e0d8867b6a26567c8278d7f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e6352c13eed0ce27f86824315116fc235b0fe4e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cd03281bd733c976d82b0ce2ac8c36152dc3126887bed5eac7d06502bbe9903 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35d6b2560af811ee38b321e0015b134a6342653e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c7e6f74bde863c4361b88fe179c8e44dd5ad4dc68826a826cb01070d7cbaaa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6993805e98f75ff8515907926c835e936916c528 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb3799e9e5c0119f00ac0efd2f8c91d0dcfa6a63599cdf1a91c0d36e1d11190 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4d69f945dcd317d5340ff2ca0117c5221c2827 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d51be50a6814e539fb78a2260fa71c8aed32a19a10b30c1442d624ff11ce546d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..013109e499c71ff02fd0b9e38800541fda5816b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd2b8d278225ed486ee8041e729d5504b37e67f4734d44559886048550f8953 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d4ba2c81b3e5d6aa1f8662dd9abd51c65e16e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea19087f3d71dbd6a915c544104a486376c986c62b4c207d8e4d9310a0524efb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb0287d0402dbf16a6940314aaff73c14b8a2914 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57b9f744c05bb0b6f8908bd79130168b8a5a3ac5b6ed5b519d7edeb572834237 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..863813ab75b3af9f708ea3b7f39e91510c919642 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ebd5579d79ab5aa7d14474c750a04f0a345a33c8eb7dc771f3ff1301003450 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56fc181b8909621ed4a9d60af4cf16d775b925e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3563e79d44d7325c11a204bd4e66ae585dd461bc8cc17a9d3f5ba2939be701b1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaf7fadff6273dccd81a2b833e6381060969117b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e1dd54eaf8521663f05ba926f99f686c2e77111cb9b7c1022c7e38ff696ad7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e5793ae8d4a772edcd135543a6befd789a513e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a69f5ef254b779285ce84c3eaf247a24d084fc9f8e92912161c97ec9cda71555 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb4d844e78b55a084a2b8d5c8976786ccbad1c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:919fb48b4f6ffc92689a25b4390de17669a72e111fe51d0fcdbddb0c12a9d10e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..537e967576d83f618b69243695ac821f6ad4e712 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d84f6c629767d471005dd6c1bac5ba35c984e482a2e692a907bee521a564d44 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c33cdad151ce2a411e4e9919283186b9970cd1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458cfaa1d04abaced3f846bf8c064870f67767f24a59cf4a7f900abedac35678 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8318c4412b135b90e1dc72103bd0ff84aa0ef15c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f7b1ab8d22f2002bdb98cd93dc0cd3571a11f8c8db441c23f01f95f41638483 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c96a398c6a15d14f1fa47b294105be91192cafc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a870cca6c368eb961f52924c148a9cc445cd65add22f7c7348de378dbaaa7d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d08a2d10f7a0d6a2292f053d113a7cb7c4fa5990 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d02533759fbd2d280cbd1d15d76c471f85de1a9032befa249586dbd070e3543 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85c0bfd94795a7bcdfca29424703a539a97c7e46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a505610757ad59c29817bffba0e2a4e2bd5d9596a974d517f795b299aa6c718 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd172be0afd5f2654e0a0d8efbaaad04df63ce5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2857526596f1476e7dd90bf0a325b4ea37d17ab0da2f37b24fd81d940bec6d7e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7adf72f60902ef66b612b1d793d553f78d654bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46bbce0c3fe203b6535c044be68cd9905f30e0bff084f687e3fb157ba264f574 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f47a5ef90ba1fd934a160856a18ac8ec0fd33f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4933245d0c14133ff5452bc68acfa5176be2c0c22750c70b47f09da07fcf080 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d2da7513beeaa89e29915ad2c7f2c0629370daf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f67a4dde3571038a30a1b5685ba8881d428fcf755c2ffa7715dbc5662570777b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12b3e95c1370244ff73d3b7ae99460fa75003cfe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f716d502b0326c213da84427c4338066a978712b362ca8a7d3016ffa28f92aa0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c623ce3e285c04ef3336d740c483f27054fb1035 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e803ffe9b11116820582efc8d29c13c79be9a3d7e2ec050cbb8b0e7aaa335c3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..202eb150a66c34aec13d674c688cda230567074b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5154f27b04093651520fd018ba367ee8aaec5b2fd622caea474c81ae42a8326 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2179d01e4391bf833035f22e686217bc333d497 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df71f755a62c4090f71873e493cf8dfcbf2fa4d0166eeb55ee5d1bc5c804b208 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e03fb000f433ce6a5105b3b818cc9abe55f23f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8c2415bba5483a865dfd13ba286331bfe4fa7af7928da7987879e935c11eac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3ccbbebf18d5d80ff6d7685c3481faa56799ec4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d3ce1f7eee1cf8b015f28c6b3df5e043293e7343e56af4fc34f889f375eaa6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f5719b7706546c124ed8e4409bce55b6c195fcd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953e47b73f1348e856d8a6f7fabc1d637d10e05fef83c9b7bd8cb233aaf80dd2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa5d824385ab7fe44b6be446f4185a2c6f4089e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8633780ba7bd5dad86f53e1cc3cb86169c72bca9c0d9dd0a417678f43d13167 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ea4450c79c9b0c169f31d8953d4bd58c98d2d8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ae00be10fed2741e411d31c320797f3722e796aa2ca8fb2fbc1b52bc6ca32e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9e89e80c75891f159fda0cf4662c2a42ecfbe5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0a6a2eed5e6ee556f315a6fde7113da62619503cab98d778409481bc75b5e2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..331b13c28135498734c8b4077f3f76af36434d72 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:616d4c6a8c556f1b7d95b893a2239577d6b53e20b1c84214f0ee7423e5b1e786 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a95edf3c426a65476b1a46ebf44989950719592a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44905dee3db9106282ac4c7c10becc1614340f0072291496dacb7dbed9cdc5be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcfaaa15271b5ff72b4181a5d0d307a76659f9dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9485fb19e8d197dcb93192284f452ec0d7f7a7a2f3ea790669a026824bf08f2b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1472c48eb934f91461671c2bbbb14f95097fb87 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5215c01c6df3bc029a127900e2c479e3789610da0dbfda3eec3fa84a7660cd16 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1f0f21d4e2d3bceab3a6ff174cfc8955682535 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9648e0d4ed740872fb491ff7c26b0acf7a6eaa155325a8a672d1f36cf25278af +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2731d31348ce507a93830ebbbacabba3c8ad59 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1f28a9a0221b09ea344f0c5dd9aa07c1ed61c3325e7cf548019591d4f7379c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90e5467897e7c067dbdafb9b1e3b098a271b8684 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19324b51dcd7d5fd577fe3de1a32fbeae715be72bcbf8a6507a3b26ae400c4ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5eca95dc8accb761f5e71803de62e1e1a3603c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24152c03e5ffae9f97ed7c2fdd7d6d4b0ebe70f906b6e1280865b8a3cc0787ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6928c33db9a6898fce57be2e9423f65ebf7c4744 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a22d5c012a20566c7fd4d92c26b93c610bceb45a1b7f8c5f1cac04243a048b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d40dbebe5a97bb05b4f2be07be1e7c31dadecd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33abc562e7e53d78a73f8d8d9ac2764b218f9a83146abdca02d158edb8556884 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad00b6517cff4898e2dd203d62f98c527591e333 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1add63a6bf1afe4adb2946e872ec5484d4ee839e192b1549e26661bc3c15decc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..584a92bcf74bc3f902b1202cf3c4d158568ecd54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b561e20d4133d395602d2750d65d47802ec5ac1c522851c5ea79517f61e100aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..646551549ccb2a5aefb9bc7d0d3f002777adbd6a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbc1987b6e5e4e22764d1b4946170e7cea89752858eaca3f1d651035558b54bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d29bd525556d955e35388cfeda6aef92a569e224 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8c344e37ba3a366ee3b07d65fdd33738362a2dcc563285be5282035f6a61bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19396a5fa18e0e767c206db541fa72a2ee84879 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dae08ed6904003676f692f3f8c5ba150bd5f614afbbabd6370bf3a5fe3f9120 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aefd66becd2d3a2c9239c0ab94474e24ab81b681 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4295129b70a818b3cc7f2e0790ce04f18962982a6b1d7a41ad2072b96a7d508c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77281c7bc97bf1afaacacd0967919fc1c88e36a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b441cdd84ce56cd2b25d9b3608c320bb31796690c214e693244567d920531c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf1d7f0aa04eba51a73954752aad54c14357bafe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa125f07d0a1e463a4d5f05ac47726b295aeebf658fa5ce29efa3aa58ad41d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56c079be6d8c00198fd4263ab7d9e41329b2683 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6e205889ed4c6e56754a5e1e7e3f413ecff664dcb2108a79a9ebc6ba4954829 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f3bc47e87b472ed91ece0f4329b40fd290e338b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0eb349c98fe50676eca9b1de219438f6d29704141f726b626df7e94cc26fe8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0688898459e25f6807553612ea073c29898ef8b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:573800657cc181b98512fb16360fbb5f628dfe24489671f2fecd26298d85c9e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..230e954e5cdba88c952e1215753d13db0a46af88 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830ffa44c3061b4ef50abafcf6a3f8efa94e526d5350c3579843e6ff5b05c65a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffe6314e8d5278f5f8ca80854b91bec7ea28e769 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9c32b30ec5f94732299e952ffb14bdd4ef3d2159aed55ee1e9fa0e7eab9a51 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c620deda4cb4af464c292eabd88dec7ef3d937ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb601119a31d44a1a3bc37183bed5dee93c4827d3dd57081ab983a2854d0ca2b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20c1a982192d25e68bee6017230fcb01dc0e37f4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4466acc462e69684d6d64463b9a8f3ceb1b08537715a446e65f11cfc3106c548 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6b1af73d31a6fb998f1eb9a0a5bfd5af77e5c0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aecda3f82d55e6efdb6dc84dfb0121feec635ec03dbce83f924c0d9ca1c6950 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..998b2f58da200b5c0e910ab61d6ad819e9c962df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ad7d57ec35f8d0d8a4037bd127421cd67d188f145e5a1ca3ece2b6eae23616 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79693f507963554ac3c884ae5057873b625b299e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63636147734e251d2f5b8b64d2722a9c5e2134a44dc14bcf318f304daad73b0f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..311ae3dd4ac61f497f307965faf6e09a401b0d0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3602b05a4edcf0a7b913d8f82e0819edcf91ef62453cf218fc9fc14d2c365755 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d01d98a03f4e1ed498fd55e7ef60a36fddb90928 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6f51405e5ce52cf799ad01d659ab7bd29582f1f6fa3e90cff40faba216d985 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8774ca87fa0b5f9f97b9e250840c8725c20b5a0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9358f1e06dcf4824ea8b14b7d9cb8208787653ca2713ee94c4f6a2141419368 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bde199f019b83f837be4d43936acbcbee76cde3b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aaa0118489d73ba7dc90ac15b0bb68ee514c02b587345c024223808a7769c31 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aeab4154fcec23842b2e114bac7246132920085 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792baf1a0fd7847681cbc05461a5fed7306d77e9c8737e3ed3af58123d65df13 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa6c365cede51427d0e469acc992014ab4801111 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a364dc0a720fd09448bc30d3e57ec1ddc4b8ec365f2f4bdf8c3ef42947a8b5a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a50d507186b12c065331ef42eca6aa396f34305e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ffa4dc12975976cde084880b23045cfd3dfd8da6f86b7930a9e69676e281c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c9c29d521a23bedccb6918ecfec346ed182dc8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2245952c011ca550abe55600b0b8b2a497bcaf25c53042cc16d608a6332ac4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71838ce83ac21483f630c35c7f61cb770e18fb1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916c9db61a4eee75466f197b3cce11c47a8db50b11153e750a311944e61cb33d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b8370d5c841567d43523f3eb5f094b32142942 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a508a7a746068ea1bc6e79446dedacab4d3902d64133fa93bd9bd7089472dbe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eabaf48ed78460be1e76ccf2ecf61395353cc8f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c93490a32468a452da3f0141bd1b8f9621052be3214d86a293cc1af30acea98 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79ff3797710f3e44c1f47f2df3d4ec6aebe168e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2096b6499143a8c4eff9b43f158e6e5e88836cfe81035ae546d00e3757519e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1d65db7fbfb37a4e9276da596c4adc7880c8bda --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400093f1f6224289d1b4eeef11b853b7ada076241ac1a803eff971ef9f6b15ce +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..63b8ce64faf6e95619e4f4c74eb0603bfb860c2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8acc144fc4ec5edec0ce4cf2f20491241bffe3b2450b4404f980d83e96dcf3c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ac706272b226e34f55f3937f6494f998b2e699a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7bf878d2f97ad3d0d5624b47c7bb3abef991e3b36ee2ba3331cc511cc81091 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d099fccb086910a94a46d26bdbc84a7f9881556a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e90b39ed94ad062597b6a57b57e1c4e902c68de3b0217d08e585e651f1530ab9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23b505e2c71ace507a5f49c4efb5a125aae539ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a459c83cbd020395749999407c44082595a1c06ad2d90a0d5ec207c0b54f8a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48014bdada572df4ed554b583466b58f84e909fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:566b29d0907b93946258273b292fc80a1633885078ce8d9b304a7aa849794f84 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..887753360a33e6aff2ed3b4cc47b98fd7ae49073 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bf108bfc9d8bc7d67d582e76c61ec31d2fbbe74eb35631fa967175f984544ae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e26ba0d3a47bc6dd3c40a416d1ca9f8142a02b8a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c085f8182ff35c36030ab6e453445629c7fc5355eaad46c67470aee5a56b097 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..337765688e5916994ca338e34270f4fe96924fe6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed418a61f0e16a62d64e85984c49a0e89032384b2a2fd4759dee723b11f28e72 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5596d0a0dd88a74379aede4640b7ec66ab344816 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96807be795c37540210f0f9e556271da2b04b45a4a664e24efa0a2dbb5499e05 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90c9e9b75991cea4bae2a713d0e4927c41b3b382 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70261e29d6dbd4f5a1854d38c6a7325cfe61734a6209fdabdff6c6e7b5609ab3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbd93f260c74a04101ac585de0a0588e527d157 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5de096b4066213eb371e882c70c3a052f57a3ee6ebee4ea5e01bd47f7d79e6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da90013671493176be194d38f25d7ec43eae3ba8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3b9177e973b6408e58c7f18b37e9fe46bdb9ae1ebbfc97e595c083af94b33d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9965a80b66edd956b0293e3b519b5311deb2e01a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6555922034b398922bd80828d85157c34d91aa4f1132bea458cc148e57bef1f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b506a8067e32a2bc595fabd1ed6361cc4323ced1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:331a53f6625f64975eedcfac579234dc48d6e07f4921cc546883613da9ceaf69 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e1aa1dec663a38beda248bd3d6420197604e5b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080ef07dd4b82a5058087d46988464efae32c4d76192e528dfa0f0761483d023 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6ad3d1107a1a0c96417401f1947eef1d4ded103 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac442e5b01433e1e04de16c51f6f96d7609cb3ff5e4815d727b08ce96e7dbfe7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb86a94b1b2320a3f9a4264f5d3a4e68e939cfa5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0510a3367c1a04a66a5a5a00ca7a42b5d36d8559d2e364670120ae9e9f11b63b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5dbb3c1f183b017aa7d88460d0ac1e70ca127c5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac2d630f0afb279032e95f385ad573088d6acc23c79cc865890b2a6cea8b7c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..237f80562066571125e8713f6560a452decdacff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9fb2d9556d5ad3e6f7f4873402d274b5ddeb3e16199f0c609eeaf037ad8b3e6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffda0555d8034d79f5ebfd40f8cffb2c112fbde8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ee7bccd4352d59aa74fb9e4f33a1d42d8e2fed9367c8d2be6c653ee6271723c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f908eb70d7ebfd2d49993e2b4d6640d52c56b6c9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89edf21a507f4e998e966249e53c8d65a1b0c87c479ae6a5633ad8854532b545 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5f5eb9e4e3b2977e57651c10b36a0fc34d39ba8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e31d44628198b74c36b591386a0ed8e90585b055cf93afaafbf9f0a65b8c90c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33a8c8855903a1e21b776553b563b4c3438295e8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc186e07e7256b962f3dbda7baf62a2ca26c50da0c9eecb551080c6abf83492 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf5a9a9413deb5f900f63a2aa9cf644abf00fe4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41159f33338fe7e21b37adfcfdd637743ea2549b854ea492250707a0bc3d410f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d48ebd48a91101d03aaf868092c5ad8667469d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665d5cfcd063f068d603e58914248885492e64e006d97bb19f7cb36b75adc73e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f19c7bf51619b99efc58a58e15f7952f3e9b480 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63030e8d58c3cd275e9d16a633ea6552e625556d8df78d3035c59ef7c32ccfe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14633e09841eeccae2977d9bf07ec473b2af18ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e8741c5e60a0ba08b5ed061f925f63af1a60aaf9cb8dd91c747e079925e658 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..479b643d42c2199e08df843b69b860d477d85f98 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac958bf2954f7e6b22c4a55961b4f3bff51d7462a6d8dfb26a631e4c04cd2210 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..504fd8cad5b46c7c5710cfafc27ac5352ff58142 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18bc79dd9149ca06a3f04d6c4c154106c04cc633bbd4ffb23c921a768b2fac9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fab8f68dbc6feaf415a7ea413c509b61beac7ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55460ca18f2e1f9dce8df8889027d924d3ed78013e7ca78bcabd28770e3322f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..812b04428d9aafd994566fdb2a9d20037307d6d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d29147a801f7f970b6490e798147001845b76de759fc9895bfa0064ebecfd670 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5df1b336657360d5a64fb929ff8df32a4b23359 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:911f2f07c99a0e501db46dab857eb2c38a707be924eb06b1c06cf3c09592d46f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eb8b183a9e3244efab40ab99aca7297325a91f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb77557055570845ac78296d8482a8a2654fa4b7f07b448550ea49ae94b313b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..957c3e459c94e4b061e9707347c3a5d73c078263 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89406548380a54ea8cb5d1f6fa7024af149afe4a8deaa81aed62b379fa912c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6642eacb8818505cc4415ba58265d6944def0ef --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c603c76f465f8a476ef122a083e121f68a079ac939eea6886cfd24b9101f6d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..617803e643ff5b8e8566b1fa1b203150a36054b7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14ddbbcb4ede2994727ac0f0dbeec8984191473e13d95e483a5a28b302f72175 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7460e4dbbc1c42b781f8cbc596b3e503d86fc9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d981d7ac996a47ea17e2acdb92057de71ed6a1d16d57b14cf88dc3acb34dd177 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a478a013776aed3c34000426b3d96f3ca72bd94 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:383b00f14beb05b45008558f5bd010b21c443ea67a6d4197ccc86c78a2764d77 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6dd6d09d78340a8652bd60582b5898ca2d53b31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b521036a377e1a4bbdcec8cdf0817a7513f6ea6c4fb3b417d1f585f90af493 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d336ea5994d8f91681939853488cecfd0a3e6999 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8250efa8459378e0ca746783283a7993b646ef52d65b39eac635017a3e500d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae0cb487ef14d4e83203a2ce97efba4f586a4929 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c53c4e93ab1760ef74af20f0615f8176567682347e949ced6a2b2a8c7d089ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcd21c125a43a50ffd420aa2104980b598d7c286 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793d6a29c10bbb7fe10351977bfeb7ae3b52fc98673c5706f5b7cede236cfdd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8c04ba292b8fb999334108c42a3215ee3d2207c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63ef2cfb4e8d40708aedd8fa9dfbfd524f75cd56c794fe2bedf24682de3a8f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92b4886c9f7aaa14c0b8c0104268f9dbd50b9b87 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31b5aecd2a3413bd986c298e515dddb83dc997640f4285adf382dfb58c9d75d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9828eab582634f29b214c1cdc60c022f4020e3f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a89b7c9ac89394cc3e50e885ade13c507c9c728f726bab8708b6e908f14c1152 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6109677bf8dd8d78e43a48455bcdd4f5dc8c271 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cb62c6fcb8bb09ade87f02849d8eedac36eae263e414fd809d0bcfe1cc6db60 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..50c006876b3d41e6b87f6516e9e477a1ff2baa5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9520fafe51686e808277a851ac3fe4afdc96d64945f38ad6398a74124b4956f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..044c0ea56c5127c9fe74199b169548800c55ccbc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6d02711e16ae481e6f4a11c38589d9daf7798076d2a01bf25b170338fa9eb6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bc04cc5a9858b1606394b3f50259145f03b8576 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4774db02342161c09d8bf6081482484ffb6cd8e1e189409ee64c8350820b6816 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..24f46fc429fb3d22f1ab0e95693583706907daed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d40ae1ed3dc21e2e7ad00fd44ef5f849a2648c442054b6b5640266395ae4070 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc708dcd2772a850bd5554316b36b65b9b5a2950 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:055bcdf1fb8842a0f1f35a659a8f4168f3e8cb2a2fd848f2284e0dd622b56447 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fe7dce935c83bbd5b6213f58be93c6010624971 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b684457cb9ef687da6cf51133198839a41da7d51bb0ac56c964244a6d55d74b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb3d69f2b08133a3a4ee216e63ad5878f9aa81a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da74aebb923d9aafe2fa0f942f4ca4a48e3b4978094b51779810a46ea7c6397e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83590083e6df21cb7d739e7eb451c62ed80b0f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa685f224b89dc3779774b611f416e65a523fd474c5334dace842c460f80c487 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d964b9d81e16727a6ed21eabc71ea11574a0503 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc553cd897bf353e5d51c50476eb94a2e04d25bde41b32752c31f5df9b20a72 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b78c16c502a3cd171a3c6d326efb0f385dd59386 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241c77f58d73a12baa60d5a2166ad75dbfac9a46bc8b4e55dc5cad1d5fc49ca1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a143a443ff43280db52c0db7a67b8209f163c5c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2a1dadffc63cd0d75c61665c3b38b23bca4102a3f4c60234ea7f43bdcbf16a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e64a386334bd8676537d30f5d25a3fa846b96ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361fbeff1b4bc99aeafeffa007bae674b156a32dc87aaa474123bbeb0821cc88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e32e8d5228b9340babea6161252e711e0599012c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0bdc0f54bf74e34495b1f124269413c68dfc14ce966dd027d05858db73b5cf5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7451497e5e7e451dd8c165bb37f6e384cc70a7d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34af6a3751236367bcd8fe6135fadd5a6b63347c1d62604d5bc556fc1148a88d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea7298610c2a6a3baa0eb40961e8c65fce436184 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98916f6f0a2a5ab7cbe459b4108562c814b07fe183de91c3a2491c80eda2f609 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04565d0602c7d3276e77737ca33848f858376f32 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1963cd0893f76df5eb28b311ee7f05dce415c970437bd531dd7c0f97112626b4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03480e8a1ae77db90d641ec44974c90e7e9cc78a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c570f0f3ee8843812d9d0407d48a063bc344f5933c0dc707e231f1f404ba421 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ea5ba27dee0c089d8d3c86b3222cb76805c1d77 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c6e07c3c75533f32119fe7aed7fcd7887d38f31153aba61eb2132d5dc63038 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db2a24072a6df5ca8ecf9983bbcb962f760cb6bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6dc070751c8537de9d54f790853264a8b031af8f6872c8603317a9e83f42efb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..58af0db234e852b0d0bfb3b840a27d77dee22656 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a6255d9587870dd750d9fe0e7be4c8c99845565bc0346352e3c2d18ab84ad7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..726d295f0349743dbe0eb746955738f78f9b21ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5019aaf0e1aa36a9bef28e45c5ab8477a5c1a691d6c2ee47ed194437fc33d14 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c88ac6f5c384ef33b80861a2fc5a13b4962c45 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d21ff274aab778ce2a8a0ef3f7753e803a7c17556366dfa066bd773bbaa1a33b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92bcfd18a881659a9ed1fc35021b55ae3faf45c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4ad8abd957098031ab42667d87a11428b863d4ba4d09b7bc0ad0800a22ee345 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00fb2bf440d533105d9dd954f6639162223a047d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73681c7e8000dcf20f543285ba05ec00aa8e87fbb39bbf057d8757921f3d7d59 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..034a666709d4006cd7b0b598d8e6189a09af0983 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c8619b3d05195cd79d2dcc3fc0a9ae56edad9554922d12cfb44f3c93bce67ba +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4ddbef02fd09dd513aef055b00cf6683751956a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263591c78c9a0afc8eb6abead898fb7168d0a074454353940781940c91decfc3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9da70e613e82c1863a1b290c332359c0b26666 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9dfe066f757d624cd329e5f13f9b5cadab30907c461ad16597ad5ef28e5f76b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e2da1df4477db23e3d17090979e43452d5b3fb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aeb8723167c2157447e56013868e3d3c5e63a5fd8058932e01518f16ad1c1b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c69af98f3414a35e90ac8deed73c86f1af5ee329 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c60b68a04ae6669b9c62c1d42d40ca94d2ad02826cfe551e5597978a944c40 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..116d98c00da1c6e359f144e424d1c397a452b2d5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1efacb0727d88cc2e9359264575a5e2b4bdbe964b09c364f798184e85b277a58 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c9b84dbe8436fed4ba883a0a5672f93579bb2e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd8e5768a2e092dac41659bb31671180682bfa618377903a04f39e21cf89013 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6c5f3d3827a435b5bbfffc215f6596e471432cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf71f4c563a0649baf5b045d73a05dc47d806d1739f198775b851eab2ccaee70 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f469db9e82d9f057342e79527bc8c04b07dedd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd22795c1b8c4fe5745d40019a80cd7b450be20363126d573bdbe1cd5a01de8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4326d6b29abe7a104f67c02612ef95838fed3898 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e18392e87c1353d7768b6799ee9fff3f1c03d63539f39b5b95833c6d04c78c43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbf759dfe57aaf560b22ecd2c46b192b83a9cb2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e05023d1fd97ca3fcc2a0aae133d7c43320f5b2f5a2bc0982c8f4296ba3439d3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d209137da7274ee2f55194566bff608bf422a185 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ccfcd2db7781301650384e4c20a847f0b6fe8e89d07a7f8abb0e6d562ba2d4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..193a25137cf4c36a0c376809a1b2b6dde30c69e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025ef8a405144eda76973f3a17161e5710f2cd2911480b3be62d36f40a38ddef +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e9c77221802fb1ec1b3b5758b13ae7d02469c69 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cf74c664dca0a79ff77ecb5420d9426874bb2c42f1f6238fa95c0fa5fb44388 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9587545954e0099f567679c98385786f526700bd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23d5a5e26b359d6df143bd4aea26f62b49eec7ab5e2382d719efeccceb86d73 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a4afe4b72f8bec70be91128a50e4d6a3f4101a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d6df7fce99216f7e8eee38031f8b796793845f603dd1fce78eb67adb926679a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..912562ce248bb11ae301ce640e39103d662b1025 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4581b9caab9218408a058f01408dd5867e4a36c7d36420d1d4f8101c7fd281 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddaf4fe8fe976fb2908df6fdd19aafebfe0758e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac304b991635232e44e7c13113bec6af63cc035862699bc23267d623b860ff4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32da1230bf7485055be49c85ae3898cb59cc7e78 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e52fee9350ff01632d3247585144508aadee17d2e690bf8a2ce954e6a7490fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1844f485aaba2e28775a469a6ccbb529c81f6c02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c9687212d62c7f93d318ff1d0f4704af0703267d0670314f459fa396460d02 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce90413e52afae73085e6cc83ed28577459e287 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045482c25aa41e9cc7036476f24c07df2b415e40328ee146ca4a459cd77c0ed0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3edcd8ee2177e542f12b85a17006202e37cf21d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca7d2e383ba75c2e0a55fa268347f42ee220779159f1e8e3abf03fa00545e6d9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..575d0fa9438d98bd92a1963c56ed255c5d5c385a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db7847724068d9dcf2dcc48ad39468d0992ecdab2a80acb31c34131520d69e8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..488ab9f140213c792cf23b67529b4a02f338e5bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eca90a20d739b9859d5d7d05131fd2c440359fb0570cba8c0a825c62af6eadb2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..028e4c8d10f70665e1b8a734728f85531c650a5e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80408b3fd655e95680c63ec2b23a172c491d3eef80b3ae8e63f3e08291f69339 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28555311d8eca15adcaeaaa3f0eb39e742229774 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87d57f65fcb0b9f9e4b4b98da5eab939bb4317bda7fdb5d2de77fba88d33a32d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e710fb5c59447412ee1bf5cca1537735bb4982c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d4c5b8e177ec9d004484015e3bd6803c474da9843e2d1329d5aadc95bb5de5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45b60d0f9ea7870da5776676338d234523ecece3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23319e89d80c4159af37a49dbdfa87b63e3eb92ed16c5c0dbd1bbf5a1872c019 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da0b6998b4617c96199336f6ffec1d1b053ad76b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d4b087947dd89c365639f6b08a4cb190eca2992c1cbaa645323bd087d41c77b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c9a0714a9304e77dbe7a3c199b275f99c99c0fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de536d02e9397387718512b4443e5613273b2873a75545b09ce68c1317d831e1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5c3bc97e2c9c01a41a5c0a47e0cb11746602a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4746c4fb9cce4e425b68fcba25d5d4cacd993b56c28b8374785265cba8e2686d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76f0e4fa3122ff54a2e8a0c5cbeaefe2e87f1acf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa725ce4ad8dc7cd9778a186bb42536cc238ce1de218cc92786e7adac9109132 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a654f6394b89132d27c2e1af4f08ad01d613fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad4e9510670e53b5ee9cb07f2d1a94eac3db4a31179addc2dedcc5e1eb9d359 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57199158164158d4a209665529d8834be3194291 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48527e6f1f6277b23f64bc47ba684fbec7a46cd937fa2d62e99df606ad0de2b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3eaa8853509c6821d9d753a8a6c6a2820b8fb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:684e3720bd564c0c131c1a5dc5ecfced0f53b00e4885cd7325d4fd92801ed532 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..858239954d214cc2b5a5decb025701c0844627b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b89a319e930744e260823007fb7d18b965cf984e4374076abbe03bdf9fa265b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5072998165b27b06edec1d02a44721540458fd7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b276435c324d9719dab269230955581d21a4731113c43cf759ebba0343e085a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2316d63e53bb4a93a807a71842b8a11955ba8a0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf4d8ac145a1c4846270b5f1db15f7e65fd2c2fc0123c7d29f66725cc1110eb9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc38deaa3030048307d986ec375a8f352ff5f9dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b91013ce11c003dd5adff98db88edc1789ea583be042e62376495f28f870689d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..560a053c437102675dc5056475fe565db0487104 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8525e97ade7fddafad5eafdcace2363f7afc16dc20e77e1aacdabef92695ea2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5215f42ca283d8ee940d51876010d3a733625b42 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7d7dfe6bf58e1d49d7cb3a8dd8000d146a09c1929413b6bf2d4a039dc9b16ab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb0826c686ad7b6f844e41cde3f803750ce6a465 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec8f6ec1a2b9726053074d2d531b210af505185cfc96655e15e8a8587af4725 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc0a869ca2a52946a6128a3ec264d435817c9e56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5b04bb16dc3fb38bcd4e7f2dff785cba115d92e70b45e5af1c434f957e31c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f53e68785b57a2fca0d63e1f2b70aa39734027c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b1836d53bc676142b71d7e1cd1f0836d7c0882cf0bfeacebe5798921b6568ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86ae222729e39c28e351fbc20ec9d268931fca80 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790ed2524595ccc208be2eb47af232b2ae42a93c0787e500023f3d4b1f521371 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12401bd5a6b4ba00f7909f8af358f82ea14ba63b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd1b4bdf7933abd3001430324d8839e8d35f21ef007141984e3825b9a587eb5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..517ba87ce8153f9bfb797561fbeeaae9321a2010 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7a40a3b15d906c43fc89104cf93a4f66b850d77574a6cf1577535c2d00a6f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e8877e91fdc5da771a277a16ad4cc4a6b34cb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85389183a5a3877e8ccaf22708be06ddb671510b2c73f2a72540eb808510a26e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b00b991f5df358c8a407d00b8de618ee560973 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c5a8d26932c314b3832a5ea9d57aa203fbc00132a0d1c2879521b414130b75 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ff2c9e840bb585830a7c02be823a871fddd498b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f86a99f5e41caaffd69b3eaef89b1253163f09d98cb417f150c92ca05a08de +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e95388ab6a97c03f1205a37d6d03ca68543613b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:154457e9c60211002193ed8bbc19c7056e86ad2b2922ade1b11bdefa67957627 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74c99b00e98c903a498fdcc85bea9187f57cc471 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c1841775a2030472fcd959454cfacfc2d11308dcd272aba2e09a9f5f0463c50 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d474e493ad037b86f2e4e081e3b389f708f6736f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a05ea9fea3802af0e59246bffcfba652945638e5865d3b6b74d82e3ea8cb15c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28f817ec4772eb3a38e09a1a7588c8483c516735 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cfb7b3deaba489cd00dd45ae8fb0d6312522df31def204acfcab8ebf7442c93 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..761bcb7aa5b48b9a70ab247f8c5b2da543911d8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a09a71635d279dbe28b12df9fe093056bcb8ba8aa9cb2f013b3d436af3ca9fdf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..426208f682f305699c01d0da52bec19d7a120c70 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6002b93c78fbd24b56881d66fc2f203ee5de17aaeeb98f73d99afb25052da77 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e735766e318cd10c87d0a92119785d5e94ef9eb6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4c79c5dd25d069d5e9f0c316da794dd687a9c812bbde6979460961e3d08881 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e692920208892f8692783280594f6a3e7c8365b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:022c45fe00d69f1283c59f7379c68f617866acbb2d0d9da9d8e1043dcfb0f454 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4d4da6265bc079c3603236124ea6e537469070 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8ef5d7ff27e86f47584206f48ef4ecb85c04125d3ef06d9bebd5ca9ec2a4b4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a5e5ed26ecf5e6e6ad80e78c4bcfd5a3a2077d3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a45c17f54881411ce0c99d1b3e3009531ef5c974aba23bbb1e3cc9f51af8df09 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93f0048e5be9455c02a82af116f139602e31889e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482ce65777a5b2b5f80ef0b5c1ae27dfa0f2b1e2b14259b440b3dd1fd38e81ce +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e125fa9ad16323bffee52b62594491425e5ff5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c2e738e2b31c338ba08ae7d3af565dd933b9e1565c067c9282caff8b976d140 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..855f2c9ccf8b110ede57a65eb11098c11676b810 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b8102061aa9762b3a56f02fadbae860753e9f92feeb08564f53ca164977919 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11cb109a0875de66a703a71bfb7716114c0bcf79 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3200370ab42f22251f760f3801a6104e6b8a499254400441ad5ec584739de0af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd0039014148bd3471b1fb37cceefbafc225a9dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a520ef2afc013bdec73c5a6529c1c71f8092d7303837ca06b27125f133f6b8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c176d06fb8e40f55782a0269bcbef3ce60c2024 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf8b20cbfc62b3a5166e3fe65d3de04b3cc5d7d8e345b9270e804bcf75d2c53 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..156cf8b502c8dfaef41d6b060c94180d47ace27a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c2985d895da013af5114933c04584ae5bf22e6398fd12be882d7c95f791ced +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81fb59b1968280dc27337ef9ee0ab6a4293bbfb0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c2e181ee2b44bdaafb7339baf1b523a9a7e285e880aead7f41e44978136dbf4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45d39486f1e55ae58c47c0fe44c14d0aada68f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5e93c05039c90011e3c3c0f60cc6594cfc73520afd32f9e2aabbe0e307f801 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..515503507d3340fac114d91799559949523f20c5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9908fd6c6988305544857a9ca8cd5e3f6f61ed8afb8453fc316b37784cc66c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4b6601101aa4045973d4c7a595b11036d9d47d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc4f3771aadcd0966d017466b914a800e3fab487898f330cf9509655df1ce99 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02d500213e375bd1a09437deca7f6748717502c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf641da584e4ef75c9c0b88fb63b19aa0385229c0c6985e3d370ca6098624af2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7280cac6b5803e48f364011b3f7705686b573a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:626f85f0538a6f5d8bff15ab1c0942611c263535256b10c416dcaa4f6a94b38d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c35a3f9e117b9ad73c6b1b7b1a851203964ecd1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3917a1da9ea3856128dc1f6026d1566259ad363cee48bac067e6bb3e28481211 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d75bf4b1ed44dca85011ffbf8d39da552f83d78d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9adb6907b9030cebdb27f96e12eb875de8e17b9832bf68c6d880bec1eacc1b06 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78bec541ed318c4a27172d053dc2daf7c3d5854 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc9a0bdfe50ba56ed147ff873d0f55be4b0004fae02043b05d03bf1fff5d215 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..893e12451f6b83e124f7183323cb7c63bd6ac919 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe599ea78cae71b58eb51008a2ca7514323d3a3b490171c86c1e4320597cb039 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f993ace6542882a03c0a737ef1b335981a8e2f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28e5f062d51d0d2f22717192d8e4f295d8cb78065f2af4fc54d7eda82c031d02 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcc1421f0f9a83099c25a847d89b4348beb10723 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9591ff35c7cbda14755439fd5c966deb631d559478b17a94366174db03a0813a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3351d60479156631783cf9898b9329d14065283 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da2c7632fc98b4205a1971f721c3c398892f7a1359b686f496887048051699b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c8ebb19c5720739540255f89728d04977b3dfe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a228eeda4e2766b8d0ee3dda2cdac3d1f7ef11750a796e8b604448c3294d392a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3525670931d40e78407508c39c4af000fbe6519 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:487be3b5f7671a688a154d3107fd4579772ca035c5fa0f79c1fa711cc581dfbe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb328b21144fc317e63a92724745522b28bcc8c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd0d815762a8cdc4694f3fe457dcc0cc211c428452357262106bd9cad28bfc2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83dc40fbdace5b93812fef8ae135c855d5ef996d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c8007e76df47cddd0f98f5a1fb7e70bd6e2789340279d464a06e5fcdb73751 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f87b4d166f5cd7d758f0a9c42c6a13f347957f5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c464be6fb240c814210284010e68b8f4c24d0503783bd05237f975b50f98e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fcca18910e2f2c421a7596bb570067adc627405 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50dc386b9e139f9dc1dc801cff54c1147e363d71f844c8ee7d28747794eda9d8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6026f2956046a143ac3e144409a0ae5c2377121 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd9e87d55a1a3bf4f9cdb948a20f6ed7f0e28d716745ccaffb8dea040a16d22 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e88f64a2d0dd20d891035e6636961be7a2f51d2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89aacc6a2acbd1ba21891e1003c46d108ec9780c0d2f0f16244d3dc96c169584 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2442e1f59cbcf2c7b371a26e162001dab4498b9b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8829a2678c60bd87a42454fc06ecac202196bf579b2ba92d5748c165e470011b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2df4fd83adddc19bd1dcd5e0c4c14ac7f31618d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f1a574a2ae87bde015b08a8527aa108baaf3b4250f1c595845c638996c2a4f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e307cec1db8c9f0f0a0842c7d455189f59f778b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b549a0619bebc61bfd0627a95239d553af0ca3e29f66e7ad4f0b0b5385aece6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..329ce59833edb996f7c1081742edf53f1279f053 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b22fcab37b210e0559796f62f5b47af293d7c129eb6c7ba1480d6979d8b2bc42 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a210ea6198243dab260f5e8dce78fec9742d1256 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257a2f45c4fb80027082d4ceaaedec48f69a555be3bf2d204325a9ddeded4769 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeacd4683664a0ec9bb4931f8607db23a14f21b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50bf7057218bf108e13dbeef7d0c63836c335a075aaf2326e63373bce2bc4b61 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed84b056662750474a5b723f95748fe39a045e24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce094fc791ae10a2d3f14d3ef1186cd5ba2ffd64834a982b01d1848b432b963 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb19991acd4d60922a5ff561d9181c983e23a26c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9ca5f8cd18ac6c519011b171fab51b9fe6900d94747cff482515333c78dae4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b77be3af0eb60b481c873d2893bb2b64267a2e44 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed4e31b581912cc3a95369b1a99c08566d48901746afb9df495480981225e2e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80cb9513380a0c6497bcec1a4e30ae467d3bc981 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c5ad66d35123b8de4f94de5a9b715ec9dcf01bcb7bcf610dfe906e00cc7b42 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..62b367e41426798fdc107959ec1eeadd13a77645 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e55cb33f585deefa166179499f1be0fc8905fe584097b5baa37b832a05fb9411 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2bdc0b45a95e24d4adba57192940020d77ea11e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae80de0c1d1c6e48fc2f210acaf45c9e8f7c896786260eedcf924ad09822f6a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9bc0c2148a79153dd6aa000ba6dd8bbc0b94ea0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3140dd3c7a73202ecff8bee421b3eebd30ad6ea45b40b42f36b3f7493bd65fb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79fab4a89bf9e6f1b32dc404f5a2fccf64e96b59 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e109f591e19efc697ba006533857486b484daf9c43428437d6a81b4f35845be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c358e7f9877547387531bbf5ffdc765c3c79617 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cbe42b9c1e0ea7e1f3b589f9d01cffdf0dbead998d36ca9b8d6055686a370f8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..725da1712e0646bbb0f909f69765c9f8d76a55a0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679d4a2792f840bcb3f33acd8f5345de1444819eec5cd7cb690cd42865a2c427 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b116a73c8db900d744edb1b879ba2da488eba10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd3c7f605b3cdd75c7d71a7c0637c99f162d7709ae99358f108f8e1c708e0b7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb06cfa1886e815ccbf52d06d01c5676324450a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f12e0dfe488968898ef444cefe0daac08b76ec73f3ecaa3898f147093e114e3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70daf88afc60221d1057b78a8fc0e4807b2e627e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d72f6a8897b208723c98ede1beae5dbe71903a16fb55b661c48746b967261d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e38ea7de3c0e18b65dea6f3eca4690bf7c7224bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9722825410a27c8f4ddb36ad218be6275a2def4487a024a9d503d9694b787cea +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eebbc5b34c7520a73280f02c3caa4e0dd23c1e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a31dbaa0da55ae487d09a50535dbe196c0bd815c1c3aeeb0b9c13b08b2b14fb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2c08016732c6373536c7d84bc25c921ad672b79 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:406058389ff149409be480af05f730893b99d4a32dded7ec8dd5e4811dfabbde +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc8c1c80072cd886e4cae2de5b4d9543bb223152 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c75e78144430b9d14f076cf91a5c7e91be8b8fe5bf4c2e0e0e9dd348ad6bae3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc944fd16afa5450556beb9873a76b3c4accf47 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1d38b0b7b2a94e6ecfe0fd0031d5374d11999dcee4bacf7ac13c3fa88fb739 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..90daebccdefef5c545193c23ec2b285e58d7e864 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:161a9398d45d7e100b02a61723148dc0f0f2ef482b96337b3a02b1f70563537f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fffc0c6a0f9dc25825f002cfda888de2a65515d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d21014045b05c603d8229c60c79b6764f75f9b3240d706aeb85d612c0ef975 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bee69c0322bb6ed0249e46e454e93d4ded38bbf8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff4cf3a13f1db6e0342cd2338a9c4edae75bb84bf349346d3d590ac42912dad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50a0f1cebf58e7a909a47595a036cf935ee4962c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bf808a17c14a118c77f3c7f37520a6a0289e3aeb640fb33e4941ef2a154958e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a931d84c16c9cc4dd29f8988dde151118ba1c013 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99499c57b5a44cbb52be1ba7187dc699c53caed9669915906048257b7ebb504f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78739e1279084b33b5167754696da8c4811c759e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0427bce993ccb2900788338a8044afe4233c7180ec82564672bf665b5b51e1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb384964ce19d9d840a63aa84deda2edd1d56464 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b73fdfbef70855d270363313f48cb1f1bd08340642a8de778424fa8531afae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea804b52f7744851bb650a39cfaf12ec66bebdf4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbcc76935aaee6c60d574c8e621deb7286dcc21babc59de951ae3cbc1915df63 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e769ce25ecb79b7718de1440a04668aaa9352258 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66b450f3931e545eacdd7cece482a42ce789fd6a698e4fb57e6af7cb7fce108 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8f18e9af8c8aafb8fc2ddd0aacc45f868cb1116 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a4672bceed8ab0230bb2963799bf4445b5262dcd2ce4e5060191c492906bd91 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71a95f58833227fcc6075080c38c953490f1cd90 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25fbdbcc7cf49f1e194d8e475b33e51a50024ef563e023383bfea1b6f4d165f1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf51e3c3e7a97094a5b3e254a209fbe9f1e27728 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b9192e84fad4d869a50408375a1c6a38264a4d8cd593e8289ce1e61a2319df3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed96d0a2e77e8e08775417df5a0437b13eb45bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70d4085c8c6d5e0300a90c4c833aeeadb5b8f41bade9116d1f92dfb3828da7f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72fb1fa9c7b9150a82e050e9e498d16be8f14117 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f303b63ecf63a193f5769ef2f744868b0a28446d12bbcf23c165b1d80db31b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..589f267310cc4cadac7ef3da1b0e71ad7b9e871b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c903e3706e2f10243cda97486c984ed17ff5a6209414c8540d142732c8d76ac7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a27f99ab487875d6630af797d2833f63e5fd6a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec70c9ac8cc0eeb95cbcb5b93fd595fa0093e7ad093ad9a06dbf4e1b8be09c4d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c19d151179d406a3b8850abb5f35f6738a1d389 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9a5d663babc0c1108ec783a1ac9929e673a72a069ac50e9f59926da36d6089 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b55f2060692cdc830d13b3275f1369fb296358d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083de944a126ad957b690968f1b8c539bed3d79efc3cbe9c4ce6a34b50743597 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe2a0f7d02cd18508d4c7135408ad0ee70f4b6e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aa79f73e161a3281d47e34d37a7b17f1fb71460292c5671e53c6c1734919ddb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9047542044c18a1fc5e240d702321299bde4f97 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1351cf611ce4600232e60ee049d1cd61cc71c195070aa908c088f866d184ba65 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae0a302d8f3aad5168a1ebe83a915bead32dc66e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b48aa0c024a92abc5afa64371a3f1c2293a42b33cac5fbd9d1e913acc45764e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12117ed875b6a712c92b5d8b5d8d5ca3ea0568c5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc2c502de37cf866fb807e23dd4f5b3a7b48416464ed0315480b50e2a9f3da9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83a51b62093c929c9d75d97ec34e4f2ebe5e098 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac6fe71bc98917d3636612212c238dc700d3339a98205e2eee66c6efb0979e5c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b4d2315358c7e98c59b02a7347de9da05f8046b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e52a496d0e4e3710a6d1b84b6af7db773d91ba770e1c7c1a47d33ab9d73484 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0244f0a3261050da8277383cdbe0248771a1f0dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ecad4186cfe081a49a7fedef0f4f040841956a2a8120bb29b9d456c9013815a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a08a1af50fa633e7211cc42a1d23971e7661cf89 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c90c037613daba66adc88f05215241d2f843eb8e146cdf684c728952c3eb3c25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d465eaa2432f3fe8033bb6e509209e191b8823 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec641ab8e740f1485a6292670dd7481499e5b3fca678be6725e87f8c731497f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ec332bf5f89ee1c1008c3271cedb8faae0344d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08054e3b19a457d4af3d50c2448762bbd279e81fb46ba05493fe8ddcec2e745 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4989cbd2ff068e992a2bdfa9a5e6c20521162365 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77edb407e0e17def3668c331306e79380a138a5f700ef1a382ac8e795cd29335 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..730b2abfcc0abc13538df733814872c748c1ff8f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07dcd7170efd463eb20c6a02c575f27e935dde78248f05ad68242b5c404d05ec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91279edc3385e6757eef60292ab6493a0c9376aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc1bb853d9b8c3bba97467e5c06b2e6c541ba2c91b15f86ea8c5023bc7ab690 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e8f10d56c4f41c52265b6fb1b0af97cebc583c5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89bc2ed6e818ec1f98564fbd543ca3625ffb89b0c169ae5461bf9f3e91df74f4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f470dc9d27d91163ff3e0d90ac83847e9a6f3d5d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5c2384430a172915fd77ff552e76d502ad2d8c25ce94b7e2e5e0a7e3cc627b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f07a42b2e06cbaf31beb8754aff5cfe76825f1d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d827580f9fb0b8baede93993e508886ffde34d0f8dfc5de6f65205fc95b51d34 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea2cbf6f5aff70744f8a8aa6d75ba29ce391fbed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68faee27a056dab3269ea49a396c3d4c1fea8eac53c18d0c9b4a514d209bccb2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f24a59d0563a2f6c5793b43ea59f189f015d40f2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d505247a05c69ed5b1546b5a45db3c1e7e74671338283b7d929649c11dfbce25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c999920bf35c00dc879abe3a5dbe02ffa39c497 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1725aec5ff1d5bd385eeead18499064b253a4144c59e1b6640f55ba61b5b7e79 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4580c059e3b156d01cc8e642c09300ab38fff01 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e5501ac0aed1c0b3b6dc2e128c990e082c7bd630356928e92731667036264d8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a86e723315eca40cb45886da699d9421f193bf7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9507da7eb28c9ec35d42fc5c2786846fb7f27e7ffbce0b81a645362ceaa2d2b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3795d3f2c2e057205c01d100ef79f4f7184c37c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f046714018ad9cd6e076b31e7a1035e4f82541d5362cd389f58577f24a44e8e3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f02a2dd4fc71fc77b081b94aa9b9bee391093ca3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb51cd1764e959139f0b9fe9fb389d4653572ff9888b8d9aa6710054ffd489fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0158ed878d81e5fc8c270bdeae96b5b75b38ae2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e265066705bfdd6e2e773ba509a7dfa0557364c418be7a59a8e5e231936766 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed4fea2fa60d3670c251eccc8e8595e4bd8f67d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f89a3eff7f2e8a9923f49892fd31ed5774f3e1e602d46b4e8b726952478c21d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ee89bd6e5be70268a66332499f72f24ff810976 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb263d60c30ccdb06b8797d6931a893d86216b4c06cbff1c17def21d94e51cc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfd60b8b8e4e4fab8bfa4998ede1091613ada17a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9951e6d9391d6f029cc95fb66f425c5168afda5f1ab687dfe4f47dac86a846e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..beff4d8db0edb0b02d61d59aa15bdad6ee77d5c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f58baa5a4bb047607711db86f36381e7f08fa46c8b08eef036c88612c872c9ab +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d6f142a3a394d003542623846ffd66538d909f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c9bed88de84decd3aec49cdf1c345a1898332c8fddd61ebcec33221e5e0814e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82b2cfad93dce6ccb31c4690790d4e7b23a24f9e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2351710925d66f8195f2b4cda0bf4bd4c9f710e1bfdfc5ffae9aa7c363b2f5e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..442b4755c72846a7b0f15b5e0a60b234fe7cea74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8adfe8c23cdc0669cbc0292462b2474720d979cce00306f9e607b3555291442e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ec511d15c6497224ebe44637b9f6271806d841c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9f574583b1a7005eb50b83f72881eb58007b6babe1e287aefb2e04d6ed57b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..794381718127a7f3a3c406e240a6c78abeba7f95 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:168f576999d5c1c1e580737b2919be561f23830d599430aecdf0ac2fbed07ea4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c25111bd63ca2b8ad1ae8fcad30301d43e731df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:981a4050a4bc07d8a60f77ce35df6ad84d2fda7847f98ee7cecba41993a81611 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e53cd2b6bf36b49b3fdd6845711d5ef5a8dd75f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:817108896c996a7da1f9ab22b8d4573262f42b280310a6ff1d88cccdd1a238ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbbe3aaa4f4a75e0fcae875d54b8b5db37b1d495 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeab321d80c166a2284866fb7beb07f625748a8d8387ce9a6bba55cd8c0b648b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55af0538bcf7552865017ef5ece85a3a1cbf5d53 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:722132ebd6a108daef1a815cd246c91fc6f711ffc21a156b7a52f7dd6db0ac73 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f4a1ac58c611461c16f15d26bb0ac1e969a48ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_0/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f625b7adc7132917053cdc6429f673b8cdeccf474d4b369bcf3821729e24aa4f +size 11395