diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d21c439cce7f175491ed6085d8f914799f436c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a63d286686cef7e1a88219cb19f9019238d6b80fe317010ecfaea17b653511be +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc2d4793463277c3c103d7b79cf26534ac5ff1cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175063cffcd0fe3849bf8e0c30a95aefbf2004ec5e9d3b0b5ccab5a69c2123c4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fd9317e479e34ef8eea6ead4dee4ec03604931d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4abaf283c24b88d4a5bd1c856d0dcf1ae90a20d6a0389272196dd2fa9fc077e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1982950221d039b742f32f40fc7e1648dae69d4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8dea1bfa2b97fa8454b5f5056ae4511d1aee5ecc573d4f1c32ddfe1ffdcf098 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53279192c8daab117bede215948f2849f5f6b026 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09b1c4932597015532f16d30b59376904f67fdb2a733b585b72ff1d24c44ed3e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38b1266955c732ca2f07ca94d0ded95db72cffed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4f41bacb44dd2cc12c63ec81b4c3fb202a17625aafaffbadfe16d4bba759a0f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48ef1e9ca208c26474d338d5ffb7eb1f8fae5de4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c189dc3a70501cfe33d08adb18ae3c940bbf4365ba9036eb0a7961e789bb11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3edb6fba3bce793da8265a6fcbd57f7c759e2cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d06db3becaee64ce237d335d8275ba5bd5943af7c6d2bdb066b137ba2734d72 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45074ea65c4731d90cb243d08f422d6fc2f08f71 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d0ff9406289fbc46fb0d1fafb11c9f59a70e59ce1c406ba7e4c2edb1b31e803 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a534682b98f63c34ac6dbabf3cbec0b4f398d50 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4c34def52b9d74a55b6a7ee209a923ccfa2b9acd4f64ffc82e8e1ef3f1e0110 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70e43fde908f4f6958452bea13f489669e3468af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:828c11aeaa87617168d7f5d27b7fadf38061447215f3f20e6475aaddd2c7a01b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28af6392efd7ae567251646444f73ca30262d7d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b3a1c017641958de8c7ba27de0163f4f7ded0d42881a58aaf8bbc6d615368c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6bd3aa9cdf4a60b9351d052ddfee8e6ec0c136e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8128a89902ce98fbd0912798b7c39da2c55282948f1a8d7644947d23be1c00d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b224e8c1e9100cf34a28828fa7b82be8e491b006 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beb6bbed83b4eb7bd4e733fbcb241a41ff61483d91d2588bdb70a1e56428786c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33a5f77e45735fbdc2892f963bf202d64cda63ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5abc67005a5a1b831938e9bb7eeb47523f5570d1a95d892b6da2f6c656f2b306 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd462edf5fa39add5595d3b67dfe3039e7f90839 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db852d18abc43d31e59d9b81491e1b861cbba5c2561e1bd12d7e423e1e38e596 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e3c218242f16a5f48e2777186b76d9ed730290 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df178fdf5e1f819ecb94eb4d7c42962793ef060a2da68c8b365dbc17f114ada2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5704548458f97fb43884fda19d58805cc920dae4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1220e2ce344ec474651ebd6ea3d3f89a7ae957d25a00b3b71593f1cb9d366ce9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee3d3c9c4875dbd0d0f6783b8aa8aae615d61e4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498290234d06cec336ee9d1d3bfc0b7c2cd1d60b8d4b6f4a234de76a7af32dfa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbed0282c1cc78197bded2f893695a51557d63ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52d52aa054ed98c970c82944694cc6381d9e19e8f92b39a9c1f91ce1b8565241 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b6a3dcd5dec91d9788d3223602951f75146263c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2268137a0c09e1a6edde009b8ab13376b9a85afd9d47cf55469e4eaa530b8a00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eeec7a44b741706d740249b7ae3027f04ca0c4f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba26e06fe7b3941a2708ec1ac604877026c88e2bf581fada3c5978c22560f98e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a65e2b12d5132df40d47d2c4230d216dc8bd45be --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f01d070e594a6faa8b85195e9e7c97479a0249a27ec3fe747a682541eda3ebb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fa03ec92ee40f38c179a5a66cfb8de2e2840603 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f96e425a7a89cb49faae2d1670643efedf4eaf371e3bb7214d58683cbdaced +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9b523cd776c96c21bd5153162a8238044271cea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6dd986efc7ad61d1c9e8df7bff4b95507bdd205f826afdd69495932a82e5321 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d90d235fd75d5da3f24c8667de210aa4b3ad0b31 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5f452b5524db2b5bb608d4ad566076ce75925a8132372224b9fe4fd6e8f041d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67211512292bcbdf85066cab9aa02ce0a549aabf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8822852342fb2a912ff50da0476020157b6ac8e8ccb15bb7ce88672f01704619 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2e20f3a9266b0a4537cdaf763c9f4d5ea0648cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e0b4a39c31538b92729ed27ddcfcff4647c5b32ccddf9d8a971a4d46a964a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39256ce3cf90e4b574342453d028681844453b0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69bdcfbe490e9acbd8666d9c05a56a93dfed761d26051527abeceafcd3a03cb6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10938efaf4b81a39c27b581d32fe4fb14c3fe12d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4693c1974e0b98527adc2b7d69d36bcf94f74a6fffa2dbf840327455a8a2dc27 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a10a61128784dcedcea02b71f0a377b765e3815 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20c28eac8494910ab53d9589d9206540e116cc294827b7dd043cd989d90829fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4904fa8d7493316b24e6604003e7894054022c12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb4b617af4df0df571d6e05a3325a619fd78db42869f36b0e09ac8c0d7c454bf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..11e32ee56298a8bd4a535e05bccc4315fa54547c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a093076516b28b2f97266b54ead865f517218413f1d742f86d1bb99a9424e90f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d3402fe772d09411a91cf2ff5c65fdf91245d3b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe5c69b6edce9c2c8e979395ed01493d66803ef28bac85eacb3b05998ffe44d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d576a3102b423b13b705f5b88c238a6060023a73 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07699a24bdb7745d8577007068975bc4141c5e2bae6ecbaf78e206ef878279f2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ab92ed3b66b6bf0fbaa372cf6240508ef560828 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8818519212d3925dd22b52d9223e75d7fad3a293cc6b58472852122d24134457 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c53bb6219611bebc50bb84c010a9eebe2cf99e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09fe7be6ef99a9db7d14ae3490ecc826b15b6361121c6c81b279d044376cd91f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f243881eed741146f0c4a243f6472a2c7561454 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9cddcd5f25a790ad58393a187446b232776f8b866ef4a2322d1b750fd5b9f83 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..902d1e90796110196e2abec3f907f9cd83e77ae8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e2bed86c776bd7ceb21012cc48f1612daad670dc23619d0102e6bf3ab113af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3096a54bf26849250573d4b6a21ac724f3fa4c4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43784119b866c1f6d758a466c2588da0fdfb6374a19fa7c85ac61659a948a7b9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19a17356bb7904e4e158b80434242c24eff3b5ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e48f083e7b90a9da0a53c4f58f32988b871047733aa1c8c587a81533623e7027 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9edc9c10ce40d37694053d295da4328692ff35b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303795d85b0d9787352edb8cdf0b46578f95c3035ac9e7f7657ad51d896ee0ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..85447bfedb6505f8e4da7109150bfdb16895800c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6772aa7efd75177da04d08fb408fd1ba73e0df23bbeffafa898a8ab11e26c3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16bc5f0127bac19ae4f59485f334ad2360b6e589 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87155a1f8abf6b5104a94d68e90910328d3d765579713cb9b0e1ebe8880080a3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c26d2cf530097169d4bab3f869e72cdf95b63df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c05ea1de571bbef41325bba45a7f68c97876edac2f2d73980f9831d51d89f42 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db37ecaccdd91af4bb6c0056c353745e18731fde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:478442321acd3f71e946993ed128c6edbf1a5598e80429c1bf30ffc5885c6eb6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d28fd8a39e0c0236e19ed589b4d702507d8c0cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:983f0aba148781a46f62ef2ffd4bd39a8ec9ddadb040f135769ef7afeedff498 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..659c4f9d2451c145915559593c303d6b33c78b16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3caea9ca9db9f1aab93c57e63a1eedb709335d5b08fa18a147154e331087b804 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6f465977056e76fd4e811120f5ccf2173210f58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad99f858fa7304ba9dd600393641b1290fc0f4b549a5308554a8c8143461b1a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..729f40146c6c7458806b80d172db498babc05822 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdcba00c81280915ffd2c584c8f35796a59aac974b82048fb1b7ba14d294532d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..01211315801624a960ddbae1c9d1a979b189f8fa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9ff4d80e49aba92991df199da4d9aceb689e05feb75a1db0b7b1c814dcf66f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2daa1e11d1d15d3884d34a33ac4d1978cd6880db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd6675320f82ace7bd5c3e30ef31505de3015b71d888d08a58009b8f5680e7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a55f2ddbd00ed6c82bcbc7aef74ed301663dfb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cacbb8c29e581a93f5aa37b3bf410011f237dd9b27f975a29cdd95c4f50eecbd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fffa51db2ffc85510aabb0816878b99e2a07a55b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a278e8df5eee84222e193772c6b55019c63303a259b603f49d856e4c3fe6e305 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f28ec737099a0b5093ba7616794abf1e2132aa6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:960b9578d77de4f4787a6ca705627f88be61199ee7de38074503d8b467b75c5f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1246583244b661be5144735ee4d0f7518b2b6e4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede9e8818bd995f2adf97cfc4ec62e25823c9243bbb86d42e68fce68047a85f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d514f305268f31eb75b8c26c90f746f1f86e3562 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b14fa049a38f94e189dec1ad4b433742997cdc352f19ff8bcb493fbadbd12f4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07f9d859488d9c304f1c7bc24b4abeffe79a1ec6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f5f38b046ddb30c31da12715945063177ecc7c4b6333c3589a32f61ba79b9f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4ec58df4f7fe6cedbe45a77fdd8381931792eff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e80fedfbf6fb53241b5b5d5f31339ca768a0dc2419c3d88a14dd9862074a6b1 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cde33ba97e933f19d4642bb9714272cb09743fc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3888a099fc84e75094826b3c01254505de447cb14dd600820748d6c1a5f305c4 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..014901c30cd158e215c04714b8ac50b08aa00d55 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d141bf7691f2481a5e0108c4f7c665713aeb1d86f91890d22a2f9e1bb382921 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19952c6c369212a7eb794b6f3947e75977527398 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e68dc90c8c22fcf19f9fcbb14f230dc821d96de1ae7a604b947c475f15f749fa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae0b7355fe4e5038b26959f93ba458d819ebb3f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b46207a19d51b32a2f65763204518aa0046464ac19bb5da25b20b63de81c2a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06fba70914ea181c5bcf466a6ca50a79c390aec3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1892be84eb12da99479789e9b17f564e0444a3f7113f0e90e2f21ebe9ae18016 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e33690327afa824bbda6e4130a2cb72ff73d93f6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f7c790112bedc80fb7cb98316aa270cff45e638eb38e5a5b86269ce88d0c684 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba71eb0e6521027bd5c2fb91fc936294a7a21d4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:add19c856d32de2d039d4b6620db11c9b2d8ce66157d61b743e403f25e389eb2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7812c71905d2dcf5a3a05a3f7bfcb07b904fe1b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ebb3c16e5f0988d988e4e1a4c1e844e77feb32ccc4bf9097a86c67df85ea3f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc6af9fe982ae9abd91a4532065ef07627088195 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1568304d1fa69bc86197d63b7d6437f6338caac76ee157d6460df06d58f6d75c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..52dd2fc821876d9c150fac24b3851edf384a624c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffb6d769340680524769e0cfd8b1e94993e366232a0d5345506418c755b9440 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad2a0fd4e7446b48dc5bdf15cded2ab595a236e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da087830c10ca81f549ac96bb502e652e95bcda481121c0119c4d78f72be0000 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..745bff0e791fc048e2c386515a641d5c45dd441a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e679fdf09c6b98934c2d25499b91d505e64fb86f843c2e28a5802eef8d060738 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f223278ca5b599559bee7422e153f7677dadfc12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739e24c907a44a97e4a5255581d8c3f71a1b6bc735a3b58aaf1e02d39f3dd4d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e6572c81360cc443652a75b4f8b5e5c038453a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:785ef2996e3ae52729a455c0d4fb80314e5a8a85f00531491976c4e0a5df3c0c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..715718f8b115ceca7811984fec0dacc33d4dc3ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44fc607e52fd402f4d1560a5735dbd782028383a977de328150e6eb614f78762 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaec86bafa9d2e7ad72b414c6cc7523763cd0765 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3988a4a0031d089136f004192b99a95473dae4653b248a2c679c6cf5dea70084 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90c913df50cb08b9db4fa86ae26652e413648315 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e4f88f5d4416fc074f2854ee39186261d96ef6f0ab8cb1c31fb483afaa1ff11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f663f8c1e3f27789be87562f616caf0ef0895fb8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad6fc4ed5ff42c95a4e204c7845916a5b9a4b8fe0b5eb63476638c208e6f03e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e5e49ce07fcd0956f6504d5e237f721a3b6f4f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:781a33c0f89d565fa25e773a65e5adfad3ac3168fe56251bfd773962cb1ec0a5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8ba013ff6e7473c15f6caef8d895e30bc88b52 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ad1b45573fe34f4fbc98fd4dc2905308811b9c6503ed5456d9e0d4445a4613b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..310528ce2b5773f1249af60510244dc220da92c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe5315e32be3037f11993708cb488ded67712001f7cc99c0a7e0becb7255b17 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..abaf908a64e1eb0201dbedea9ea0978e05a07baa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337f155008559679cbca4bb2098df882e2ff47372af4c6e6dba09f5c6ed82f06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfacf9f2fa8ed2c3da6b8cc31ab66482979f18e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40dd50f5325dd2547b9ba2c4006c1346af1514584ee0856bf4bfe71836965c08 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ea29e28ed603fdcf1e06bfef99045a469e1412 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322e95f0be03747e57d0240e5d6b14f94f3d89ae14998b5d5a86ceab721f6513 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8195e3d7ca0bc42c2afb520b974160087732459f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c27e87c0cddc40db0a6dacad3d14b698350b035f0ea41ad6549d2611d095d38 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c18590f1e785a9000ca699c75f45a44d0fa06d5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc3262a7c0b8fef22fae8485d2d5098102c276eab6e07d79c47f80546df2a2d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c0ef516945ba9cf3b33dd9bee4e3f53032feed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4191c4fad516597388047097d27ba398d0afd8983e33f746cbff4c19cdf7680 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef07e01b9dad1a92a4bb0a62f385aab1dc5bb773 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46ab99d1af7ba92c00a13c9bb2659be11e7257896324ae618139725106e8856 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b65e55321739179c54775f650313b6c45f189ea9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:047d2edadc239bad9594a0858eaa08e425b2267b6a8104704ef13919cfa4cdfc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0bee787ae4b699944f0be3e1204ffcd9b343198 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ce23dde05b96e6a29fbece79865e5859ca0b4f6c9c62ab6f27a04d12e4480b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f32766ff5eec96bffe454f834bbe7ccbacb634 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1966fb78f099c4300a2688be37febac84e6e1f8f7283ca647886e7f9e9b06efc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae20ebbfe15d7ccbc3ac0f5e97c99022b6bc8b07 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d8b11dd08e9906460be6f6042f1976834680ec3de3222a2ac5466d4371f334 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69ef11985c6081c454f014635143099c620cae7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4662633747bc53d7cfd055a3cd71127de81c48832b5a74d7fa01df54a3b42c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcbadc473a22d16b4d8820f811210b277ec222e7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee97fbb4633573eee0fb21224dd89893321fa7bb93ff6b92e01a8214857a65e6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a34de719bed49242856eb33e7bd94d5a1eb39b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3fb74f289a33c109f8dcf6ecf8822d4ec27821385297a6b8ef0ec9676b4cde +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c38ac1e69a619bce260254a450c588466026f403 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68eee60929dc9c6c4da762c24c0a02f085a523567590649bfd9c41d25ea3edc2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a719697db193a12a7ceae2acf0afa4b14f0bb53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37a1c4fe0fdbcd734690e43fee744a07f0336602938ebbf508bc8b32ffd124af +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..609041b7ac0cd5e34fd4320aa0fa0367714eceae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998bf75c4e6d95071d494c033ec87e1484983ea1ac2d0004b3613b42d02757f9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e983b5c0f59b77b5ad4167ca69432123e3b155 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f90e70d89233096108bef95b72186f85ddc1571aedfb37a221750fff2b5afbda +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3881ea634cd2a194b61f2dc7f55b1020fc03a64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3881888c8da3516f9b4bd2dce456365ed563d115d427a45bc68a59e6e51d4316 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a5e18a3379ed894d4e9568822e60fdf3f1fe87e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10fd1812c6a5d67c9ccca4f0a62d357ce9df2cbc3c3b6cc02d300d85429807d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..018ad55de46c2a54e17c66136bb684b880a247a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4f4947eb82a490c3119f2bb19a38be737af33d51e8399b35bd5bde2b1f5642 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e002158c745b640c3a5beac9749cafffe802a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c182938d67e897861ecb390e4614c804ceb3948d320d9107a677c946a029ba18 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc84a268f3e5b9931662f1cf862a8d2a79d7873 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58dd30dac6183858aacc3b524f75e918b2edb405cd37e640cb60b9b64478df0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb710107d65ea71423d2f4839460e57c186d3fe7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e65b39b171d76fea5d58a637274a7cc4f2730db6551a177b5b06a25655a9616 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a48d3c487ff5b198a1659cb16e09d939d29aa06d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ddb3e79f3cade2396a2bc4ef71d8753a97bd814fbe524e098582c89ca32f724 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..498ecce5a2bd4b0f3e926d3383c9ddbc1c57728d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc6e40f0150242289fce713806fd0282703898da694191a2656098f627b429b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a64c9c17384a51942e36995cc306539e217d4abe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d47075c39c9acd1c1ac4f69adbf7a49e788d9b34ef0a4cf0884bc2d01855a5a9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2be97e3cc93f2faa59dedb551d49fe849d8c82d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2243fe4d23803f07d5f27a3346f78da09a0727ed1097844630ab6581775cab +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd218f94b41056e12223cc6ed89a8d558e031d5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec851ef8de34e0c26b953a805af68233fe4f32a66e6e6979b9374b673192f3f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea307ce525f2fca524a57a194766f9184d04d234 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04a70d3344bdce6a548e4dbc4bc2ebbe55b52fb5ee5247e21b878df76cf6fc7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4da4a0083c662209ff657cbe82bcfb8d848cf05 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4607b309e21986e0fa5332c532430375010b052dc9e5aa94b51c20cf6ddabeba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c6c6ef5703ab35279a7f375d039e117750a5e8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93efb114b2a006c4f48129de06fbfe824c969028e2a244887cc1eae10128972b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b54e498b596676de010d4b288ac83804f32c979 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da3a9a21c289a7e9b89dd3396e7ac886dd7326a6e7785879ea51103705dda7fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..701ba4982d81253398397823211cb9c52d1e2d5a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9f8af171eba42939b47b46fad34964ce19d825999445db4961e7b1d3d80958 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..457a4b091c76599250db98cbe16e4a730d2f5a66 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3759c34ed90a7e135ebb545d166675be1f637f25eab88dcc6fcca628d5461356 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e33a6c511929215472904902bb90d7437e691df --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c92acec493fd82a7ac700fd1b8218f40a69874cc430fce0875b1ca67262e73b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc0f65bf985cb8917a104b95bdeb91e761bcb3f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3041845daa32530e4cbb07d135fd796e216c51c335eca580e65a476f2f943bb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9643184c6453f42514b1f4a3e67c8d9c97da3b9d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03560adfe23e816a940d13a02a081d0570e763a0799f318f2d64efbd4b68696a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe861345f5867d79ab367f0afcb6602ca07aa8d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2b9ab79b332b5eaa53931bdb3647a8c30c71ebf6488a4f83aca244cd34f694 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e4bd196dc7b88a82d95fef32e7115819acac485 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb565993cc33d42754fef7fdbbc4571e27d8154be608279c85d52c07b88e362 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a326b58c88e89e943a0eb5f0e780e1c77c4ae58 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c80eb7da21f2514862ec0dfa87db530e8ae56ba42ea82b063a6b9b242d4a48 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cda1965a4e82dd0b5682e55c84dcded49f494eb0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:785fa84685f212d0be67adc441b6c55648af855ded999914a5164aba2f60d108 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cb0c34388623a81dd28ae4c833e9afb4f2d236e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1084046e022d88636ba881599d2118b90c73fd77a17979082749c72f51c96e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a416799696af6445090fa07844419d97984f37 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c556de819f5443b585677a1a60c2f6de7168685be092c6df507b7e6c83c11a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96755b91114b5f87658fa1e0b9c5689985f1ba70 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f79a3ced484fdcc425356467e8791dc5da4f6cd481ec1ffd43e35ff62f3796 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4e120702cb1563f7de27a0555c4ee30ec9ed64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2c9fe3111276e857cb9e95f13432d2364a477b9555979807ac197afb339356 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b388ef2d62bb3149f4e896f113b933de6188b7e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c167b0ca86f6f408220ee71e5fbd5d1df913f8fac029a0b4fc2c7212619365d3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa94c5bd500ef6f9099a0ebf3ea254f4e82acab9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:118e484c16fe90d664e374c00ba8aaacd1777119103666735be3503436132d37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2db047dc81d6809c5f1c39b0c4b5762705e5ae79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aed5a515940ef93b79ec7ec1d0d8603e26c260cc2cd03c6ffabe03cd9d531f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e8ea84dda24c01b9fd61967d572c8ba2f3e05e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c71fc649a7ab9dd45ef651f264209e625966036dc29211bacd540d1f4fc47a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aae53ca15981b4d25b4c219b4328da0fa8a9d5fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7b7d7c5f2bdda886ab4649aa0d86c406d5bdddb8925ab3d5e110f87379db7f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f23ff5690e2c1864bb98e4d20962534dcd2e9246 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c992553e1baa8a8b940780c9326be0602008ebfdc4e0ec2b67ba6f4b8d3e8f45 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfabf68e5cd22d066bf338dc550387df612f2073 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5b59281b1e77adc4a705cf9def34eda3a4d6f95fd9c8da69cfe4aebe97f9be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34316e88bc3e4f6c97eb853a2cbfe9968051eec5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518f09eea56fe05f36e8ec6ce4fa853bf278cbbe1bd9dac0aa7e43c0834b388b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..909182345b91a23da14ce6f68aa7858e6636178e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb79efcfd8a0867e3e2adb4a7c9eb53f7b669984af5eb5f44b7a28e67be78e1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0423248b62bd8d94191160a0f42f05d2ffa5525a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86d0602f71a9685702c45a62620ef9b483ca48bbe29696a704b05518e9db0f72 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7edd86859cae63b7d362aba324c728b921840da --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6c6fcd54c0f796d36f2e62b03ec0f4274ac73210c41213141842cbcede1967 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7470486b1f51aa01edc11dbf9f4058c7cfa5ed07 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0647b3f7374b808f606640ddbcbf2783842a4daa125d9bb761f579c33379c989 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..495a73efeec358cc4c6278d5f00da7990f56f481 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87c3579873d066a5907c9a81980d5bce7a4fc4b0d2775ec3040f1c8f8fe272a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a9d30773f27a16ab9196aecbe663b4441030f65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a64f34e716cdb5a22abd51c04ad6f0a8b31ebbaddca5d47cf2508c48a3116d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fba613b53236f26ff4a700be9292be8ad2d6589 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd978befc17269ebb089062c543af0c81fbefe1cc5cdc8027755e5d84b825ed9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62b12e5fb9a444d6bdcc9b6b1c56d1ddbb4608a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96827726b512ce98a382652b08534139ab84d81f0de1c0abf556b98e986806d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..476b5fa979e62a8542525e0869338649c653cbeb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6f7304c7b03a594daf5494645cca26b924805c17a9e8c6af59d49f0585da50 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0b0aa7374df94c89e2578a3c8e0ec74114821bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e772db01af98a87a61916a1e479f6c29bd6aa8b10f76fb44906b72ede29d61 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf2d6f38a2945601fe8b5c08ce10cda264006659 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0851b0d02f6f5055147292594a382e246277f2e8edef88047d7341ab1fa69ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dedd68ea0d6e2ba4cf58b5ae451f8b5832f830db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d29e4f4c14d573cbfe9c488a223a97c21eb2212b60f1028e4f62814f8bb8230 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f68a52ebcd48516629c1f5a5ddbe76d147c725a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56becc9e19d254959d4f9a2be5cd5cb3fe7cca9054e11dd2b2ae9ac1cf43a14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cf8155ae9c71b8794adbb95776103d9c0d03b61 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6b7ce585d26884f22fa4b012465600f9f732e676213307cb1578c988650adb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aab4f3755f0772d052229120d60de1030f5215a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c927ced0a0855d24151e2ff572eac3a22332f28a4b2fb5b514e22ddcfc3b2b19 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b4ae1dda5e224d95c82cc305fdc56724de8c8c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73064cf82b95c572b10327c4e541515cec0b1cbde7baeb21ba42667e5ada0d8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e0b20386d8e31f0415b2d36fec992b2c1544559 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec730c7ef98877e8d76406914e919a370d6ba59060c733027f5540ea8a3f76b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97634e7b6e56b37d76f52909cf2449586c9f5fab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c954240824adbb746a5df47b3fb273e33bfc07f027ca2965305b17533883e329 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a0c104f4edf2c993ed8cb26f675ba3f5de20fe0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c06cfb375deb1a6311af691abdc03d8fdef9ecd83eccc6496d154e29f1003d7c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5eaa28816addc755e79962566c13ec59bbc06984 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d241e16920825a952ab76b4a9cc54ecaa391c76ef0d8e559ea4afbfaa4aa737 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76c862333b0b8c2f91b60af503292f3c98aa2925 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d32f1ca78a6979257b941fbe736c77f3098a22292b5c32fdb92dd150144774 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95093052e30a3cc1a47606fd47665d3cfd039d9e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fbb9119ad2feb86a57fe3ff994a7a59c36041a72bcfc879d63d0f90a1e8695d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ff1ad1e3862e9a8465acfe57675bf7dd8243b4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c29abb0359a34ac309fbdd31fd96f591224030474a191979cdbb7c9f4be808d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9494c0ce6803ad0e4af887ba4189a058830978b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfdea7214ab6d1e8877910983c5293ed1196fef1ff726299deb2a6a9a0cf6017 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce48868e87a33054570cd1b998e5b9b8e5d4d369 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aecf0ba27da5cfdaa06ebf128d1f9649d6bc25e8313385937e88a1deeddfe2f6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84528d66b2ab36f7d5d81baf34d247d4a60bdcc5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bee52d34151a737e3700443f66c92b7edc992b7e573266f44f8c162eea290a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93acb5915caebf1262c3aaca24df6db2d1db0da9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58eb372a6e5ff06da46e52bd9377953880aae5332e1479334e4838002a6908f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c252cb479f0face486546f790a3d81401ca9efd6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d45b02dd22b5b4409f7eed3a107fdc8b03c05e45e4b0fd38e2c763b9f982e54 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7abd4547b79a0c5aa7cf8597df05a023b2213684 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0656ce9cd1bf139e5235d308a939b7110bafe6305028a0335ac518e49be1f3c9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7043a4c5d75de7627a9439b6eaf7e4653c1b2bed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995cbc399c9bbfe1a24317cb24eaafb950007e81d03052b83a77fd834685a11f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a68c97d34c72dcc8034184c72b28f233131fe561 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9525de96909450985911e9197525454b9da9d2eac658dc43ac81b8a611d1be3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d30526e14a9ccffe7fb2165ed05339ad5f1326c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d161f45b19b38e137644b277df8c89599d38c8a0114357d01d497554c20ea5b0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89da139d8a1759661a59242dd6eef5a295ee7cb6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aff883c86c3e8b1e7746772665d35c9d4b7fa08620578a6c8cc76b05d4c30c3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c3eef293f0dc677678ea764be9abf45b642ee94 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:469131ec9bf9e7cab656f0f2fb2ad009560b73a0329ce7591189f73b43ed672b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dec02701bcf282fe676e1316474d9dc1b827e65 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:307a2b08b34b098dfc61c6804230814e0d25f7e7621ad02646d753520f9bb688 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5333f868661c35286f31b2a0a630621ed78f27e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4efa1b0926f840e5b37997a8161bfa1d04d05fa4421b2ce7d28c89900462f35a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7c9b7c2f59039de7f9c461a594f677d888eb7a0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241af8ff7cb8307410355d321092fae80fda9594bf7b39c023e0b23537b2ec42 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0e634305561ff69e088b3b10869d2cc23a3b68d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2a28ecfef909ce707a975e66c407e4b27fc5da9da55617595ea7b7339618f20 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7276ecf13f9eecb8bc5d47f85278ed18de6fe6c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d90f36a9a77c8876ddeb970bbf2636b91394cb8a1671c10cf82b7e41198223f +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7cf90ef24d898f1596ee323d2bff24873b6a189 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98426ea676029c0ee094daa8fcd4dc8cf1635f5890138fa0114af62a50c34f0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39770f8b732226aa675cec87efcb3b6b4eefee5c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0deaed1382db2ee2618c9279c36492de4776397d21f1749a8624ab657ee86289 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6df40b4126e8d83dbed5c8d8f802cf05b9048f2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c9bb9f3babedf1451cfb51d15c110e5e58b0af13ba069ae414063c0c37eb09 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e39a5b20fcf830e29a9853afc36bddcbf3d8720 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c48e4adc9dc7b70bb6842b4b6ae17eeddcada0118c6e86b17a8a81183715be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da25d4a3fe0e8f9d2130f58e5b4f862f019fa529 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bef8b70e8dcad15bdf3289ba67f6e90281027d23a8c0b4d5c40fa3ca07ee846 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7fe7ac3610a5a8a79198831ed89904e2314d49e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a6332d19b1d4d6b3d681f41092a130c55d8e69b236d2b8821fb5b2d471bff00 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f554ac13ce4d475993007506441f0391b44a6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ee01c5e4095164fac81441671b8605712b4471822634647a9ac836c7bdb445 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9196cdc268ed20dafb4adf5850721f0ee76cf7ab --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f74e365a338b59a0836f09df2ec7869995c97ec29f23e6a060beb09d99c59bd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..954ebe22c69ab003a11dbcf392bcf87446c7d2fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40890b00bcc547838c030aca2815ce99ec96bbbaa6a86728f897d3e613d3a3c8 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b84bf38005bd1f58583ae03752bffb25009d04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69d84a067a49cfb2d861b054fa5201140b2167d50e8833e96c1e959b31236b53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f31c6631b864402b55ab349d278a2546add8671 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:627e3622a3e38a7a65111cdbf7da004b1509c6a24d021cd2b894db41de3742ce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ed9794918b336c54fa6e274013d69d1c3e244c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2e84bb746642daf7456e620a5e95de8931a2fe71314e3528142ec84bdeeb65 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e864af8adb9a57ec8f2f79fe342a1d8bff54d8b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a642f20de32d3a2b70958ccca102c16cd1db175528dd722edbe1f8810b2f856c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69d175af1a9340339d8aed3d8e9e152e593a52ae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9957ea45543678897d36b3c67bae174cf541df0a848781d7eab745adeda7afa3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e22e01844f9894c0b5fda9077c43e89e9522075c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1da2a19ff80991f02a59dd2dcee31c89c83193d5c4ea966793bcba0aca67a5a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6714eb7249caf6b05b90a0a9b53f329775b0682 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf59a945e4ab969aa8305b71941effdc0e8865ea884ac74a43e839cd26677e55 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd7316c726a1440be638ecfece6969119851b8f1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:862ffcd0c82c20121418ec29af5c9643835de4f0aaf6db88b7bb47e071812ded +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bf3e726945ac12e12c66ee91cbed77bf6f738f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9087149eec0ea53b3569b6285728641bf8bd12d9bac155294f72ad5ddb44ba49 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c43c66db575503d11e3497685528dc6456251912 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a41caccec00ac567804255cf4f3295d94edea1f6f2c970f44b831de2ac70bdb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b5661e5beb3f7de306c5cdc788e9a4c93c4e15b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e380f667ead20a8167ed3eb8e66f60de0264abe0f449df1396a922a131cc29bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4889210b0875c4c0f22f3c04f1e91732ed0540c3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6bf1c69414f3c4dba3e0a29c6b6fd436f12519716b4d0017a1b33df7487a002 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea704d4063c8339668dc77e0be28bc8d74b220e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b958080123d189b9ca16e079c72fa0acc6cbeac62a27c7c53bf60901522aedf +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5683dd675ea4e4fe4af0712fc42c79c2a392149 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2bd58e05050653026b3b20367a9437aa63e053caf38e958f663ff11980f234e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4568af2b76101c93d463caddb348f9e9bbdd9ed2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1488dfee0cca53ab8cef52c77d45a75cecab0849d9110fada13bdf35b40217be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..836c94709d6c315003e02afdd8650dfcf14fcdd1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c6f36106cac2094e3959d7ca2e28ad07d9365ae2cd61366bac6173aa3e669e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c277d7cc64ef4a8f5faa6ba79704c49d26576f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968e126692de263993e33300e334749510c7eaa188cdeb7f0d3668995b8719cb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..121299be7117af4496c9c967845e621e546559e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e3361dacafc99a8c082b652a3af6691994d215db1a726cad7ec15a0cf8fcc95 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bbedf582e22eeb52e2a2ccf0282ea6ae48c185f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d61b3aaf6310cd8c4e6267b1a463065f425516f5c93e4237667337181648027b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f55baa3015b764afb6b8ca724c657c6f19b64676 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:796a093712a5adc08b06ba33ef6d11ba2a1bc8bb0c8389a868326a02dbd09e53 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a61aeae01419ef94fbd5dc55e8b60a683acc60c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8894882ecec073505e3d4f2d72906f4099b2ca6dc4c205c13e8edac5d8ec84e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65202e1da472011ac3a035a7e4a7084e263ab5b1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d67bf0d82cf6b70d11290560413a4b0570dd996ef3f6d6dd0e847a5b718ecfee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e346620298e4dc35b40684612660bd180d0cee78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e48918a7b4b929e63b3fbb53fc4889f1fb3a4698ce35b3afc5cdbea2f805adf1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..32b2f48f610fc19d94d5e998826ae4cb0181dd33 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea0bc9c6fe6affa64a35b974438fec330b90be9ffbcea26f9d559cc86f184f21 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6435becfc3ce3f9c42dbe7086a3f55c59a3b3f0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e57d790c022a2e848876c9fd9439d9ecc86e1a3324d3051212a30873da0bedce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e46fbcbe70993b702f4ca8c51cf8a51eb14280ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f9aed7a90d3d900e2bd359e2a7d0a19d229fc8f4b108e6b99d02c6f36aa777 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8fb58f99f39fc275b81857774a8826ada455f4d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e8ef3bf383946ddfb27c4761aaae5c57242813422813ba216fce30316652e5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..69bf487268a205e7de322d3bd1bfa2bf7e1d1589 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73521a158cb02f8666c65b3a0f216c3d1203af5c7bf138675ed344468217dc30 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7272579fc6c0e2a270d8860840ac2eff79bc5c0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c40fa6044a797849b0b9ad501b12836066d892d3a3c387fd0956f637019661e3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aed4f7b1e9ef7bff06a67a4bed2c390dec7cca9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7309d0d891561147fd91fcd79135c22cee45734f440047bd2fd9aaf549057794 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..404f1a1caf492b2c7e5410983487a46e84d65565 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217d3ec563e7a3c832730887c091e7920fec729f81dee46ef791d372ff2dbd78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f8c918253bcf68b08ed044faf16692a866d2d64 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b396981833b5ebe82e089982c2b1ba48bd6bc951db199230df4711b0225a16a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9a16da2d2df03651b0b73177e8062c692f0d899 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2973e4bed6adff05bb5319460de0ce734f80df7a96308c9613edc9ff33ecfede +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/lm_head/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0fc529c296c777e929ea5d0a18ac2c70d3d328d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9a187d695a82d08535ef8525a1f8bdca5c82335758e503de8b92ea87a0de9bc +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/lm_head/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d33648c33e2fe549db008283ba16489f4a5f24e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491a004e7f0d5c44aebe5f532d79db196266ce2385846df17eee2c6c27924ea4 +size 205955 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f03f4794b930d3769d3cad1efcdcd5a69f2588 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332a3b3accf5ecfeaf847196672c93e62f851c41292f3bff6ad17d1f336fb8bb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de8b62e231bef2f36049fbf54f65b3d04db49958 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17b7a9c3a1d66f7afd70125c4943849777e5765e5dc50fa50a03b22ea12afc92 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a97b1e9e6b431898005ca59d9507a0dce5c694c7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10351284157fc3e42ecc21cb7ea42e9dc2200e140203a109e7f40935c69e981e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c18211636a1d9ffbe4dd476d14158dbf5a0a035d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bacc63545f6d54c463b53f4d85597381109f533f7411b877b6725d56f555257 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee5ef86cb8765d7460219e4a287ea770727f062d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e6bd554e95588fa007e76aadd82b88482e1d36a740616f31a54d0fdbcc4901 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc69efbbe49f380f3c8f13cc4ad8a54d3c4ef021 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1301f2b771672f40eb19ddcfe3a67b1f9e68b55744888feba007195ccb93017 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d2dfa1b1d2a79bdaa60de0e2dd106489eec5e2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62ae5077fcb075fa532562f1004565175d56068892a54cc52b74d451bebafa19 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e7dce65a00b27feae638a68a9767e910bef9ff4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ed4b7055d76ea1e83e4473a002382157b23c15dc622b401fc10b6add0a68540 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d274c7697dbb6c57fb5a67cd199a182a1fe03bd9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6efa3f5c12a94829b580d113c8adeb605b839f2540a75717099ccf798276e0e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94e9f1e416c92f018c9db022d8c3992c5ad7d8f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59ca7208a70ac8742b357f3457c68415768cce3241a06a29adb017cafde7374d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dde21144090c6cd0c1fbea97d2e3e1fa4b80313 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc9cf7fec82b81a220867dadd8d1582ffd5ab3ad7b99e250325ab3c2d2d0a779 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca95f05e2acab9ef968d5983c11c22768091a4bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9834edfdba1f7f7ff4f2313a8a926da956136cd0bc3dabd8094bcf98c1fa59f1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9daa8086c801d018867390d1358526cdfccfd639 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72af1027500fc988149d79b3dc3cedfe468d23570e3a0965c2f64c44373895d6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..853f819c499514d26e8870927e9a1af82fb2349d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420d5d397b818c1ba43286ee038b0f77daac9c4349af9c241ebec32d0e0d91c9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b4b97f8415c91d8f892b7221287e82a3fcc3cc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f17e75f7632f5d307a5a3fd3f0673cbd347ba2b885fc1e20a2471427510b5a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb9e5fefef7f6d9e451d41a1b3049d94eab8dd4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c0a102026c5d32cce6bf296bd2a21e457fc2cd0e98f806a64a10367a5c76d9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f84c16612e9de18e4e81a33f9fc32818c7ce4a59 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34db1e178ad140166ecc3dd31390e3c2a3e7131da212eafbd3544365dfcda915 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30f2befe25ed207ea5f3750f647c068c4c19d5d3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaa1cedbdbba59be7f12cea6d7b00ddfbe4f78294277cb1eeef5a35a604e3f5a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f8705c9ce703fc0bd80dfb2217d50c255ee8115 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6928f8baefa798561407c58762cfbc40ca9d09558af672e1244da5d41e0aa33f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..896df415ee6f256f88c8ba5381cfc6eff12392c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7f816b6ed60eb3bab9e9fde3101cab0d6bd93531a97caa6a489d05f29b715f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9576c2f1343ffc5efccb3ac575b5e31a894825af --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5e2a279a7c3f5e14e2e31578137d0820481be30f95110315ee02290e707ebc6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5d1c21b3328217d27a0a53901213f4a1c8cdfaf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b4df66f5d9d34e955f45b209d878b7b56686f850d36ed16ca2d4f243f6dc5c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0a6dd24fba9de8b85a8e35d4da73b903225e9d1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee47ee5d344746ad3fb8e96f9153fb222b16d454a38e16e455eaab4eb2150a67 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbae09ab0ff9ba31559551a1e2f9fa99a53b927 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbbb31803937affce35843887fc1d31ad1c50e5a73ec796df4011435a1a0197 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be7af8d782391267029276fc68feaddd2ba0a127 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a32436d0cd7ebfaad37d12431a40adaea77f3401b47c0685927d01abaf0994da +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f66ccd54281af086b31f15359c26a56f368e709 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99b78108fa0196bbdd640ea9a617bd280a6c2f91f55bbf2e588b6bb2b016a77 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad3709a7d74b8b91a50847460362d6655045574 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b98ec50e517adb9d133f09623c85059e082a416e1a1e85b25e4a01c5dcc50d14 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec7cb86e4accb056215c0a430d27157fc1dbabd2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:317568d9b1f6fe62982c91b28a8dfbcc4f0d22d484d67737ef2016f506dd0fa9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e9af4583682258cf011af786095bc86e5a1d9a5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0082e48d4ccc983b6a518d85207f8ae6e611505e7bc28796a2fca4cf226b6b1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53268d0b244700a7c1d0edf8fcb8cc565936c93b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eecca6cb653914d9e100960bb8b9d1d7ccf7c25695224a98c4b9f915a1ef5085 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..861bd4efc718ac53a3dc0efa3d1ab380626c4e79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef0c5200ff19569bb5bfa99f3cae7da997645bd045f56c11cb7473f97974239d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f6f551d390d6836a22a53c33a9edcfda9551f72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c214b78ee5509c580a0f48dcf7f903bdabdcd00682c9765d00681f3048920b38 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cadc880d58b4cc423fcb43779541af1490d5bed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b95dba33ebf1203d5930b15bb5824c9fe06ef863132717c5676de0099238a53d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e5fb659747b84a08835fc3f137107e816ceff5e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:548d834b4cd709d587d87fc490c8dc7f1eabda3430f8cca5d2122ecabe6405e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9be89dd58d0ff4f35b103f828b2fade6da1b38d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d151d22685e510c9d71811717b9a655925c4ef8ffe1af33872cc66959da263 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c856b1efa558fa688196a8b09ce28e2f1532cc6d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:805c5906149647845c31340011b70755f079761cc521dda48e7293751ccd665a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4af92702b63d7752a2dc2df71e06498df34cba6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95370c1640b83edc5733dbbf13c6134c006bc93684627bb0bfc39a511d537b22 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd546388c754226002356d47e1be9a09def69893 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f51c82564f408d79d83a9d004fd977a6b2fcbd33f831dc266823ae787d009ce7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5cd8dd33d6333b51afc5997ada2da04f3193802 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8428849ec8319816de8806b46f83d0a8799124de262f04782e0b480d6d50dd2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9bcee3283bde6a3e0e5ded8f7cb1108579c05c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601b6c67f3c5298bffa12af0121461eff6d62621b40487387a7554fe09b5f4d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2db67e53def10edb20b7cabfeafb2fd73557def5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c70d229ab9237ac1de7659f3235323b7e824fb92b46269c44bcd165acafb06e8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b781c70d585267a6710e7e78d44c962e29a23db6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3304ad294506853ced12d8be7cde9ea6dbd391b19b65ecad8b9d738c4c7f80 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7953c212876e19008c325269fab8ba5bd5b32682 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463b603cc1e9b5840a6c398fbc7e2903da5a172d2a79a54d5219056bcead9191 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c80c6aaf3c26a861a4df822640325c5745728d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4792146250fb6524665a22adc2773ac1c856972c3214120acd8b5a1972c9bc6b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..adcfddaf958760809bbb63ee43734dc2b088f55d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d8063c90de9ddcd9e3202e9859be90564ae9b0c83522210cca6c7d4866fe725 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f014c94635e3b96461848930a1878109341f6b83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fffc3e0009612ba52135d256a2b31fd8b7a7ecc9cdc388523c8da6784cf7f19 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e15eaa0e0f59db7f73f60d6a5e2548f39e6dea9e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b628fb5f4cabd647cf93ae0e38535b124fb29a8a6aef66599f527debe51a05f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d5972e7216113b79f59513438a603097ae51f8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:965d05116f9130b581a4eb997ee46d105d4954b7abaf5fb846257415a92268ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfbdde22ea615871599fe2a425fb91a0dd32c4bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c937df2ae598125e2835d9b763df612ed21d2e4e2fdd57f7c13d3ac26659de7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e8a9cb4d61ff493c885ab691e40db19d137884a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8337515dabbcae2e7ae2d96d49c5dee29f6f6c41396a41e8599183abdf4d77 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb619ec026ea076ca84eca96de0624e3002f5bf0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0109c4a1572e8ce79cfe433c172cf4a93610359173dd53cd11f188818d251a8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2606b45e47fe84d513497411ccf88093ff906188 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af9a0279278fe97b25d54cdfd456e44fccbef8b3b0f30546418af115a2575be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1250d07532d8cb8d9c30d3ab657262364da058f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c69564d8763da29a0040657a05bb6e2b7350d2bf11a5674c1f23575e7aa8ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a04f60a4015c5840b478bcf3d33f62424274f09 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b89955b9a58f435a444a3d53681e1d72ea6937e9286a59d146a1cf07a26a9097 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d069c1b1d25ee04c2ecfff4d66a24ebf156c4db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63907b842e27ba2723f093580114d1cc789298865d1d06afc6a66ad16e5b549c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..26c5b837a83eb630567283324b73ce1a8e320c54 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75bb2554407b88c557a1e44a77ccfe0f1b6d81ceaa3fe58493df2126af5969f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c016aae6c6f1b5f372af6ae2ccc7c3f65cc2170 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8bf032778a5e0d517a25e10d33e669e00e45ee96c8c737db9ffd3e8d037d479 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d225178748066220f654a1d2419a4dcb948efc4a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e490b664f5e685b999cb9631313acee806144652272befda2f03918f78ce55d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..067be34d1da8937ab245c503fecb38ee513f8b0a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd828c590feff3231b3807acd8acc3f53f42a141ba79b23c4478a57df6aa079 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6856b4f7f8701284dc3763f4ec3a7122fc534628 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37322aa8abffdf5b688fe81d4cfc77b7e91550e5bbaf227859d583711a5f782b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09629e20c98618a6632ec6be0fd8a559dd5ad2ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d6af48964adde9ba5fbaf998e114b74feb03ee8886c47d3419b89065135e8e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89e30a593e1cc69af673885890a0a58b0d652e24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc1893834d604efe1e1da2c85de52a9d76561248cad1b7bd9e3786151ce71248 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a67a12b97003e27f38c091dbadb1bb36f63f7ec --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46be0e90d008db5627d42d8323e3becbc817ca56cfa8cd946500f3688215446b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb8c32ae8a67511527580922b0cf8ce1cf2b5731 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0640154d5eaa90a975efbc7f14dec601320891f53da81bdd32227271f04a70 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b10c569cd9b51960734ee7a5451a367de133938 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b8ddd0b432382f7a6e35c1b66da8f23aa4db1cfc371233f9d9c56c6428be714 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd6dd8859d5324ca102d92cc799788fcc29fd3c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:628ed848f58ebe5a8c6bf22321bfcd693a38531f660999ae5778a8d8dc395239 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b59b83af968fc4b6563dc5739abda49a490caa15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8fb028ccec83868d3a7297a4d23efff2d6b7182922292df2e30bb3a082c5c86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6e9f66e316816588f36033e45116b969f66ab7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f3abd509f66c6a6aa1d9af478d630c1b7d1d0fa8c9122d6828e6f08c454ddf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b0c1fe3c1c4c1dcd3dcc07a447829ae347265e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b9fd32ce65615fba3568cbe556e729c3914c908b4bdaf48605e64af372a5fce +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7e20a5f28708123ffecc244ee31febf6dce895 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1f4ab5160923e64068afeca9328b8ffd2480763a639f53881e48f7d76376757 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..032fa4a32a66e5ff9f4a82717d6fe9080d07ee2a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab59a1a24efb0887338b3d5bcfeed87841986c6c608a4ddd2ec5f33c11dd136 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee61daa1819a0035e18979a427755bf661b046d2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a98c0368417a0dce582858af3f2f229ce80aca596809b079ade89403f793e94 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54d7a9e0f528362dea0850cd7402d0912a5d88e6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5130a7c6dda16bbb26471a150095634c407b9c4abae11b4f6a34c407538c8178 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42182ca228594f8aabc301d7079b9d13e06bbc81 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb185330931e0bd99243eb5b22b74e186637e1aaa26a17e69c2e2452bdadec22 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b48bee6261bc515e184110728e25a7ec41a296e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5f772384f0ae200a10d8ced5f71697ca68178f208322004de3ce2ddc48e5372 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbaa90d5d6bcce5d2d9d778a4de2bdec9bc3bef9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d01461076249a5eaf7ef1a537ffbb50868c5df433d0d6147c52f248799ea2cef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..27a794cd90d9b2c4aabdc4d58d32b9cbd02e1352 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1d46f1d00415ea58993dcdb320b958d5e1e02646eea4f0decc63cf04b89231 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2ad94b5f56fbee6c76c01c29ec8ae1fe2c42d2b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62886577b4ea47eae52d6c6be24534c4bc5df4ed30e69259eee5679d91a476c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed8e55970cd4dd5bed2484ca0aa6fc7db68cfef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db75b83d571c64d2ad279ae62e58bf51a448efdd827940b562b9d05b99be224e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16a07c13646edbb97d16fb96b39958d7da30bcf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58998f0d8ec695436207328ad2ece198a3099aee49d2e90b573e187a23ffc20c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5764c9c5a3d15d8d6fadccb97b57c8331a89f24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa6e24f185edbdc3bba186df5e77f19c23fcdd2c620b790e06a273b504c05239 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5966280eea234ced8d52f3629e159703a6e5394b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e192e933344aff7e15f75e33af370508f2452fac473be7bf4dab09a6c7164ccf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f65aeeb57abfc48c1783d4c0428b6278749ce450 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6925e716ae18f9287f576d4bedeb0998baa39044a7b2f1b3e78ed8952374b254 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..690744e9c5ab0945634afae0ad7481e51494b1a9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413e5c6dcde8969dc1de0b2e1bc929da4e270e569e59ee4061b8cf784f38a887 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3647f239eb48e335bcc811d43378a2e45bdcef9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c163551607d59540b2e458dd40c5fdecddf7f20e631764c9b202e202c5904fcc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..414524e391231536ba521bd75c62005c2cf52279 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b468b2f356409144b8123e1827ab7d6e093305eacf7d8b6fd6248d7535597532 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..424854f7a807657006225a84f2ff79423a1071cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94326a56daf224ce39b2de47370cedb4a675f24cd800dbc5cc114ee273b56226 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2efb00d6cbd7a0e8dca2b646625703942292b965 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf23f2a5659a4e47f577f749a4495e6505b53eae91427c9cd9d4881c5cb9d43d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..66876231b8c17e2d223bf4eef350ad3f1a257e2c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff015e9b89f7edbde124b2a975a95b34a60bc7b93cec127d72b9148e09a421b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62eab611e136883a1355051ffd68caed4142dd11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9db19e15c3a4d17bb56e54096f3762b9d872ed3a02965323b876d4812b0e95c4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a608c8f43bbd479fb4bfc51cfdfb66415dece0bd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa005b7ec37c5c43bc18350136e713abb148b0a7f1b452b320bd1d7cb26b7e37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a570c4b6f3cc83b17822c990ccbf0c1d094f952 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f92607824c6f93b0942730985d21e12bc2cf3e18a8cb34e7e9ad7fb96555e26 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0dd8da8ec69ab7fd964f5f489936b0f5cf69cdc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4b2f5c08ca3c416c32ca5b20126e4305bf748893344ae48598f399944523b5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3aa8bdba98fa09f02cecff2478f7b53ff8f2de0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977e15d75eec5f1e036ca16e1403ff66249cd236f8a5919d4af4731796feb08a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1784fdebd996339a77b1f4e91d1fc3241d05d72e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8815811288ffa4b9ca6e5321677f2072da96ba643157648da142d84a109f2b0c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2343e26f9a7ca97f0aa0e4873132634389b1d5e5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e883c0eaee3c980426cba934c8f4c335d8a094bb64b4f4d24fc458e07952a243 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dabfb47a4280d8afc7867fb369a63c925a8081a3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb0f4099e5897d7244b8f07da82b62b534b47aa02bfac982c48bcd950d1a85d +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4211282379c222427f69c898a1cb2794768291a2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca373622688d828d744f80b4a0e0d708b809080c3aed5e96dc23bce500a4711e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c17af30f909a29b81a3782e042139fb31d286e91 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6046f583e6bae7600b816f32338ea46951d4733a4f211797a8edf6757144255e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc0849dc511858b32078e31ebf86a6e963b76bc3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3c569e27df9e7d543460ffc7fca6bf5ae35cc9166d1fc34dce66b1e7896c139 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89628c6e4c23c4bfebd872c65b1b24160b2d760f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b47ee2adaa63976670bcfdcae59ff6fafd5c591d6bfa9d75cb6b877b28ec3db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfcfe047b5066ff90a917e51ba607ef5fb4b68de --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52bb8ca2f08d17bc23265087a0a88eb5933efc728c4fa5d2c3af81d6139bc6e9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..891940616880522a36a082364263e823dde9c248 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d0fb6cd5c33c8c5756866accfd2e2df907f9b64cf013cb013163c13cdc04006 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..986c8800f7e781ba3fd27e545d58453a4dc0de76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350e5b5e7dacadcb8a18108f5e428d58901b627ff6ca3597c370ba09d660a639 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..80073f9eefbad53fcc2a673b1e2ec4c57e273536 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df23a25c5ce1d0ae1444c04d7f7adf5cf497639e7f59955e5369aa605c893f1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e7fcef8558b48de1d4aa76d1854e9db330f734f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e11918df49ad8b56f9d98d2205affcd188401564e9e4b555cebb302be762952 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9a7340d02e9822c9893b650123e0bbd123e5a30 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:906854b1b2eb7e73c54dcccc5d5ef4fa0a7d929d8861b6afe42da3ed678c726b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a11a3605122754b82cea8b998a756261752954 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebd2c21e01115a25b15fc44d0c1aa92d2e2d3271dd7ba90c802e8996a59ffea +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f86ad23d9753bfc4b42514283c5b57ad84dc463 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03642a05a5ae39e8742d2d30fa09e447dc297c38d1b34b6c3fb53aec2c822053 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f07eb224009f79088053adf85a424784a7772abc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9be766f76259b4ccd3c1543de6294f4e2c54921ab77a1d0bd614bcda48b4a10 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a0b46055e717ad101facb5471930ce1c1348ebd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d02bc38a92f468c43050041501b8e35d3c97e9abb0128987de10b74c8269a4c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f1f17ce7bbeea9b9d83bedc5dcba911549021b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2482f4e6971eb007de0cd91687285e0d10993fafb5db9c7d28d78c1427bad4b7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dbd7b72ec818e3a521026757cb7e7ed90d5de6a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a953ce154a7b5baeabee5ed8e0897488ad21d1e5cac565b47e9e19eb9ccf31b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f34082127bcef3fab30e8b574f1dcb57a2fea357 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4edad3873c12e1617f85dff0d87465a9a630cc34e9223823e0758fa1fa5bd74 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..786d7d58048b950a23a2aebe9aef9d7755a497b6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd574bfe7a77e8b11e296c8e54b8a3ef6c46209ee05705fc7e87e69c40a12fc9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a81663adecb3d54606ff739c13d811643f40879 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc8e12d66cac80034545106cfaabb679f24909b3b44794cd84fc1e15d026aba0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b6ad5b3a919cd7a8899fc10d73252deebb5538 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:139a753b873ed80457507778d83435abc6ca4a98dd78ae42f189d57e086531c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..275bee19d42f3c842dfd064d2fcce0aa0742ada8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b67d725baa73bada0ea97cb8de780f424ab1406e1512093fe48a3920b824a0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c20b205a3b149063ff6b12cc1d664208aad5ea01 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b554b20c32a39b1638f2cb440cab0cf64234d4eb10f17726399e71b61934de73 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53f62abf1200629c7533525a61eedd9e5aed220a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1c7566e3f155071ac6d2f128609c88674f862ca7599c9fa7b969ac154ce7c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b48b009044b256f8b3c96b98fafae7b281c5b5db --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:250bc6b6cb6cdfd2cb73bf3a62fc034cc7e3b575fc51e51f2c26a75e8f6e5cd7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf449c1d2241070f5f6eb0de68dbf8ca750ec00 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99deef755c2f36705f04f4e6c152aa52259eda03a033947c7aafeb72cf1842a0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1404891e14928716fe756925ccc3c8621d72eef --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b57c7196b517c0fc4b565a40c64c8234fe4866c3c1e59f1ccbfe9f4aef79abe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f30ed9004aae25c25b8c41d6d2f7fbeedd9a2bfe --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f7991e18c77d553d989a17a321bb712bdbfcb29e758e1f7830156658cf8966 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98cfba838f3a90428a12b35f3f42d0868a330d60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb199f42960499dd0181b98583adaafcafd24e8691e2c2a01752a98f9975a4f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa511d6ebc07db6f6ddcfcc90108f8d94b047374 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0548e0e613ec9e54d33ba771d09c709d8660f7d6eccb67922076454d208b6477 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1ed3e5e7ac375420ec47e524d658b888934712 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e6d29d12baf0e157dc4609efddbfbf3395d095c4e10c377d719d057d704953 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fcda0daf190b144ef0b96a2fd148a6226b4e740 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec8132e7ac720bef73fba13c0a34f0145dbe5aea84b125248620a2611281f8e0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca3b7bd087ea6d28b28389628d8588fe0895e311 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:835b1f2e03f39dcc86842a563b335edf24f7f88b8cc274a6978820ceb3176df3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f561341966eecc60b4ed83140d2a71628084104d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6c890914ccbd0d7d438f2810fd078a9c7bfc9243b5fb34d24544d32435c0ccc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b28fd616cd6c1d816d7fadb9616c0b1bf0f93f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798a32c71d79c91cc9197053c87ee1b185696cf7ff27b53de5768c87d805d241 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca650a7e0cd926ea0a9661ffb4df71a8775640d0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76da2eb2dd6036f06742663b8796206eb00e930a1f6c4d1ba6e83d218f387697 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ecd1e0578040370e10138cc4269c120e7c22562 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56fc4883f2d72c5b4108685981a1f7eb39328e6fac2acbb6cc44c33a3ba2cbc5 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6d71f9532efd2aa349fc9ce4ea785241ab19496 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff158c1ffbfd6883c95116021eb6f8fa2ab25b21bc9d54ef7e54f4502c84746 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a9243066eb5ab6553016e5483bf0e70ee0c335 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecd2b49f5a42777b834a25a791fb2ea51e1848fc7eadd770f625b4d226a7e931 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7ecb2187fb933adc80c978f57808a275e627b7f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:843249509f5f051a8a0199ddc5741f772025cd5ba188914e55f6d587f41c1522 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edecf6198e2220437bf900e2d1e71ce54cf63009 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:650fd2acd977d0e471b77835b022935f1343524a56f647d907890b9cd804a2c8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7384b98f8013c5d4cc91666d5f117dd631a42cd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82eaddb5e5c5658c381063a9166f2a4ff3c27d24502e5e31f6a4666466e1d937 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..798248fada7af80d0fcfaff25f648d2776115fd5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd7d1c8dd4cbcb5bee989caa6e1c5fb4afcf8aa7908ab790c554b29f457d0b36 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84171fdd0028550099928044829cb8ef087b2c4c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd19cdc997a85530bb1d888b0d881be9cd5775dd04fed9bc35a66dfe3c91138e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f5accaef91fad5c1634911841d224c8bcaa1cd2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf1be3635b8841e78b47ed3a4fa46c60d9b216e3ec39ee3dae5e32603296a3c0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9900ea848fb897230f92f94aac6ae1fa3141e606 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e6c5924dfb7c3dd13d93b9070943b984f032e17bd1b34a51b3a64211868e275 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4a9030889266c0057a4d1c2a9a8fda7531335c4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254e6c483e3bd4bb3f9cb868195893890cd377ffa7d09a6c6b44a8e61d0d990f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..28ea34f0f18a6d9d75f5a8352a612c6da6c5b215 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:886007ef5e500a24a91b99ceb65dd27e4098bc2d6f6c51225853ed1b4529dcbc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5621fc8ef887d5e2fc7d1d44df5b026307356c63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395db41a5e2ad4ab1673f5d1340b5ab4a6de41da2d914c85ac4b0512b109b8cc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f253159131ce4acc1b212945f6b0d17a68d4a590 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aab96194b3bcbf5dc3b9060b9f7ce8321209c89bd05bc3224358d9cf744f1667 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..687e5bba194f6b8d2e50dca6da341a77d2030d25 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b61015f48ce41d49522d69d0f7289063c7eea751f475a66dbd573f1c6ca510e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c98cebd102edbaffa745ac750aeb52d1445cb7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7478d64f56db0c5409edeaf43e958d9a3ac1e6dc618cc16047c1b25f541a66 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcb714627130754ba495dec466017705133a2d8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10298a5a860d06240554a975e62f329f0236e0d44d27b068134ac3abe2f3e175 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb50900860bebfe2b76639b0e9a8aeca986ec105 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61fc57a63ed130d1e462569e10f514fae2cf6d7a4935094ee44f79a77ecfb22d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8bcf92a4fd1662a78c8f1bf8fbb8454f28e63ea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf78cf64f196faafa1525b3b911116038272874c02d247f352f9963f8b9f4697 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb54aa69e3d847f1edd37a0a2b8e8eea4fa0476a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce5c526f57f3da3203d3461cbb1491391e25421236bbc5781b7f41a37f988b2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..adaa4cb4c0fb1cb607887033746561199d17a6b7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6e7479f014f3f4c3e8eaf4121b03e4276ebce312d2ac759e2229a5e07a1867c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bcce612e4d824170d897c7d5618781cfac5e080 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23083a7af7c6ce15317426b760f376ddd5fe8ba7e7b30145f71af5b33d343e6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bb7b79d1ab87aaa3146bd47368bdda83190f0ed --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f254a1355d9146355fc1d0f291ff63be9d35cd56d8488858008ee3a955b415c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..419ee3f13e2a5ef66cbc9afa3c6097d690445a62 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b90d19e642d0d92c46f49078d9c17c90525b204a9211bb96874ad7f1b054de +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad11b8bf377509ae8a7fc5cb4da3b2a5be57bae3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9560a5332bbc03254b63403f80e900930eeadb46e1be7b12db7aa9f1ec8671d6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f45bb3d102f23a4ccd71f28ac90458b121bc431 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ec602e228fdee94f4470cc9700380d8ecc28e6ef7c193b4640cf135b350ef29 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d65e4a0fc1a081877cc041a55f99ad773fee0554 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7412b733a57aaf65deeeffcfade3e9b3b6e48be69e3daf8053b61157164808 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..192de81466be1ede817d3b1f88de7743eb93ee04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb05c0e24faf94843a5c0a8d4f4f167ec1d97ad8574ef7333e67c0c7d2eba3f0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..766ec9cdfe91c4e063ffa5552cbb98bdfd2f1337 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb544da99672fe0c834196bbdd13aa859db0a7f07b07f1cf9378ca50b87180f7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfa7437b596f817d7b1ef0b30240074321c4733e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b89381ce4f876a650da525233d00a070a69d99027381e5032ad6a7c41f7abcc5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..043858ca667130222d8206ddd57220ef250b7602 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8ae7e7892c9de930d21eef6623c43c08115a2c9e13ef28c6add3e1398b1e7a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af7383b089731c6ac3da530f14d033c586bf87a7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042f673458de2e3456350c9d20424192ecf39826d379fe46128b3abbaa9babee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e786ab021c0b807ed79f4e613d97f65660ba78c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:777c580d340059ceecf90659bf43210ecbd9029c3c69016e676515f782cd8abc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba99ec2ba33b82c5284bed82f7e0e2b72a19b47 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff2e6fda183f8ae5b12b48f80a017ba488cf0e41c22192d816286e904f2f609 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0e1ee91f12505e29ac46fb62015363f46407f26 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1244fc0ddb1db5d756020b755b849917d7f29a82d020fb4e1646e4837a377eb0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..220600889d14f7dbbb1fbfc770b17c0d9745adaf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49717e71ca1bad235235287e09c16dbd56e64ced4a54f16fa403cbcf3989603f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a5fbca1d50f0864103d24b8f9a0dde5014b326d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a96d186c88d67cfd560b7ff83bd85340685e903592d878cf3174e8808225d27a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc616a934a33756436671a9cd6d4933dc868271a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b89f867f85e14d63fc9b6f683987da218e704a58028355755fbb6783a34369c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c785e45571d1c961d09f8c0558fc2c8fdf1ef53 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4503db766aca54ca65be9b45131cc8e00f4afa1efceeba36349f98c83dd80bd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eeff3ac8d02acdcdf0297716e435ebfa0d6d99d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a13ef3dd55d7be3fcc9fea0f74902db86c999eae432feafd2579769e75fbc66a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e9b625392e6df86233c6d0ec3a6ce86af280aa7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6186f5b3bba6144e7f9d3d6481497a3d8aa7e0cb5092811775093fc136bee29 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be894373004d71487bc46cd5a718e61d478c8d82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f99e05453542caef7c0fffa828359bc89fc894c97f91ae5c9fbaeeb00378239 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9273face9db9b69b19b98b1eb71621239d8939ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2863e037f5bd85957625d2567e76c1efe4d65d91044cd821691a2c84c2c99bb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d433fa7b2d961f4dbf2f93a116908ded0b7c6116 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6caae1ea7d8b02b54e9457d256a2c9eb550a1e88fd6963069d27d635fe0550b4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0de727add3baf34d50d617d4be6856cc55aecce3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59519882afd0741e3f6cbc2c9a7cbec2d471772e2fdf26a84507b2a4bdee76a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..313a9ab37743ca6f98f8e720fc7b77fd9383e0b0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac7d1828992b54f7618c22e41f74d63db67e599a27fe0adb1647f29b7145e02 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..19b2ec3832812a9bfff70366b3f11c793935ed1e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9be598d76e9a7a111a291a26dbf33fbd9b546670b3ca49a25648b5b15e7df656 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ebf9b60fdb4b573cc3580263ab97bb02317172b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9fcddd40cdd404c0f1040d0160f6587c06612fd39a05eb1fda456f6db313bf1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21eda43a671c7e8102c527ecf01a4b53c0039e87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37604852b4091b7e9b96e6edf6561977130fa3b69667e1b6b619ac19f05706a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45c4d1683bbec5f040408466b4de48d191c99f75 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e2148c0a2e24d9e9c817d6dc943c285d0d83e62e7c8701c15c3727a1f3ab303 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d414ec7e4b692c0a7947dad677329798e5cb84 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409db653847d944e531eaf48f8942332da339daa10d6667d57c64f302f77839d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7a15d1d5c7084c7e0e45c670d0d0ff42758eac --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eae3625fb0f9a94cf2d6acee1a3428e3bf947d06f24117668944c3638b8f1832 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca62cf85f58275d9b6c3a1fc49a804d361a6bcd9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df4448a6ddfa90b41693fbe1eb13b0b3d4d1e331a197ddad1d0a529368249d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7665000d2c65e9353f43dac859302f73d5cc6513 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1311c258ec5c24223e4e312da8d499de51832814cc90c15e711ad07c327bff4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f23165763b18bdac323459fb96e7985830a1a23a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479573f668a1dad43b4cb73e9c72c15115dc3d8fdd199f079d1a17a37fdd44f5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aacb54d7ab223e9120c75134fd6749d1cf40e62 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc54f7d55cfa0f40c40ef4096ddfa23abd5f046171111dd0232d72fd6071e2a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1451c2a6e0febc0b0a207039f7a2804a14b10a77 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a68f92963132ff761f12b9ba586a34a3f3c6085c7a6a44bdd36245c12787eaa +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7959eb923ebd7e0ff7a36a628d87f12c1f484b86 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3567bd5eebd7bfec8854d01d60d859475819d0f99880cedc457e969c05b83cb +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a276026e519756a073f8b42e6caea33864e189 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d98157bc02c5280bada9bc26ae7285a9b314f3215af34b273079aff68e76f88b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4eb9bf68271c697558e30c87648a885b5a0193f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f322ab366cac0f3a5bca5d44332aa1597ce1fc60d0ff8e35927ae315357c9a2c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e190337056b9cf332b21a6a23f42bb2a78949e57 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afd282bbc5039e4196d3711938d9f7f0c46718e9b0eac851abfbd10d6588f006 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d98fba45128e2512a0debfc19b1b593d058d4c24 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feeb924d6228c51d6f2eedd241f6cac50bd58a186d070f45c8f5bc60d43043c0 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b387b9e987f4c28b03467e17cbb3ec26b5f00a56 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fec3ed05199c0a0f855c5a00cdc13c813227159e7c079f27515e12c6a23bd6e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..577638e3a5a2f08a6f501b3dcac6bba08f072fe8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c441d5d18d5f96c42f44e7481f5fffc2a07244154e757632135911b3921fc0fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8635230f51d8422453e331540f2c7a10704b3e9f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c9d03f2ecf68ec072bd4b6e0c9ae0b6dbc1108fd369cafb3beb181d7f955cf +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f159727f51988e062f831e006c9ac7224a6a1635 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d59b398e6998d76684e4e607d298e980c5dfb8085853b975292ded7b6f4cd7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fbafe59c63ac2f7bd139382260ddcc199e3cd9a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9abd0fa04af72aae0af8e4f7cc5adad932f027f5254ece147c78cf70d05e157 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e33de178ae4aa3da1141982f709b7ce933a967f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c677430a5ef15fb460a6aa41c839c87241cc1fb07f51b9d199ec348f193967f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00602543475f0ba6b008f19bd1cb031da32cb271 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65609137864d0963265142dcf6d3f3697e760ca7ad5fd6622e3e0c40bb6281db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae4385969409445a3c10805ab2db4629f2e6835c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4194388cf969780c821d3db5fab7434566e8984d89fb84cd5a4be0ffd0c31a07 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db655d04766581b05027f796ae62592fc9d23c6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a7a622e41febb8af0b281a5c88e195b9719c3daddd2ce07d78e89f96dc913f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b7123c6c6674e81accde180963c19878f5ed78 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9add21738c4c31f8360ba2597bd2252221cd571cb5fb77f30c10b75fad81f1e2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d006336fd2cc7adae49db90da86f04a0013f34dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c5bf10e4f820d7043b3992ce996e5415b1d5c1d97188bdfde5652c805138d3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5981f1e5af4e704b094c9f36fcf099b02246bf04 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1959cb166f1cf13291ad10444771ee088b37debb5278807fdfd16d995a48473 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7878e7b05994fcb06e334c17fd2aab0074d829f5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a0d43ddb814fea537d36f1719ea9391f231b99dac3a03018efd81f4759d14d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a292ec028b4af59952059679a4883beae702194 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bdcc1bbb9234ea773420474ab32486d338827c36576280f9af57fd8c59d4a4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4201d7911e1bd642c08d3a5de25979c05416b737 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdae5c81a6c1e1ee812a6068a81c9211b6b763d296e962c5e425b1dec7c9b3f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1f04460998b178b23dddbf8f759d7190cf7405d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31fa65e5e95306f8cf50370c0fc8399a180b76dcbeb5eebf2365bb46d8d48cad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03e6420e943af560b703bc1fdc4b111141370b9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa92918c2524a88f0a254ef7990ce4c1332dd5ff198bf251682007b63a56e53b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cf7f418c59bc5e7a43172a7ce00dc4a27f061b5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c68e03ce5841e01352c85bbeee722a9f0e83c6806c52fb18bb5e3bca184435ee +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a89ad058e2927040ccdf776f02f1bdfc5c12c5b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c5f03c40f968f20038937d5acb34167d9f586fc35002cd2ea22eedba9de9b35 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec11f7293463adcde1a624d61c3932b0ac0bbcd3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf3a0b0e300a80d33987799771c056dee90bdc83428461ca361980dde63bbd9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..72434a2a941a1ebb536ad8c701ac98fab08039c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91d1b6dda0e49ad14de22451ccc225dd0b121e494e7a861430dd0488d10c4fd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c59f3faa5d8dcddbc08106ff769992e5af066b03 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308e9be435420dbe28a7161415dd23447266d38ae6aa6439ace60f852560e6cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed61b05203523eacb992a45dbe4d531760b27736 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c65544151c4be1609536ddcc52f443838d5f45fbcb187a27fb7112e37aaca18 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78cbb631f5fa94745643ce96909eabd2678de272 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7299fb5e35790dd5aa204b0ec9831f4141ac3bfd36005a529473fbe4a21a4e +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be7ca11f9b4a482152b8e98dac99c4e7c4b94d06 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0827ded3b7616990576b628410223db2dec151d1efc44a4a439f407f5e27d7d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d94f3288fe7f815ef44eee8d116f3a34603a7f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114af9e98a7c39aac6f0c8327c3e4cb87ccf767ee2ffb251b6219b9c3af6001f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6581bb600cef3b1341c6d8dbcdbf7b5b8fc7065 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0149b6f004cb91db49841b59fb41e0c72427f0517e6fc4a64e227f8458bdffb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b81dc04db6518fe3d2a7a718de8ecded7bcb0f0e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e215a68d7a2e251d441b514a1abb273cc28c95724ad52dc639eab448c84408b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3c6cd1b44aa132617f470ee230184efb9d0932 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0238232463dc51ca9f5a808e4a9cb00acfd7951809d011f338fe077c33db306 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7630113b7fa2fcc38ffcf0713a9682f2047d1e60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e438782e7acb52c00673993bfdc6da9ade1cdfc4a11b33c449cbe40fee4ca4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bb800ddb8f4898589f4ff9d2c9c4c8c60932a4e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ba1d8d8ea5427ea71a785e39b9f6c824331564349ceb944e7b2101332848ca +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f9c4b30831f42841722c46c0f4ee261f817d997 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf8b786cec140ec1d5732710fb638a52432f3e35977ba7b6a99a99919f53516 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d115b43b17a5682e246bdcc80f8998c72f8a7e4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2583077050bc4c78d9e5035a18fd665414a93a442bf2050107d9c5d50d5e7065 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bde93858e8dbe89b86274140ed20add50670481 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5c6df8b820abf78fe328fae4e062c085c407d827c9b379b7300e0f5a0733a46 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13cc2e72b8727b5279cc381031ea7281b37d537b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75194169e99e0b81224cab1636c0dfe897e3a61b2bec3f3c1dc370e7c6b4bc97 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e6d46f0a8bd97955d947419bcac3637779ac51 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8776521e5572a063f695d8b9cd090ece8af80658be57722f8b1b076fba97f23c +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfe039862b9a4466c7beb54fa19507ad12b52b1b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4f07d93f30cdf71741273fc67f61cee7d363676601175146c551d7b71e1e0d1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5012a6db2c0f281fad845f76a3f9acdb5217304a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cad797bc5db914d962d26192d4d015ef64c75c7e684a13bf553ad1e5d395f660 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f11b5c621af58c983f1a1e04913f7adadd1dc3fb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48752e86f40e5d05d66672adc2ddfaa9cbf4ffaa3db1a2b4b1c7f46f185fcad2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29affce344899a1561b0bf91d8d729de0d928610 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:508e5e12ee3570c1d3bdf67313005b1ad9c3ec44c5569c7ec2bc1c85bce748ae +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bface8aa5b91929c96b8da17c869b338541f783a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56ac75e312a0abf70f87d86d9b1a0d03295c4206177b10827158c2e1dc83022e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..380328d1b3789c467cdd84d09e7e67bf997f70b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c76d6c525a9951167d5e50bc9f4ba69bbab73740c33027c9eb3dc1560900a4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b31250240484d0fa26e15f152d139b5a762bc6c8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7709ef6b2838ae86ee97bb9e3e891e9c5745f370aae344c52bbb69a3ad85c2a2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00308ca76a04ca9b7c90d20938f3fba488a13ffa --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13485c6d94062402387eabba29758d18e2add8b664f0a54c985646f7c727b623 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e77f19f2608a64a0a4430313d020fbf35359f96 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa65ade54b716e323726511bbb431d41ea0653850426f73a260d12e5f8d392e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cb763601e8e1d42edfe30b12231fd413c46dbc0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02f07cf4754c436499ffa32073ec8111beece4637e4e3fda4174394a0bc2b049 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8bb1e65cf9e1bd531018c0362906ee7af244f69 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c6f3d33d639c6180c2b6e37e89e8f4feb2e7edf298a5051a9cc6650a2c4cbaa +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f13c347c1bea225f8f617ba90d04584164d64d16 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8408eb548b8ca2e5c3c5bc839fb9dba27c1928c600b5bbbe92247b6fc5076a3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d136edae4921467e6454ea71b3944256ede32a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f916acf927d98dd6d57cfa3ce920a566b85f74b7509eeadba5a07421e39279f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09cc605567934c9e60e38a9f9231bd4a4971bc76 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82456ac700aeb76dc028512c49507f36fa532803e2e9df059d865b88d69e11df +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea28c51fb1b737fb2c5e205d12c623445df7209 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3d33ec14c4cf9c01aa40b941922c996cd7b6854472a2886dc2299157d9595ad +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66abc54efd6beb9a5666f90a99c9a3e460eb6be5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f85ad9ef07ce5111c64be11c0e3ee83de8eb812f31479329b5a8e0e4683c4986 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c510b4f48b2d7ff3121579fadfea4045983d5454 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7172a37b614b34c1bdcef0c15a18e8da7d8737e7b711528c96356dabd14e2b3d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..285f568f9eb5a157369a54d3664a0815399ffc43 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4748812d4714e9e9acb4c9254e65ffe7c15d34ee3a0fd63bfa01ab47b4bce453 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ff73b902d44b29b87c224af96236e89172bf0bb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1790b8d29649b1438912ad7881a89dd87fb302fe69f32e506cf3fc1fc50009f6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76761ae7c9023b40b08569c5bc32458a31ff164f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea24e9601902dbcc0e17fe12b8ceacc5165baab0bd5c61303025595b469ecb53 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..914f1a3d418641f5e01f8f19a688673a95a52a9f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492650dfd47ec564de75464cabb18ba28fbb457a9fb7946f25bb570046abe790 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d8d942814cb4d145ce554429106c2ea5c93d3f9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b1786d68532e05d0a4e595149e9d8e87ab5d0817840337f6aa73486534cfbb1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bd4595b3b599ae07445d617b35fb6470f9be2fd --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02e5c0620365e39871fd3c76f9e9b1bfd2ead34b044920742abc0cd3d8249af +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ae81c0f641e70f91742c341f58c8e6e70ff4d11 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4009ab1543f59e44a513897981f9a394b43c7779ca8d2cf09766d9e0bc71ffe7 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6270b6f0c32b07b36493218fa31c19d7db73da54 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8605ff8ebc0939f253ede0d100b08cbe0b0a2fe52b1a798eeca2d4133ad54c58 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7946ce7be3e6b5bd8b4b22d4c18c2192852ba6b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:695f731f22bdb6a3a89a5718da9c7f33f2fe7890ea049eea6d5fa2c8f6672812 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f5bb9b6eb868d4559235323f50c7ffa7bf9f1c9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eb5b8cf5096a3c4e1d4424c9f83848863f2c328e1c5474d434b3399cba6484e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4a340fad437aaa5a8a4809f6406136456751237 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197510afed2e4f887e59b85b7e8b32bb79b1c788fff9dc9685dc06fe7aba0640 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57c5b41d965267a213972a55c440be82bd361fa6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84245026a0e500ffcf16f95dea46ec446f9372d1b01185ce318c7f54e04993b8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..195d3853ee6ba45bb866c42fc73c603733999fae --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c25ffac78cf14a74407195b27cd142af60a9a7167168cdf5ec2f14f6b764f5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfee1e71f2374b547c576c231fa3548a462988ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6e298abc1535d2599073facb2303aa7af9c8432fd4277f368481fd2905cb7e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15b4aa57903bbc97086d0b8b088194521d9f89f8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c20a45a8c565dbcd11c87bc53440a5716db40f70557d6c196b804419e05b9868 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bccb62b687c57f7ec9e4ba28f03581aa68c287b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba0ed65f74ba09b60ec5d6bbc9139dd74fe6963adb8dc702ac2a58439c0ffab7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76799e93459af72cd812961d4c0263425627328b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d62b81fe12162b9084b821a43c6d7105cb0cb30c36b52bb85af22c439bfe57 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8346814dcdc925ec5b65edc84f56128727ab5e60 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c37f6be354b7043fe2c0b3dc888fb31a73f74c9b2b11dc1708e2308e27bb6d6 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d93e500f7dddfed6a21f7ed68ff897f52d34e8cf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bff89739cc770bd4169396ccbc076e7b4e06a2c004ec1e17c71bb7a84abcdf5a +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbd85300c8ea92e649dd579a8ac15a927f67dda1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed68fd9270c8d03d68206c556a54bd4ce6d184abbc2866b8cee658586f8d9d2d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5966850617a97a10ff6d7f876607c4a6da4f620 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56856a46f1a9e105e7a5bd3204f81cdc4334c970b155259b6fa806906b274f1f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb5a24d6f5055fb44a41212ca29080c3e298aad8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088b016363ebbed84328ad0827536aee5d00ddbd2b07c50971950face345ea11 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34b6f1a41c7c8661566b2001d4aee2c9f53edd4b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:808eaf8c00a385cf4af25f38b919819c47720a7b7c4d353946879eeef36e0961 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e52c98ab93efdbeef8e80d56ea0b2e5ee98e61c2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ebf29d15d00dc2d6e1f33be14a99176d2d11e65b4bf50984d21dae7f1fb1d41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dd4a75f6ea7d7f4ba9af8a11da9126e761a6bbb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c62cb3eaced3f1f58958570594670d2beee4294ed38ffda2572aa2c87498e5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..850b49d9d9584cb90aecfcb47ba772996a605e27 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b567071da9f07448f8ddb0ba63067440a1cc6c869649f6ee1c425792d451fb52 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65656e796ee08fbd2d00670cd448d38b7433817f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a84abcb6f12f89f69916b244831eeca3ddcf8febf223f8e7822f9af004947e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83af8a28fdaf759378dfcb4f1d569d144f4eece4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f3fccbf9fbbbc9fd4189178e6b4a0955054a2b0f66ad72f71acc0d40e4191ff +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be6043f22cc2788c2dff2bce642fa377329a116a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e223111184a3973216c15e4234e6c47843d99756e387cc0db8ca89e905eb6819 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9ee06488dc02822bccab0e9cf02ea0af1879f49 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecba2d49f8dd1ff07e1d58840bf1e395946a2b6f2435b8cd6774f61948e715d3 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..402652e319ffa00ad6d5875b6ddd440b1c999461 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7219ca6b3c54daad6eaecfe45e3bdc5630767d72663e4d73412c2bb91684f397 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fae0008d1e20afe815d34c354d8cbe2e7f709a57 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d87ac67e872945b3ed11b74415f329245b7f82bf7d5534e120347b85f09fd58b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e02e34135abe57cedc5e3739945b31d88b616b3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a40987ab076cf5bb92b9e38b9c1662d738ec49826f340b0a90d4903fa7a920d0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfb611066614385e401fa3c6051c1a56767c31c0 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f59205c19d0d3058a54641921ac0237b1dfc96cf04ff471fb4a91ebe6b89f1ba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86af4dd69046b7fe62a3e6b18db0537c21fc6d55 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8124ea04ebd9147b787d8dec2bfcc6cda443b623186ec0ae4a33a369ed6c74 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..160e865caf854a706a0358f5355e50ab85426a12 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0848d42d1deeeb27d778b3abf53c67226348b6490d9fe1fb2189ee75e22adb6f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0b2b8c1068507e3cbc5f85c101102462e003782 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7efafecfbf3e42becd5c76d40d9a2c3a40243e17b9be5188acfdb02ab413aa78 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..896a62f274190d14a8b7bda91cc9756a2e0f9c9f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f8d58b0c3af9436fdf76d6ec71f3ca68d52116291ba077d7732e4a379333db +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d0d777a651de163b5e90dad1fd4ae0d09df2ba9 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c549387e785dae128e25f31ab43f78971aeb96fac61f9b51cc1e55fb133bb340 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3bcb2d05b0848649c4dc5d0245ea061055cd18a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133a2ef360657e085113f310c1f015387e211e04d43cf58042b366ccd583d366 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7aacbc242af8599abe1848b1eceb6e64a187443 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b2d0df6fa0c9f84c9560e6bdced9bc9b0ee2c3639bfbe24d824a8a64904e51c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71d4ab3c870cf838939611eadc56de92b9dbba40 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47865f0b94b87a54eb65203f2e3e8a9ed2a714dc445be0b1599868c2af74f552 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed3c3838e7bc8f610c17e29aa8945db82e0c1786 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6850db8cf488798a6719fe6e2b5d851532b20877dd238ea0a7a1385a0a5bb5e9 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ae82f42db4b6aafe369e4a25fc9e421d2c3f574 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70893b5c6752e2e23c714c05047d6b344baf77e73df8c4e8f62c22afb31baa44 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66478eb6652e6617a5468b65201c471f8d7dd2e8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce5a6b78ae381e9f6d75fe22e026e54ac66ba866f41bb407ef84dc5a96c5954 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce04e0edd64a88d06d53da3eba184168c292ba7a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed66bfa4152b9f1cb6d557686f2685cc3f8e30e7ce79043315cd7b3a16a5097d +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..485da938fef89724cf05bb28aacbb5e0f7a9dda1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b2bf9e120727f9d4a4891f0c27dfdf75bb6ef2f0e0271b011f81c7b723bf8c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c8217684f14a997e4cd6e5d70a2b7975e2f5e0b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5575fdf3bc9dfea5e3d8b25235903ca60bb1b66e60a26936901ce24db7ba5808 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b9b982930de46d587871b9b35ccf0f2f70f6130 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4744bbd657a2d20d6a3b461902f51be4b806708910f425a0eb9fb4b08cd9b153 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a6a8a0dcc4fcd60998d764a211d6758c583d849 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0565f7d942bffc592873d615169725bc2cad86a17676740f5d7e2fdfddc5157 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f5c65f7e07139cd781b7799e2a39a6813a20a30 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32afd414c287c20de4b6b218f8b9b5ac1feb4e9a728d9fcdff4e526f6fd12c4e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0184a890e3344905eaa369283179fb86d17abddf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef93e1f7b27dd462fb76f28a84811973fa538e35468e2e5032b0a50764aa87e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a33716f50c1a4aa8bcfb698603fb6ffe60bf0285 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0ed7e07e2790d4f63e4754223cf0b5cd5b45a64467ce5e218b3ac80bf175025 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f204bac11651be3a7c9a1123c3a911c3f9dd447 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c66d0e896a14fa3643a9034056604dfc1a020bef8ef0bceab48820b8059ec2 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05661947531f0765b5440a8135f07480c1f9ed1a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bc7f83d7a27d090485ddd51a9b524292893d009f4d5ceeb38bcb4da6848c764 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce4682946483317e86423c76a6d83fcd1cf90ba3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bd11c3b174049a0d80d214ec8447e0ac0609c7a702c1b83f32fae1a7a9f36d6 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba2f61321a2f94b4c4d4484c3162b6f9126a2fe6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f59f9916be5ad1db1a00c12110c30ae372de51d256f14283b70120687ec0d7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04014e41a301a44593fefa1675e978270ac07bde --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4642869065c1fe57e019f136bb14c0e514e9c15dda1f14b743fe42ae14ef6a9e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef393a8df718436e1016ee3a1d152694067e34ff --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3827f5483186e1c8474108121d430b8828bb1f8567e64cb053d478e29741d5bc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0074a1fc9651c65868d8d1988b1ca0083b25d85 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b2ba0eac68d9424b80a1d93c92fdf5778a8655facfb2b72f61cd260e491b4b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..726d4498e939c0f537e5c74eaf33b67a75b7452e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c33a643cbaf1ac4e05186e0151981ccf58b558a34da1d533c2d15958ab77e41 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc0750098b46f326eaab68b0a5cb0f069048c79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba7fbdd6bf35c401581f7bbac108c43f324f9978bd9f09391a945bcd84c3edc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..557a84c910e06ef22438eb8ee662386501c03c1e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42d1d0d50c600bece292c97761fdbc75dca7c1c039e646bd9e1b5e5cea4bebd4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11081cd1920e4d8f3756b183d5588bbf1e6a16cb --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32a940fab0412df25f38dda1ff71a274aaf337a3a21a6a444dc7cd9f80133c1e +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e20a68f7902fd3c542c10b81718fc9eae3550c1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3779db591a81221c5ab39149fa3fe4e100f62f4007c8af012adfa1293c25ce1c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b46c87cbdf4b80cf982e0c243d6b5d828c682f4 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b28e6a7c481ac7ffee9f60b93561970613cab724184630d5140c0e87e69004 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a24716bf873b083efad1e0d7404dc3d7309a216d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eaa7f5c5575cfffbd8cc40bc187c339d897c5e63a7759be2e7e6fffd1eb2d56 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b054d3ee52b99c37907e96e05f26f97424cecccf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8604067de33611c1652370bd8e1fb392ee7bd89a5c018737427e5d8cd5af1c7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba4d78e489e1e4cad13c9247f833d94647bc63a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f2c3efcd2c88af7331972c60bbcbbddf0a35796e328fef8ecbacc1e95864540 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..492ab33eef3554d4de294c32a105da53b30cb60c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da76baac9799212ed0715cd5cda25ff643e0bd9954ed95a4b00f7d2bfaf72d86 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd752ffdddd7150aa1a134403cf6f770f7d0df02 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcabc7bb3df4930334837ea0a8841df4dc87ce2438fa115f7f404f7525df92da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db5e3419a23fe2248c04671df821ae16a0695e79 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720ff66da073988ff5ea43b742ae7c0283d88a3483aa17f5c748aa049a390bbc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62aaa7cc2283c6ecad0382d1416549106050128f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63d0e019e4a93b588eea0289cc34abdea46e141217a33501fa083d03dfcc9d69 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8a3b9ffe776db652cdb18f55924ed86fa03ff87 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9dea9d2946d06a47cc5508ebb37e8900dea0c89eabe47ca7a7513e960811eac +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71b65ae96f9e44101d6e2a8e87b006dbd49a8e1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4efde2a05659f472bbf1ab54c6e51fb23ce56d646dfee4f63ab2ecbb13c1895 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a93688d6a37f63675ac5c9086b24d39c8181837 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd30260105b2dab29649f2c60f9bb65116f8716c642a0439782e983987dc6e28 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97d22ff6a8e99f0cdda6fdca6557b1beeb893b15 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e9a01f2c716b4bf11f143dbf0fc95a47dd925bd19beb77fcbd734ad57b51e7b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7906af4330c5404effac0a7de2fc511702f05569 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6a130e65c8051f2d00e9f1a928e57fcfdf4fea2a1d6f3b7c44f42b4f09f044b +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29f3ecf9e8b39d72701d41c3e7ee7dd447cf75bf --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b09f093a9b93cebeba78c9d93d1dc154a043ee6ecb987abccb52b8a12bf4cc +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ffdacfc4a2ed755700b0bb92d106f9915746397 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b72bc0fb0ff167acfc83784e594f859dd304ea47dd10956271ca8e0ec0b82df7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..375ce93b320cf75209547f87f35b44e98dc28cba --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bba5cb02bf0a84fdb44caa4c447cf703b622886820b955da8858ef8ef139986 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8476ab6eada1f02949ca10e771e8d5bc2c5bb39e --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5954a7b5a0bb7d071919d093d0eee31b20a95d1bde0f27d94cc97a8be7e7c63 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccaf0ee45eed90126897c11330ce92235b468c6f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0a771efd192d776410190e0a2802903851af45f917c8c91d3c83bfc6599862 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..39bf24cf43fc5c09cb9e96ff306c1555881450e3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d856ee4b02dd3830124e260e2fde159d9a1331f0a3253898c4cd39766cb3d0a +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf6edcf0e35f23aecafa183f8a752e4704f89947 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db0054ea2cdc9167257314495ad85f864a01d515266656dd414a5740b56275c5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..944f4ed15c54eeb0d07f5aec07d1f673c61d7832 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99a4ee18e1e15caeae375983782e6c33de76c7a88445c62a605c2485ac9ad09c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b47bebaa3e31bd3a952374423eecd9f7e160675 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03ff447f06d504ebf42bfd027ef4d3d7e2843b7c61e286a00b2ceaf2d1d662fc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7ea36ef4c3ef08e5e456b4c774b07b6c4f477a6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0bbe2fdc8583ee00d7ace72d20302c985da9164ac4bee97b7600327ee9b95f8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57465690f1338230d0cc1b59960f78f222a8c271 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f26a865c456f9428287256d7e2798e00a423b44faac82ac8a8de0efaae273c68 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff53484d0f26541bdaa3fe1697ba144a3c4394f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16ccd14e462c275d348190d031c96579be48ce1ae875e16f5c10689cec5b568 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a832e6d7dd9ce9d9e8b85703e1beecda8f5288 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6c2675e0de78ac41f24f9c03ce9652fb092b340ba553c2edc1754660731b12 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b9b713cdf5d0b4f9547918914a53521c55d8053 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9db28ec7f63ae43b88b8376718537c16c8fc923172ee5d432088771e0dbff06 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d740c36ed9698c5ece74edca412ff0cf4ec68ca --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81059f5c056c71e15154abd2ab9cc679c0a9c80e7e6286c128826b91a9472be +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e33785db77ba47c623a03945098058b1eddc230 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35617456eef083fb7f1f239c3f5b1627e87ea519668043fe78697cdedc485596 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a9c37559decb582ec0acea3314f871ab4cc5fc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d529f68ffb4d0d1247e3ff258b62b0761392a613c00dcb6622e5d8cb34d4756 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57df439882c9b1fced3b8197bd8a81ecd5851f07 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4c85a6547c89de643158563ef9cda88aa6e4e36f9cfd0cd863ac245f3eac3da +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3252ea4499944cd3737fe5715a0ba73f5aae4628 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adbe7b745d71e181f5a69041c1c1b8649678280aecf29b7bc45e48487417edc7 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..339cf819ef030ac528bd398ba853522dbe74d274 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53667cd2d7424beb6051d4d40856f470aeaa30c5af6f33689604a79b4898f9cd +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa85ae7abc4820d6b3ee0c0ff23bd051d82f7e83 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0468c5f56b0333eac6d0efd543b5d0017fb35b75582289a15e5892375ab19bbc +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4f68a9c79bf9d81a8c4aa23d33e38472a157cea --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83327c706b37b8493f027a9701eaabae42b43fbe6a2da6e152adab7270cd30fe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92cde89b4ca7b6af4325f5bf5187991e7eae8086 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29dc32c10baabf7a8eb0f8725805966f53168c888375f9842a47306f5afd1378 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..377a1015331cb4ae7fcfc99b6e46ef22460126ad --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bca07e088f31a24ad4b957057a361953730ab0d00a8c5e701642304da4303eb +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d21dd7952ea3d78e958e039caa980c4cdc1d46d8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0c813c087519db66c793647af5ab04f8362e13177deaffaacd4c1681f5ab84 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8138c900cc62aa199dec6858eb3581d9234b0bf5 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85a6d9001c3e5469be3ce7fe0a6028601434ad3a11eb45756dfc152f729539f2 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bec9785400ebf52fc01105e00db39e3a5f2d545 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4755dc991c2dd13e7466173553901145ad188152e41c6fd3eb5828d2b5379c88 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c88953a4e968aadd9a0067628a4a52d43f3b4dc --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af6f0415d17e2f484b548ab87ca5f1af6407510e0749cbb352d42c55cb13367c +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72cdf4d2918fb3619ae36b2878573ef64f7b1e3c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb773d5c560c7d348d87177ed1338660ad3ac2520261e1ded5f8c687e474304 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5ff1b0842a4c8408bd5825c5c803c389e2f1660 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c04c8907097fd5013372f6c376558ace10a4893b63ed69cf2bbd1912880cbc0 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..785a346df33573eb1caecece3125aaa5aa20d537 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8f7e62b15e516ddcc054ff9b482b547842b73003f2c57f88ba1145613311f31 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..647a549443dd139ae28801f450de752ffd7a7347 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd4eaf869bf85309665c70d9a6ac3bab32bfd59fd2ee8c518433468c97decfe +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..383d489f0a706016ad0bf62886ede555468c43ce --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6891fd224a19c37f62d237718d27f553576df5029ebfd478f8142327e690b37 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be2d1eae8aedd30a405df6f452fa631f77d44cb7 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:325c226d7ccf9fcf90cb5a91b27fe5934f11df2af3808b536b211d25bf5b1bba +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd05746eeb735024dde15af044e16251fe70f430 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5b6e9e8de976b5f0023d862c56f1b24cfdf454eded87bda85833f2062eb427b +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..115639b42612f01bad84001d1e02f900aad1126d --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65579dc03aaad9e3d794516eb3de7498cbd93875722c6f6423f20eb2fac979fd +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9852c475380f5716c2f122f90c05fc2a38de1b9a --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d918db23b20e4bb3af70e7502b8d648f116921542098fb62cc11829b5ef72099 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c572cceb75a96fcdc4289fb4db07561f62531d72 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e1ebf34984da8458f36425059b8d7d042d2089c9a36b05a1a3bc4891002424 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de3bd12e809dbc70630e1786edb17d944631dc82 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1dcd93042a8807f9b0b0586d3fe951636fdfe87ec62b8877c1a2f9e3f00006 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13f3b5eeae181506dc10b56b5ee103c06910aac8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e333888fd276b8a3d5e02d927bbca28423e44f27a4d2616d105e692eaedd4da4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce074521d49c98425f382392c53cbd5bf672f120 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df91adbe1c0107c5bf3775f325dff81c1eb6d92c19335410d577499dfa433bb3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b671e7ee92b37af358760c784e1f8df8ab2d215 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2657818e76e31b67dbd557cef5ffeac1efcba65449730a0075e27208dee504 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5325a8fab936cb47bd57fcbd4e6061b353e9747b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f396f05c0937b7e7653e4b8152d0ab445cd595b43e1a04ed4a5fb889f3bebef +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a4f50d92928735ab7c96977914527a91c6c3f8 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd06af34843b278e277730f5a876b6a21b49c6bb4a68b0cce2da567ca9dfeca9 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a59b524aac541a46a57be75cfb9eb0a544be98 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d54b106a32af5937c6c83c787a480669924c05e2b188222fdbedb174eaf10e01 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f9bf898c322eae214e10c633376d0be3b392eda --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65466898a2fe6fa636e2d38c8c7190002895f519def20d3390a41e5f27c078a5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b587daaad8dc31c18300ed513ad744375dd3e513 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08753b7a5612b2e0532989e9b4bae37651844439f04a9ab388f5fdf667cf69e4 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d8cbca91a0952e4d0403cb12aaab606aae2dbe1 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad744ccac975773b120380e0641279acb9625027d05137cd41b6b50e215eaf79 +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..51202ba3bfbc0ddc9618a0ed48c7b75aa5ca7a8b --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5368b241acaaeb0f7e1a4fe6acb37936235052546cfab0067960276f6155b3ea +size 42115 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba7376064255100b5a6bdb2549e52931c7babaf6 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3744bb473fbbdd92335f02d08026c0fc50e7cf79a96bd65ae07b5b159e31a6e1 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90cee4c192944534a8aad0960c9096434cc3ede2 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d0a343920ab616788cdfe15ed321cb94e87f75a58c9a131f6ff8070dcc5347f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b725141c625706d7bde279a35b6ae92815dd0b63 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ae7f9ce863286f0437cd02a4bc903663bc164ef3bffd1dc0d1b1ad29ce614f +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae9c266161c503d5b3de472fac6d6615e94ad23f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8fbdac80794014d5921c62d51909e1ce2c7131eeca20e48e975bd7babf9ee5 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f04da3a073cca4764c85516916b2ba40bb63a931 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec7f5b8eb124b28fa9f2f2016e283f800e67fc6349ecb9e8e5f2c0ffe4dfbde +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1410940417818398a85134e99a5e63cbb5aceb29 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c3ca32ed2a221f70a564bdc5c819e0c395a99dd6e0ad5b6275c807d699efb8 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3cc2f7c21587d6054abb70ab12c9218dcd98872 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e24e85ca7a690c2b893755e13e549207281b9b5d8c47556c5a5192009cff2f3 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de45ec6a8767ac5b21ea08af85a7997b2193e40c --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a760a179488b2753e89bb18a306bd4dffef40ed8a6e385d41a73f471fd64865 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0763422249ab33057d725162a829cba1dc0413f3 --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe0fe52ccaf3ceb2053d744d024c3a62cd45bd821e0857edbe955fd090c4e42 +size 11395 diff --git a/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e949b84d5b8369ce5acd7a7991e3c490ccc6e6f --- /dev/null +++ b/params/phi/4/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07f86084c9ebfa459e4f28061070ef72dc8eeca0ee690f9bdf4e356186c08082 +size 11395