diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0860700c8a1555207e3a7e8190f48308ce3f9f83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc8c020b8a59667dc507383ecc971e8a09456ae06b23af7318338ac9c03f584 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49b7a09ac561330efc46e2e959b0a0c6d6f435ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51887e172bb769253c863cbf039d451544439504f9a49f65c467046fbd0e9051 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c2c04157249d8ae6996162d6b0ad775a34e1af2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162d6789a0f430f424b8866ed145278db44de768846a3caccf87e64381bb5c87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edc0e630bd93c0d1eb863ee92b51b98a4cb7798f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5068f6652161156e44e25765280f61029fba08f262c36392577b40de8d1b65 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8d7f2d1cff3ce4046153d7c24730c8a4fd7c9d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ac5db9e68673b40210cc998accad8906f911fbf56e568f1cbb81169c3a5527 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e6e7295c8a5ed0add97151bcfbc39d7af5a1b7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06528111dd68563556699267115c31b5bcc8c53272dd3795b9ad7d6b6adfc591 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5c32c6b928b600bac5e61eb45b4c985be19fcf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25a9827a57910ec6af85c9831a517c7117040d6f25a0ad89bf7781aff8d6d0b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bc8416b9b845e057a3c1629d2f19a4f46a71564 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a2b5e64314385c8389ef4bc57959ea4c79d079a3e231850e69383eab4ffdfe +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce7ffc8921bcdea430f9bd231f24a177dfefe6a4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:940b7b61b148d7c2f90d9b5280a7536a81b989ade5e51c08f1c53311ca79e01f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1c30f0baf1f6895c40656cacc56c60f70f5ff11 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c02587240e4b3db478c12dd99cfe92b63edd9ac8034bebb93da3f28ecfc7067 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..938e8788e5c1495dd0a5776ee194a252342498c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a888c4efabd0eb92f6857d4f60b53ddae2d25bee77a01362a251ad9cffef51a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..557c495932a3d92b046b4a4f16c256ff390ab5ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a4bb8d2057261349d7f433f92922369b528d073153350c03347aa7f7057f3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba0e18fec9f78266cfb6ca16e9ea1d9be11a969 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27f161a8f21697315db8b59aebe405f9a63c2847b203ea68165c691858df6722 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1232634b3d79516ba3abfc7af56facfa5da16337 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7fa0e84c0342baa592f050f36e19a56ece9d901f54f4bbc8b7e25dd1ebd8a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61b183d7fa83a5ae5eacedea3d67caf9fc3988d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1e80d126e0979bf04348fa0a93617763ccaf4d8d68e5268ac316afc946151ea +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2793aaf5322cd5433f537fbf4a6ca808290aa95b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b18f8d463bf74863b74b57bbe8826641ef5d6923927a5f07ee85a53e9235fc1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..354d53f7d15c5137092d24ab22a5875fdcf620d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f204c42b55bf8fc9f1d08200ac1478f643e42d1ce556f655bcdb7ff9de1a23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44b07e88645594fcd38845ed0c3863dcda54f2a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc370b876f8e0d7f53794ad2ee7d8f928567470108e1fcaf8e676c56a69dc27a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6d1e3fea93f88a8334b9f755b30d9071e45a0eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae668f0c48fc4397eee964686ba23f956ed8195788a3e2cb25b6428c42da5cd5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a64ebb74e84b523ae33e04485e0902f3f358389c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8d31d441e0255bd502e4ff7877c774bf76c8763cf1749791e56d30fa69e363a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a070a303de46c19510c08ad7dc16efc02db3238 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8157c56b1bb2dfe34a24cd3267ded41945105d5b3966288fb794bcc57744663e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b626e92fbc3761b64d17f30873ba60b283590a3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d8ccb42e4f5e5c0e0d74747226dd6c593900c48c534b03a837ba47935a2195a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfd268b9eab30b482af32209b6bcc1810d30c4de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdcf32fa9ac9b4de36a7cda04c28607b57a603da3aaa282b2ba274218f07e551 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac66d4a79fb177bd8679da6219484b3296d72a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab7a42890d72028aff4e1379a4b6b8b40d1759ddc4157b0069e8fac7c498397 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b90e26db14159b3ed426deedc7c84ca3822291e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6efadef3ad7a97026f0b8dde7ea02edf94868d15932a25f3ca863cc1f877441 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e34b77f0963c6be67ecf7e208a205f7ffaa5e8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d46ff0a6b4a4156b348c65199510af1c387e9dcd768ea9caf18be74c44819b74 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5775fc6b310bf5bb2e860378523245d6e97fc1d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565ddc158c9429d8b79ebf298b3f057998c96441bafd7215dfb89e6d38d7fcfc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17295107d89d09bc0efc090fb6375dfcd7d468a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c088503e13e603eda3209c2302b67b5962e9f53568d6a0e15e88d9bc6d4709d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0981c579daaa5df315c7177cb7edd0e70793b05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62f986fe6ca6bb2dfccd873250962ff0dd9e4dd26ff8e54af0683904aefeed0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c48a664e2f0a011f96dea166fa390f970500f3f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fed23f44a9326584880b68357cca06637ae8019710f7dba97d40a611c78b893 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..369ff462ba3019d845f2c0f14f790b7d58876e54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae893cca0d63c977c27907c6f662748c904486c441a22401ec6f43478504efe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..300e459ffe1187b0d3efc7305e8bc5281f1cb8e1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c9a25388953d710f75ddab7902edef6c5e320b178d2597ecc8bf0493a66e19e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caec305f35f0a0b48ef000722fa488e886262070 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32fae3b183d50c8e6a8d95b698336ddfa68c3aae48ffa49af56d8707c2ac0e69 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..383e21d7829e87ab3f9224414c71b7c3b20e6707 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e66cbd942f043e9e25c5be7dca8e014570ef9e657e1010d7b0b89300f63e4f35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2fa071e34a2e90c2c716652a5878fda15a1df36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3921218484bc9b65a201415045a88c7bea582f40cd0b2e2d8457a5b7ead7d9ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f98b8400287b798aa05468f843e5f000e84db9b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e910852a76551dc0516f0ac497caed04ced79ee6f800354d55e61e01cbd6d3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b18795b2ce7ce224cbd7c8ed3a04f85c4e92572 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b54f9fd729c025dc64654099a95c8ea448ebb06682738cfe66985d8eb844e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc56fa0f1c479613d72bd10aea605662593d6338 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d90f22be49d541c861239a7ff59601352f46a38d69d6f5a2a4c3281723741220 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7685c34f9ca3b5332f37af38e77d68afd318d2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3081943fbe368afea2c1c40abe32ed67dba49a45be3cbe1f06ecded5f4bf034 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b576d429b903757bd85a596f335e83ef9fa9258c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef6e196c6b6f53d590c42341342497f8b79303fc9ddd0e8bc7dbfede51c4bc18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d7301b502da1bfcada50ca6b6142b734578fe75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:676b77c7ad464edbf3d7eb29c4580604ff59e5dd92adf6a09fe2acca28da24ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e49de4958174df3b0ab93c7250c9652293482077 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d05b2acd2bb360d688b1ced51e66b873a64e58204da1ad4dc42d06f51d26549 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d2d6f1271bf1b628589be9ca8dc26b690585b7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66b2991e62ea50b5e22233f4c73a9d10e614da5091e72ff44dd93e5e330f3f92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9953a2bba8156b12507e9a7223705cddd6508dae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8263bd91153fce613d81e9b9b0b1504269724e592a7b008d47bd53ecf0614450 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0281c0b96a14d3e73dd4b7ce32cc89526fafddc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02269316b781890db3d50fd6bacf46c9f1f95cfb6e0cfee4e96722a86394b526 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff4dd86ce14d85df2b2b341b9220eed6c1cb64ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a2857396956f818eb2c26a7e4c2b0ec5e07626553ff00c83e58e8486ffa9464 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9c463b33452ecc3c6b0cc645f8110324e69577 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:174dde2409b1851b4acb5e7a688b94792dfdf90aa590f390b9bdf9f65fcc5f63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42499bf77be7a0984b0498459ced6f6ec88e2533 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801117c07ad84493ef5e652ebae30c126405e2b275d06f70d2227cb338cfa0db +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..586e7adb3daf77f54b1cea475726fba7e5e74dc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f3066fbe0cc44bb89e94e89885e380ce76029dc4479bd21d01b78c6266241ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d17e0df47c72924fa80c9eb012ebee30a03220 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e23f5dd4631062aa786915e27a5d43bdf59b8c427b477b07217460ee730b1c76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c012a9f1f20212396efa36748c681a3c773d757 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a754ea65e1a9e5e22a382c5d7589002ba81065dec90f0f5dd960ab0bf4ebf94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82beeddb5e6219efa2860636a266afb375c345a5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f865e53370fe22ea85c8615ac662511e3169d2c644c9181434fea402df9a47d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f4950c9a1fd020a8acd3cd2bd702650ef52ea9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46bb2ef04a5fc1b678298143383f1cfd0980b2a7c1f5900e9d1563d602516073 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d6f264a40d749dfb726c8e8225ca717f3263c42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e64ab2da20ecdaf86a09cb9b1895cc4435fa5a9e87e746e07d3b4d24fd16605 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..80f23ba476ece295fdb8d0bb41326aeabf4f9877 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8be279fb8ff719da8ae9f56cb7eff7b536ee75edf9bcb9453a446f7257cfd18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09cb685733b770218ca33a07c07356068139931 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d64af2d6b6acdd5491aea4b69dd5b7897af32bba527b4ea0670b9c8f56b66fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4722367d602a43326ffd8c9f57fe12e6dab63998 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93884486dec6271f36be384f81abfbf4f17103a125795166c4e92930012fdd18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c45ce6096a36c052d45daae7b340cf91e7b132c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8891489206a19c19336085d1c691a82e8f9160aa5247855e3f2ae1513346c24 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e86e3237bdd38e89eac2ba5d0c0ac39daa0feca2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a46dea876adc9619de9c130d534d3ad9919cb9cf42548bbb1487dbbfb9125e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a93304a993992552e63835021e7ecc1c214c5484 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:724dc4abd865417cdc80f2fe32fab2c132ac1ffa6c15693df14c47b1be508121 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e231f3d88a06817aca6939b5aca585bc88c4c9c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ae491b73d1e6cff151acba55891863ca2a4cba656965539fa76bd7f4d772fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df877df50bf6d1485619614ab4f25233ab84e020 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8255939b14d722e98ed5de5a6800769daebd241231a66eb0ec33cd853f457467 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a425034d6fee95f283391c9098660db8c1bb0748 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95765614fab6c6f2372a7bae47bc936f291b8a2f00d6b9e469c98d9357565288 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5fa102b4c5ff3f6efa38583d3ef47fc521e3b49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dafaf29ce2199f32f6db5dbdf1cf995c1692b06b79eb5cc12fc8af14d125273 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dfc833a89169fb82edfe4636b511e8b2638455c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2b9adc52cde43a52d06a133c18b5c3b631e63ff1405114ba9c64088bf419390 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde282e79cf89ff4ce8355a21163b7f98c4a7284 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1248c5b79c529bb1dc39ff49e7774d4335494ed0e88391a50cba845f5e3df669 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0080cd2ce7e3bad81f5cddf5093ae4ffd41289e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a9d2bd079829f11e8d539177aae8649430937b2170691bde0ac8f561f4610a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44002a4a5e989fa3fa3afa8498586f43e984861d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d4dd41f0c9d0ef2c601162f41c3caadc696506ce1b49f5b92961894aaee12a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..267a88f0a7622b40f21ba4f596e6e26eac55b2fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ffe2043229ccd6e61fc6692b61280c67fc0ff5a799df5688d7e98623840072 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5951ffae73c61adfaade99f85329511d3476680 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff73ea2a81034716b5986a3f62d26fd81cc508f4dc5816d5a315dfe6711557da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..582ab66b78cfb6228bcfd9563451a0312e6fce6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdc761b99b3a4e9aac78801e0f89b6eb9f7a34b65b8d45c53b9fd308251b0736 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1509e17700b834d38634f18bf2c1abdcbbd4407e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc38c4764406a4b4dc7e97daa2449fac048724ac56feecc2400557f336fe35d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd13d451b8d9f314d6c69ad107ac16f07831d139 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b8bbf203494270c391099166398fe82bb6987c20b4dde6cf5fda0ae3e82adf2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd6a1b8096674dc470fb19885ba96d26c9ce12b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ac4ed3d4147d34a6542e9aa928b83845eaabc6832a468e8a87ab42bc0581d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..118922809f536a3da327c3963188cbbacfdb97c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2ad624ee82db5b736440f9d4d5a56272307e4169ee8843edacb9713474bedb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4d08cfcc88ce3f6c5d2d8e86d68a003bb5bf4e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dfad540d962beae1b8ddd965cd50a2330078482a885a3b6b83a03f85b6e86ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cda528b5f84017faecf83f48988ce272dfb2628 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9df823ec2d7b11f73d305dadb40854b08d1249b022c6a01ac7d5bb2f1e28a647 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99845e4da74bab43a921440fa43c0fc580ae13e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20b066830183295ca8ab690f0c0797bcecee506927312ff8f1b2265ade112c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..67eb6ee5969b134b650134a2c1c7aa71a2a47fbd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b336256c113c38bb60ecfb11f5d42f42654c00fef2e284c3edc9b51dbfe2afeb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3d28f8f0375ffbf50e37c04d46aa09bff6ba48e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c36543c2566bd601a919e30a2423948cd1411f63370a086a41889c368e91d9f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51dceda41fca2007c08b83f558c30ccac074a36 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e056cc2ac91248f146964aed55d825abf4ad23517cc5c39e64e706f272fdae96 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef2c0ae121ecd77c85615746f96cd1335ee1a9ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb6ac692b7ed7e53ec3c2856724094366bce8ec9ee7ec223f4d325d2f9d5adf2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db6fa1bdd8588c947de08b0fff132ab751fb1b5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b0249a57b2399f90ae4579b20a775ce68118ba9187a62aa5d3c70ec40d3ea2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57767f782c98482e287c4116ce2a4967531b871f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3e37002bd2b6cf69ca3e48f4af2cbbe2b36ed60452a9792690d52485db9155 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49e2de149d3f74056b9ecc87fb7f893997b9823d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4b9db1e8728b3698dd1cea746deaaa20dc6f9d3be84a1718dd8bf6bb91a61c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..846c2845233dfbe73dd9e8161fa76bb4dab6a53f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75502c4884d01d1438b586145dc0bd490785942f9c340e30870ca5370f0d07ce +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22d1e796daee6f872785d22583a9b8d13d9ac928 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09f4dd279e4fac76c83703188cebcf8664f9a1dce100116dbf2b067cc2a80bd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d7da427c451939548d5cb4dcf3cb0e8b8e4b4a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:becb9d2bcf51c9d7d7c9bb3a14b32c58241637f9e68b9c3d5dc0e8df93b6d56f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe55cfb1d09faff1970589be764068f908dfc8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5691e1e419503dd4d0a4dcf1e509a1ad54b66794f8553960e0cd8bac7f4c3c5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc19a717a6a097a244e550e69ff968d8a157926e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bbe7bd6e6f542236919250153df713c5fa7821bc743440f2a9ea5d501434289 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca8b39377df04e38ebef0412adaafd8aebc2ccb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e4e1b1304ad7a807a9b7e7dc197060c78c8fb9dae645bc659e5bfe3be24202a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45fc69a66e9f9029c8081dd0933f7ff4418f2705 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f29d08c512621eb283b4137d630471ef8004c801cfcf8d98833b0e9f6d73aa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f09ad16e9d9ba5bea686a6e3dd89e1c90b7164b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03233b3d0fa6899ed33ce34268629e8cd63040d17dcef9ef8cbf3c1d44f316b2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ff55e5348ac920f8015887b68d1c5c1b6a51372 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94baa6982f53cf5b82419c7076d6afb77d42a55475dd8c6b8a304606d3019a7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c33f4350024f11011198012954d9a32761a9fcc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20815f530a0d65ae315593cbd49661f511a5abc0dd670f0582b0f0f496ddf87c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf36c8771641758545765031bed8756136a2e3ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56734dc2dd02dce21ce0ebc9613bff7e7d80323142ba9ceb24f70730d81afbcf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ee1fb804d66976122a0d463353fee2b8f3b844b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da4bfa28373cb98fc9a57343159d537567fcca42c8eda533477f85b4f9c67a3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ebcd85cec02588b8c854ccee4ba2000bc933c24 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8541254c4b2c99b2e9af8d7a3ada3efb418262323ae83fbcba27c581f08edac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f138dca7ea0465d2ab528d5f26c96d387483ce79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2051b93a279b65f568039d7b770fe33a3e8fce3afa77655b566fb39dbff9b876 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..91e074cf93d2bde96651d8f358751dbe89248896 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26939b84dadd9861f85fd7a41a47b6d6e6c9d2d0a82be0dabad3ea07b1769d4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9be495d3b33984ddb4a95d4475136f8a640ac1c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b8c872751bf5d3375d76cf6e7134136d73430292ae7e31457c42381a740296 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d62393056acfbc0e10339fc7cc8a11a3597db97 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5d97f4253e7e47ea73431f6073f6b6e721c80b4d205095daa93ba75ca896647 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed039b55342f641fda842bc369d7ec15bf3b3311 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80b5e5df13d65f84d98bf91628a9522912aea9c93f4cfaa4f4620c8e3872386 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..064327e753c1315b45256b05793fb55e68bd0eeb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c890a8707e29a40956eccee8cdccdadac0c23a11eaa0891a9e79db6bc41dbfb1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d53928e5ce9361e6940f728a91a6924eb2c7cb0e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:becf6ddad0cda187224895c5e92073d558e3fd37af1ed7d70f0e90c80b55d9aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12037cbe00f035cf9f6d1bf3dd6ac41152389fad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6cb820086787adf7d23724a8bcb417748b01e7165314d84d39ed7755d64f91 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8127813b99c390716fa402e4392b89bbffd9c69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57f4fbaabcaad7a815d1d9436eaeb1e0199045c7a0309c88b508366bb77cb363 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aabc9783aee31a8eda8d35fd415f86441d7fe49f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f89411a6188ad8c8ad3396c564e5d1ad7d346e7b5d4f2d8846c95101fd6561 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c046809fe5b8cd1357d6eccba353cbb545d24a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6917fa34bc4f4651fdbf682113e26d9e4112e31f2f1911bb5f84ed6b3bfd0fbc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f47c13df5e6805b8f04597885ff4326e31a0888 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce7004bdd49c4799f4ccc47f1049054a3f97fa546163f91bf01899979be1ea54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec6380a81d5fa08040621a52a122786c87144b43 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15dd5e22a5063fd29fdcf4724e18af9b238a07f762d1051c83f488bb451bf2d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c4ad3c5766d5ed897c24841447011085b6bd5d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba2c49c473daea7acad7bfc0bf66f60176f3b562e3b7a2add8cfe7c289daad9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a32b4ce0853a0fafe9636a8e109498574ce3d366 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921e3c5fc7e13a48c6780df09e260a36f86407ca240c10efd7446495eb2edb6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d02196104141b5755dcc338858e6329eec3633eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b240567eb898816d3f78c55757bb66fa703bab75aa6b5c6f57217f9551fe729f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77dfb297c5038049e66f63c85ec3e0a373464195 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac23670673e8a8198f5f93f1e656f26c3f3344a04d8716ab2e76262fc64ef4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45494134083f1cb7cf54a571d8298f9a47349119 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4735189a1ca79fb8d21ca075ea11a5bb5cd1f3fddc0f25a2274b875dffb36f2a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d12bca7e0522c2d0c1e5477a70433758d13b8dcb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554eea014d2dafff5e5d5c4656b36e9a1a3dd42d65a3ae48aa7f4d63a7be1a06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f691748cdfb33244dd982c2cda9f12dfd4a99106 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60b8b7cc95f5c26efa94a4a3b76988faf7e6c9a695b861cbb723a36b8707d3e2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2667dc1a77940ac65f21a9b38ba52c8f3f20d676 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb5fc96818b0e6dda3ce9e9677e2ba0d97c88c6b6d96754d3599f1153cfcb6f3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..089ee29e8af9d3de98039a37678cf589a810aa05 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0457462b1296877908988c46d1f4f4de97722962f5dd4e4b7e3bfb7f3d6a48e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d2ca764e33d037a6eff29d593121382fbfcdc6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98096d35cf4ac110522005e0081a18db3a515595776ab12ab21406afed9f4dac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb4732d20291b8631b0715a61dc0e77f9ff6529 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e793e84b6a17cdb7ced2ca2609ad184b3cd9baf6195fe5a4cdba84736e0f005d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe2e1fb6672861ee04a7bf36b0d0c3b9aaffe2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3f72413c72df749a547fd35c81354ddf815cae874429340a0b128c497a7665 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3efadb4408eb5c90823917d9109dba12e64fc6ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a20315b040460428c4d0d282ab22352e7889397c0c4deb4434e04df6344ec82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d096504fd420787085b5c65c7ca472d7f25566d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332940879ede6a3252ff59ccb06ef1abb0ab0601c22c00fab981c1c19d71aec9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4fc6161fb7225b8dad16d5f6b8f5bf470a0466b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3342c25d84e021bd1303fbc2879a7d84ab966f363327979f86f5a5de13909c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ace802b72f07088ae97143c16b41f55bacf251e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d173581866799eae1228c81afb1aab94e10b96f3616a4c3a311d04f05694a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76e6d637b6e7a3f33c7f6e56dbee57c9fee6d89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae19b1a9d8b5bb10733da5fb1f3d0938ddfe1b390185bbce2d844dcfbf8f3daf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc1effc66dc9e06afd339f3febc94d1a012ae290 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e391bf7905bbea9040a41c699006badf6d4a0ab6482a8936388bbf658c49f5e7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f90e6c4a8cfef51c437ff587429626f5846291c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:261340f5bb42b395305ceb136811d675b6c6d3d95b996d4eb9c91ae28a5518b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81df49bb00c86bc997ed524c1af7f6aa09548465 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b18ba9c6202bab26d90818938534aab0abc17847419d7d51a5c47617db7e877c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3edd0dfad116d436a590b6088586e76406b5090e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6fc4b3988133f1c03b493e9b71d1ede9132c97c1eca32913861f5766bb22f11 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c38119f6ffc4d42920c9020cd609a957cce04d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82184c7e7e5f4d79700f2070bd7d369fa8f886257dd4763236e8276cff8f2d34 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4694bb541c971cd491b391c80a3f3550d8949101 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cddce53535900362814438d8438789954fc84170dd51851204b865067cbd091b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c86201434b190a1b93611a17ac9d22bba75eab1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8bf7799f2fe6e07bc9ee1cf500358f0606f741ef75bcfbbe2f7524496f501de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9017312e69e43134c416edd1c03a795e5cb2e95 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a512615e09ed1373e7e042020d294aceed698c5f0b891b55f1f1f629807f3d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a321fcfab1ba4f54e7f1271efd8665ee4c9d24a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c658e1c14090eb2859ebcbf82ab192d07fa049e37bfa46f5d67c0c04eb95b1fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..147fb94494fd0d7c0a95f31bcc9570f31f1c66a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66f9f7b627fe8fba5d1e17c790a2fa15f62f93757c531d1169c25dba35d1c7d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..208a69661e030d551b2bec0a6d4be18c8c6e03f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff9a932e0f2ac5f5a8328b7155db38b20395e7717af497d833cc2d50cc3a8038 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..145231477cbbb48a29edf10cc6ee39b0a7656382 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a5025af855fdb7e730b72c7cba981af701371c561f5e5b12163526d867d6b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc816558ee69798ccde1eeb007d31e8080fc62e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0cde0bcb368a8b6c609181045039999ba4f12e22d390e49b8bc6b347016625 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c27ca7fa87a33fc525a6938673db8f5a08f8bc2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:991325b5897d204da86e1043a3fd8a1eeecf1918e91c14bd108767d0ae439760 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..447511fe4c6f34d69d8237656f00eb8d48dfac84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c588414aac30da6a9f9fb1e2aad98d6af327b1aacc4f73d1c899ca8cdc014e62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..860aac4d88b9e700dacebdfc76eb768e338fb814 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0af01e69406b5d51d6b878ff69c996c2c7f89b1bc93d7b8d4eeb011ada6d88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e0c0c5e97dd1837b46c376c1b7570d15f01464 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e71b06b8e3a26db2632f2746d559c1c20b787f641de887c36e04d5608101aeb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb31c44dfd5c2917f8dcbac382f346049ada68e3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3198e6b199197c98d1f087f3f0c3c528e672b9b5ac55284a03b5ede5bb0184 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b272d9d2c2734254c270a35f0c2716b5fd1f193b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cacc328c061d7e795b6b9d341e89202f6452557ab36327988dd46d9f9f3c743 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e732e2638f5285c55103b788cef1e6957c0c6222 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4bb216e6b59efbb29a1f7ef195199d8e8fcbd1c3f3f55346d9dc492e2c26aa6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c4e97e78b4539a77b70c4a16bebb4f1e1dc297d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8473e035ec66abd867a168d394d94a22466e463a739c837865e9dd4ab1a22c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e73247ff462770c5fa18cd7553ec18061f9c122 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5843518fc293a67a1bafd481024beb92080e3c49eec9f514da688d7c9974d5ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..89e5f075d912176dd7dd375abfcebe5ee70d7804 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d044c24183e49c5a1f81c3429ad55d6c61698d96062740eea3357d761aa495 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b21add50bd3a81a33f0420d42789258901b20c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b222d154d094b7abd6bbb113e35016aab56bd2e7fe0a640789b0e22a942d52c7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79a96c3754d06a623c967ae35aaffe90a48bff82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970056d6323e818dd72075df0a8e1900e536388aa5bb3b369c29e3e95a5f368c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d04af56a0d7a0fa1792a105164f76697aec48ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224f714a1a413d70e74a4b8b2b65f8c68a49056ab8404169b512fae16d48510a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..617cd686109543e3fdd0a12be50d0dc45904d916 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6169768100d9ee66abd5172c27d7ce9819b61b9db16f2c99101fc9800d6377a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c36ab85b5dcaecda612b43854091429e29eda15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ef73403bfe422281352b91887535d69d6663f30e55017f4535235da4d1a84b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5fb2074613aacc218cab20945c6e3d2a003fed2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0da43ddf1735fd8750f848a1e046f783984a87ac36a67df08f98d3aa7bd9e5b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e7b95def83862aac889027d6fd3d6f748fc0bb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb114b7f98797bcd90ddb32b2c07847c09a13a3e66c1657857b97df0cb58d08d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..366502db43322c84fb852ed20ae329bd3a0c3c8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54f6074e57aada748ed8291422421522f753b5a9d65809957e705a2c03a2469 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b3eaa338f8c1de83447b7cab36ec99202de67c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6019317ebfda7865a35ab46fdf6d78b95da461e0f7ba9d9abdeaa493b99f2c58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c652c9c34ec74ac9ce9a1b7b6e44f41d9f102269 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a1da29542443c29c3273ddd70137ba0921b20c2c5414bc9ae48e91b98318dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00cf6aa2d259d496e7715ebc349e6b6b17c5b9ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c2c888758e7bace37eb01f5459cec2dbeaf6a8d94d6bcb3097c5567477a0128 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..350e5cc027060010f8c9b260a403a69106a1599a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87688789ebaf50fde306e8ef871ace289c2e900a1f3dd1fabb89a28a6d595a22 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3a529a8adcab936b2b12bc736faf0bd40e82833 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38718deeab5e279f6c5d8a10e932a2cb65f5f38f7ada87a0a4485eb502fd7f88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..456548b4ff29cb6f1ff039c2ba125bee27dc6a26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2601b5e48514d95b972295c1b7244b8acf8b26f24b14a8f7be997d4bddc8714c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c7e2136e2ce5bbbd818fd59ab96c476a86ecd70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39097a5c26dc4e80b7104f84e4d12bcabfe77f01e71570d34aaf20bcd6b896fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf1cfb1b5d7f522d02187664636e59b607e3004 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d8cea133a80cf047279be2fcba7af4480cebc43b4147e5c49bdfb1692fe269 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..711de62ed1825177fb7e1e0010c7799829ebb5f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac8da099c91dd9c8c99c6424ca82343c0613a7439c8a80e69c69595403ace45 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b66fe3ff9768f97a608c3a2a2792ca019e92e26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7542a146f258e51527cd84633f00f84be12c414c50664bded9e2394f0d5edb37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..974d2faf2e546309ce7a8ffc586a9ed6841bed98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c13e7bf4cabb81b257ccf358755e8c281b623bbb84bfdef9028a22e8d903e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49352c0694e4e49ca120aeaeafc8ca024909523 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd0229c3ba7dcabf3009a2f37fb93930523c070a0f68fc92ef010b6ee251749 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b84cbc8f833c96aff6e4e2e06e2e2554ece40cce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae70db29b76bdf106cdb02ad4bdcfb0220ed1d551e57b2241dd794e9b7099ae +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5371d96d311eb05e7cdb19460e2acfdf750b7728 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea8638dce1eef10ec6b63c8c2969c974c4d06e18bdeb8fab6aa9276559418528 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..43feffe5c50fe541b275415ead3c1e8fa289d422 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22ed58f5773c075eb4e1fc304273bf6ade6251e788ccc937f2d66a8e94ed4e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f144076273157635d5c7e6757d36a63435e5ff03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffc3e046c1230bdab0ec1ac9be4b0db719416a991b23f85e35385751d1a4640d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b229f2dae5d850f76bc324f675222bae94f6ab1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fdcca41f4946454cd7b34753be4c71a7e2824fe7056385c9d59d09d60d44793 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e8b52318b05f8c80084e8f0a91715d7363efc8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63351031b33bd65072c481d318d28a7924a68f5485878f69b4ca49bb1489d433 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17532f3631506375bb979e8a3ed98edf400bc618 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8dc0e173c10f41255f9de827cb167a63dc8a467db731ef23803dca223d9522c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6e071ce9c049a6061d67d8a350af0d772b08d3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:461e511c4fd4ff4f1c910dffdbb4f6dfcaee8749811ff93cfb16c795d194ccec +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c23b490879e1d183248dd9611e1930a1d622cb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2cfd37381498a0ab1cd0b11eac5775cb3f4254b45fc47b39ee0dae4484d2dd2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c8553931f5252d62b7f27d4b0c0641f55bd50b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:936e63e3eb5d9d845fb865dd2ea2d5c89565b70ffdc9f4713d188cdace916609 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a795012105adbb07311dd7d2e8b94d92d3f2b2f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fcfba32378c80ab8b860e80c43f502e2a922ec6823366685e290cca2b6d586c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b087e115cb6833c546e0796d04a33d0e10dba9ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6264994cf508562ed5234f5b09e0f8bb584fc43d16eebac607c6d322332877 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6824d80426ff956d51b8ee90fed1d15b48a14150 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b533e853429218ca26e0f30858101e76309e6aa8e71565773e10ea99c48e2f08 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..766284d257158bdb02fa0888d3bbb69d05ccee93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfeed1241d5e83730048d6f38ef26192ea5a9a1a8050e81da61b5126a91ca709 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a77856f41f58e9fe8b71a086e696cd909dd89f9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d375e92f13e850f821d1ad3aece20107aedded1545d14a19cfe97b0c94162a8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..231011cdbd2ac735650e9b7b95362f14d1f235c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c9a92c80ea9c50dd33cb3a56bc2b9b682cea806cc4c925c8e21565841a7a4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9baea896a00b135ce597d776d199f3113717baa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8082f4fc9ba0ada11e19ef317db5f66cde31985fbdd375b137e19f8d01173feb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd06e10092b02941555db7fd0d03817bad43daa4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d55097d7a9dbe0d93abf7312d073e056c5bc4393027f1eea3c7b1f9a5812529 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c955737602c0a420df4d0afe8ef23c6edb6cc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dfe9c462161d7978f09d910b46ce5a83abdb6d8dbbf465dd159d20ceced949c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e30fab917c180a58a62cf2125f393e8d83db0a1d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3f3b930d887d48ea1a64094e4671cd7e0b3b643f9b70afa2ca52f987cd9ef9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ffad116b197f144e39a6cf3d3bfba62c669de93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ad341867dd38f142bcbb0199b42edd38aaff1a5d377f5eb8042fa2bf8ffdc8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..520b99644063a7444309e1e43732b8b4619b4ed8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3606be78ce4242ae83bc35154e3e4ddaad1b1d002e693c3e96bf32ed86d92e77 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6514895067815a14dc3c51ae7398306079aec10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0902285b39616d443d31c1a90097029ece1ef547e7a929d747693530ebb67fb1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4882425a40a9ff30a9e849287d15b23999dce676 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86df0c65dac1519a9955f67300de6c69d17d9a1314b60d8e35e78b6846fdc9f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb5b06f28f9df767a132c52acf96138368caf63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c294cc9f02626e93eae8730f4fbae03fbb97d65b446f654e9c693b4abe2b7a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2748d32cb5ef425405356a3ee962fa6466cfbccd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ebdd4f665e601117a10b56e44f46cdeb7a0f207609174a94ffc4d887fcf51c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45780fadf9d5925f401fb672c620fe3cc0867880 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c31c0a9ba1f4786cc778a352bea3bc7857975723f51366249f064320bc4bfe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b56509410a2fe29308f7ceb0566914bdf2247033 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c32d5c0ae94bbd0ecf4e708921cb30ec74b509181d914f64128f1bb54a3a562f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb6b1ab2882a3bc3c969f28db586c86d62bdd180 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cee46fae06979e99f4e8710601deff91b688e2cf2836cc73af5c3442c4511266 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c5ee399d87cabb21ae0537c2b9f44ea0c9b4864 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fd4ab6bc94abed260152036a3ffd5e2e4d276cf84a69e0b7b7de661bdba9d58 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be80365337e791ebbc5eca7303fb576aec74d61e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:503a6418fb0b28404388ac7d2c0ae4132292ba378ef935641957066c19d9f743 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15ce39f0943d36d88cb0f2fa2f65354167e1bcc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1922bdfafeb2bb0b2ccc6b62ad2b304fbfa5987bdb8e8498148aa00d87313a0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad0e1ea42aae2f807e2fdacf539eeb60af1be6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f526ba947ae644cd8559d5759de6c0fcc39d2c12d770049a331b396112ea1649 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6834a4d516896700e16b3cda4107f587183ad30d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a0c4f1da3585ac33355150cb093fb432630ade7f5c635c9ccfe4ec75dbaec0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03a24499d5bf5f0683b188816a57e21edb62a20c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b303ef65fae869b9c7652ee8fa5217adde92cccc93830b336a0a409d488d51e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..395ddc957d1a0e644bbd6b2fc3e575c9be8c882c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3723e86fe511801a50fc63f23f879576704a2a5b0315c1de66a325d773ccf4b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34dd4f8dbe6b9c707e5a27fa79f4ca1f363359de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941c4a9fe95a8a16b2a86308866745ff2248dac10e67e853ee919d80eba73ae3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fda6fd1a9ad5fe8e544c5796bf2af7c8514c9e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b64e043d6f7129c4ed415b1a6f07f97c71fc337891e32aa8699ea8e20ad5b79 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59dbcf11401354c712bb05d22e6448f4116ea89d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2df3d65a5eb19fe7c29663f55724b96149332321e668d057ba34e5fd10d9b07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9baad6b43853e36be21d4df9bc0493d98e023411 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005a139e589036dd070f5904c96758e54acae3310bb60b1c9a4cc218c0958e36 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f48abdae22192278d9efae826caa74a3690772a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a561e087de7d677b1e416bfc32a5a2becde6cf63673f47aa3a04772c456a160 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51f6a7f3ba3d8c018a4470a0a6bfb7b304a9faf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974ea59c4ebed33d23c7be46cf017267cda5e913d0302a246c83465230aef5c3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..267cfc5e44bedd4f7fdd9db1c2ae4ac80a469cc9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197721656cfdd3f4410345e8f7d313ca813cdf8c2353cc40b105f170735637d0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..47965195f2ebef08e0a09018d10e4e792597601d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2da014737033f39625174a9dc537dbbfb14b0f323e2aaeeea39603d5fc2c264 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c77baeadffab6607df107796ccac3e30dfb3f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c819371331aa4b63268ab816ca2fb9b443c028fad25a81ddeb3698253b7a48f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46e3fb54d15ae292507955463230c754f796492b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd237c877c4f72130050232319ede1695147d08911e9b656852091a231f5f2e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e36ead3bb5c2dbe34e6e7ed5bf9052d15e53d6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7848de55e7e3822a890999f13efe47cfa64e8deacd7bf919afa1f253358c831c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca9eaf4524383f56b80661c2d797edfde90c302d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b477d16d39b89e2cbdab757ffa3a03ae7f087c5ac5d373f74111d546e61e9585 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d5c42918d109a6955c2f89f20b346ebe3ec231d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c97cd56ecea4335fada48055079b1def73c004b620c929c369fa618a2278fcc2 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76935305bf8956eebfc4ee52fd3d06b87c15eec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ee16566a5d7be07a1afd1f2144e2879984c81d4b51c963822e688e2c5a38e2 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f0fc4abbd5f61fa3048a9a5cdf23e96bd25571 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2055a2942dfbcd6599d67092f9006e988881673a98251bd8516d038f5b9a33c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..804f72bd9a92509ff5005dfc31cbd82255b502f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a057313c135569d2924ef6429f32710965522b2523a8c6a224a580dfc9b2322 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08cd08ff14a4eadf641f69ec569cb5177838aba9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a085a4edb7c91ffaf59abed65949d987c1c83c12daa25cb1d438e201212b7553 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7519c3b608d7295dff23f07e99ae81a2098730d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:973d361359ae4f5f9d840cd861c8d5e13003bd82cac61e35e82d8d4f4d0e8249 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..274258e3e21f12d160cc879f4e61b8f57b1b2aa2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1c7787f30bede8e99b9def7f33910a9d42cbbcc6d1192556151d12016e9812 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f26f80da87a336e8959fb755ca50fd5f368396c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94190f06e8770c75cd76197f80559af9c9b969980730e35cbbc2ebd9eddcbfef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e9345436eccbccd1bc7d3bdb7a71a68cae147ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5a4439f0c22913ba3ebaa0013470d9570c0d0c9661117891610dcc24390bd9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94ea49f9b57ef3c54e3b1509930dbba3e0cba529 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f111c8ca3fc040af8ee2157837d6de516fe91393d0622e37e19911b0b5b7cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b32cdc6db33c737aea00b3cae55aebdc0c6c9a45 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c45428b7f4c27e7af7489a193240797a0e3787e234cc2d52600dd45119dacc0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d0c8f895549013a1a96be361f6d25cf314d3b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:744604725a2d503eb17c161d61c3f33a4072b33dd19d48b65d17e0c3a80b1a08 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..59008f919ede341b6f86cc60256c283de2f4ee6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e491ffb49fe19289f2942ab48344f5ea2aa83c6605901f2ee636bb60b616c31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7422449da2544119ddb1d89ca17f73afe0b13195 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b670c366a0dcc0a12003c04679a82698a5299aec38eff93d9e130a522e1fd36 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3addfb7126905216d4b3400262b391945dbf9d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34bc8f99739640274f19596efdcc47923fe1a2838039297bf28da66b40fdec7b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aaebccfe8288a27edf1691c3cc4d953024380c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ff7b16d8ec21c9f254227ecfff0bbe78bc80d4e697a0a2f04e907d2c684c1ec +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ddcde009fe3e3cdf82c6917629873d177b860ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9787ad6cc2da843e493a645add96696b3dc5e5c69dd5595d87b081b7862b57f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b4b8478b008623aabeca60a7bbd533538dc8ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:819ac107749f285ad9f79e22c2c68febb36e2e7191ed8c8b110dbc46848ae729 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35f2f97a3e874bfa162c8d8464d0f495133794d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574a5fc3afa3e20c08486e20eb8d6ee7f2273f5098173f2c487e5912ef00db9e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bd575907e56229eb1eeae06de6a7762994387be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c3cd54b5741968c09bc49da729bede2086d20d68e27893b246482e9903d3700 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae1bf0034512958586823df2aa4d577ccc094566 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ccd1a2f9bc269ca6de49f65551a997851b46bda5ef289a613fc3906315eba12 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ee7f94ea6e5278c418ecfd33b8079f436778f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387257445e6b39a4eb3e93ffc687327e50b16124bb4219dabcbc347fbd9f761f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1550cb3096959b4195356770922873a7057359fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57154180ebe9daf1718c7520af760638474cce05df79352a9188507737d2c82 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad33b26b19e902103a7e5ff9a4f7396ca65493c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd27d803913c9a57f7842efb75e161de0a71c691ca8fed39041d2494d8a058ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..301d4f2e1134846be428cca7f79fc65e75ae2b78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e69d44ca610eb43b62d1c5b35bad83043778fa09eafa723b7ded2fdf52902a47 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7447f660ceeec8796292edca0c08f2ba34ebfcf4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71cb2cf0e8e7dd9356daaeca2343dd2f26290c6a6b6be0ca16d481299a925b60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed0dfb35a08664c0a79b63c2d28e556672ae6a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ad9eee102e70ae7ab40ec565b2219c1f483b0112ab71a737932a367346da8e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82897956634359364f54cf267fccbe6573ffecad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af3d65ebebc8b1b6c5b7e667094d37f580c269a74bed14310dd226b45767c5a8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4f76c81a7077809a0864f036ad87c5eff6a25e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794a567032c6fd36ec0a24567bd7a063ba14a766b159233dea6289844cd3bef1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4791284616fec12864e784c677a5064076debf5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee5acd3dbbfc22e9661e7be611c62de824c8c273a3d01fef7d1b920fdd9bfcb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75d4fa023da44ac57e497de69ff9230aefca837c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1602512758d54a16b0774eab51f4cd8d48116e6a755fdd89aaec6e4ad2d99ecc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc6f3dc1098af9b1c33350fda5b93ec9d37257f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87e3012cdd9be593a3fbd0295473ab5211ae033c19348da8c9658dafddf97fc5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..472722284b3362888ca2f735cbb4c23069ed88d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c751b2d0928809da2013dc7237d23dff1774a81423829de4bbc7ea5d129b187 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d96d92e13a28b766b4c8c749c72d9d39d1902303 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2214583308128edbde8162c40646a634e2e93121ffabfec933f66beb2dca21e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aa12365609b60e20c43a49d9c2ef8cf95810cca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb49a43a912f28531f517420f45656c10a7b9bf58fe09c6eb71e6b9422739ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6b12f2607d06d30617d86d8a07b44c29d55c263 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ed4a13ed855e6d57a13ae58348fe0da9c49fe0bc0ca8ae2485c59fae41af180 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c70c352f43ef6da029644e58d67784d38172ef91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c95d0c2c5dfbf738d6d4f5144ae643a938cbdf09cb40bda6a271880870fe2325 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3c0ebb4274f07ba58cf2c286bafd38b66bc9fd1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56dba074762eb25b2ac2d99bc228d82dfd62a01e451b54e937f1b730f1b2c535 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..017f73f0b7f5673da29793e67b4cb4b5b4126f78 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a759debb7233fee278283fb4156b0a09ebb56e10a9a27813f9dc189a0dbcb70 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b3214702743ea331820d2933273271400242c2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98f5f2008a1d05c9e7b9ac64fbd2cc7b84881469f7e15711780064bec5dbff98 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b24eb7def2d5da76cecd7dd7732900bfdd9814ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa73a1d051f6bb0b12abb91dab9b993eb675d95e4be2a43b9d2b70f6e089e3f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a472482bec83d6d8825edc09d474206d98d207f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e7288f6a005469a07f9a23b192d06753794446b4d97636f8ece375857599a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3ce10c7ddca6a59f8059d1df539d2a239abad7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f362d357c7cd1d3cd953d0135f44b0be9c25c28e1edf69b4daa70e24e889b704 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc4eb2d88a3b336cec7bfd02b0940568e700ae6c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b64062f439cca17572ebff725afe80f060197ed6aaab380e27e66ea1dbd9b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8773c3a1554ed623c25ce53f08b586d701113f22 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998d577f75ad5fea73bdc356ddbd8a0801883c9302c3b8a73a7caebb1538c13d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb97b37a68e329e45c85fc50709c90b9cea140f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e61a49c941434b456eb29a91e7bec6f436e00be047351f192a62a3db3f2e059d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c71cbd5286f61e6abdb33fd51daff8cce3b14d67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3904d522f0436b4945eeaf0cc77f671a964e468065c7b400d010739c147a3a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e99fc70ed4594dcea3ad35f63815123849e0f7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d3a6ca6ad88ec23b3d64710f5117a5b645e23246d117c92ec02b388def61c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd7ac1d418115d1bb183646f146bc4a706b99b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df8368b67357103a4d27e9f25bf4f2ab6d7990755395a3138725ef241ed257f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b0da66a400c81e87f578668089bad8535c743aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e923b71e24c4696e5a41eb4cca3f92766760f96dfccc4e4d4e3f4d6458dd43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5979ad150472b525b29ce644acea2aa8a59a6d8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7ae43e94337f08374cf5d2d87a93ddec66388b7aa85ded303c9420caeedde7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..129f572c1174f079e4a14c7d8ebec7ca28dcfa67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98b767bd29ad1e70d66d35f4f738c2bd023af7c1f8b74d5e98696539ba8012d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a303513fdd760d70c793ee3ac3be8d9034e40a94 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade57619ad0ba9e77492f41fca32220c8a088c9d09938176b17ba3d7b8bfe724 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d130f3dd0cd4b5e17495e7d8f6efc034d962a78a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93c73c09b4433aac74b2b7371a4af4a1e732b63185b1a5b18ea445024197655 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db9f016c3a2e3ae23403a6760bf4a5f2889f99ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d918699146447af1462227f54e8bd01e7ca85fdf67602bef13d32f5533569aab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ff6cbffda99733405f97a851ab5850051edde4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3175cf528ceeca06ecdbb878430057a273c1bcd423c5448f835cc9b99bebd992 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..25476f93dc6071489b4c872df51b2b72cc5f680b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2da653980cca1fea129a684efd061b3e3e4787909bfcab94c587c272ea7fbf63 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf16513420b0482228767cdda64080842a19fee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d089f8f5d8287b1b85a00faa228ff7adbffa33713f4abfb680f757cdba0bd28e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..399ee49db0aca293dfcbd280739221f52b33cb20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23ba813f5d0e525fd3190a86b4ec94ac26a67189a9e2213dcb0c6522907641c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6a928fe555fab3070fa4e68c1f80f44f9ea5b8d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb5521a62a9cfc79cd2d4d5d0e04ced434134e90319a0c7311dc524e439d083a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bef79daee98ca490d28860426024a591a3618c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe1eff337f8af669307222e96b11a0b81f75cb105c622f1c223cd806bc6b2851 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c356e175f869781b25cd401ff126aadcde20357 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e941336d4092cf1e5ab8dac0cec309c8961973df9fe70a5b4a4da5c83b57acb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5addc8c7535c9536fa8653930ac045aaa1514588 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c1e4d77be2d4fb6d6a096264bb89de1a92c85e4300379ad22df3d12a314b32c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69483f72e4736fb922fbc8595c2e66e3e28c7bc3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f152a9ba6f4bad6576017cdc0ec832dd977fd871ca6ace1e4937c64778f13bc0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5fc23048e62015c9d37a88da916aee8678b6c65 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b6958c737463aedf198bf6f65f10816b8f23109f59c9d2d9f4056e73940ac6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..294a7fb117ad7e65d291cc3fb521afac55d773bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b5d20efd9894e465b606a0f4b5deec74a06116febc0afefc57df215e817f14 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0ccd904b385b3485bb737bf55be5e363913cbc7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d6aa8cf7d5d4b34f435a26f6af1567dc8b81d0e6cb4a01b6e3540bf534f5cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc413eaf06ffb8de76881ca6eb6801dc52217ad3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe2cc09031cbd7ac7f8fd68ee8a2a2f332b6b7fe448d8550f26a2eefb3cb3967 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..709148653f7aea634d4eee7401ebcb39962291ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7c07aa097e98774c19638c862d3649c2a853ed8731554f0fa5ad02671a75b87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07f4fa9fe3a2e7c43beb4ef4e0ebc678c7c41e03 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ebf87f522b92c2ba768be8d099a2843129edff759517cdfbb24f9cbba4d1b8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e24c4d2fc3cfe21f87f45c0dbaabab9cd5ab975 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97836b92c15828e5940a8159f2bce4b89ee3f0de3a8cf418a0b8d99da17116aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06b041e550b906349a3b832eca3f6d8298fa8eac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1676b1c028b4f4239809c4bd4e34e4c9af5c32fb6f2484feeb8acc61dbefbb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32afcce8f36e59e77d72256268883c1d5b909d13 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d85fe13b56c4d6efb3c687c700417c795b28db07c6a787a7ca9bfe9d33046fc1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e611ad54cdb3d7bf16cf16178eb438b76607100e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40bcc9a708dd85d5430002c6012cb87bea2fb30a5bc6e0625d0cc2a5f753e022 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61139e613d88028b62d3ad43fc7d093f8e0f21f3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344b242949ec20b1ce659a0e90f220ffcfc59276705240276b7c81e701cc0e10 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a18e923fa705badad59dce24f14693acd3c35b3d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391ac8c65d8fa7b0cda06d53eedef6d73253f2911964e0092a3271048d1fa4b3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..30f8967530a7f522319f80de4d05838bac4b7121 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4361078efed57eef12bc0befe4709f77aa5c72ddc1032f4e7de740a037e7c698 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a3430df01b187b7a9baa7dcf054cae9f6b34fb4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00ee2d1173a96ce084e769a3ba81fa7a0212b06bc2128dbe62032226cb89be5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd9385002a7980cff7344d4db108006a993c6db2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c44ef2ea06eb1aa531b0b494a374fa3ed91e7ce5e8a1e610bd54e68e34b8ccb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dca2f3ec8ce8b8cdc24bbc0999df75142b118736 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97096566dc6a6cbf38b8fdaea14ae826e8d8d101d1e4872f98599a973e153ac1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeb2a9561141febaceb68491cc604e629cadb5da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337d5cce4047eb473030aa19c7b6b97acff67f8f3bd0b5af5c98f5ec4c412eb1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afc9ca3c9f64277f6ac707b65b2621351719b33a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf76b068537de9a7a66af254012132c9ba8f64f9f7ee46f8ad9bf0b185c269f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b6531f37216c9ca2121545a24c3b699a831e53e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e4ebe0fd23ea1987ac71da6598ef2dd304635302ee5d5a704e8505b963db37 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c86d3b45b62069e615ceb19104eb46dfcc8940d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea3970cfe6a58a49c3d2142b9d00758625b52d5dbdea148f68f39c4531ecebe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3caffecdd99875bfa1deb1aa16d4b3ff73bfccd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2ecafc21d01ea1f3983cb97dd0320ef8e51e5194af72201029dc1efefe6a0f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d4fef67f491eb84c47189889cc134caf04f540 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23172c4413b080d5f499cc119be2381422e5e50144248c8ba1586afd7430b4ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..37df59310eeaa771267893534bcaa0b72f99d894 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cecf0f678ebf0e39c59f37d2334a4df21f8ff19b1cdfea7e99fbab6e7d2ce59e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cea96635d8ade92d5315b61881e51d098b4ae565 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76ac1988b1487910d36be7cb2b73fd0808e30bc3ba1b8724091e139fad59159c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93d71cf5453ab3e1ed994c239e70ff231b7e1714 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c637560758e688f5ad8f41c2a55a14cd4d3a11d938cb8ffd4ebafe6a224fb92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0e0258f6723911a12b481d6edd1ccdff8b9bedd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5d7b075b584c3ef669db7306b81ec9c8e31703c3a6297a060486186dd943f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16db983e3be9c6b4cd07414e38d3b90ac6360aef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b246f7e1868fdb82adb6865835df20002a507b36b5ed1ae0771bd6625a65ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f56120123291eb3a5ec2f0f2544d4ff20de1659f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b2a26e00cf9ea1f90af0ab3ac73fb116982fc4bfc423d3fdfecb61592abdd6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba85b5ec1129ff43c69e27831bdf6ca0b75c8205 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949e24cdd2d4bbd77952d96e2b45672564928deebf63232c952cc18b538c0973 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ad5dcf867580173ef04fc55e61f5559fa305c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498ddde140bd720e5e3bdd2148df6274c8acfcb5092c95afa6fd24a10de8695f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b12c223ab27d1d583df75fa00833611cc4358d7e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679f13f8548b0309e2452e6cd4722f9c9731825b98846a0e2f6bd1960e0488a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cc75192a2f56f4aeed47bb560b54e6d97bf0ada --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601a2edcb13598a083b32744e7cdbbff0a02083331560a663fa73cd833abecda +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0d928c63ea5d67b315682d32d4a2a9985c0a19b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37d1102c13f9f15142ff382798cd92d101b5e2763d19978071754b1a4955b411 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91317fd701ef3428ef99af708d918b91ccf118c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c22b0a8b991ba9225ce64e8abb7d92e40deb224a2f678238bc1dbb3ac46828a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..81f9bbb46235f66d8f27f504b4074f0e5cee8ef2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7859ac57dfaa8b043e696eafd037770ec091c82e6fdd698ed36bd08ebd2f8cf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20dcfc83f38fec3e3271e1c7736f2d6aa627c50a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18186061965781fd67ad59124aceaf4c3b0d61a8db1e782eb1ac82113723a7ab +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..562f8e1ea991312b04750818e1a5240d7bb652e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a929fad454bdcff8f61bb7a3698caa01ef80b34554c0d348d571caf9faa9599f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f071969211875de9a01632ab35b4bccfa5cb7d91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bdf5836d582a29f198f9950df948fe6368e4cab3928d29ecb7f291bfe83e496 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db7ed1949b64bbc2d4b8025e8f49f8df5bbb1a72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa8ac50d44e12ac002d26a6e376d0b1715899623b90ae05b935d2945859e7092 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b36183851a8641d82ab6bb73bce48c0a7fa1bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbdffcdb343b3c210192187a46becea4a3da159e009c9bea390d788089154c60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..637406be3a936537eed7f920e5fb92702360cffb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf00089a5471c95766af4bf8ed3cefc0c173a16689b98ed291d6934be2a9c7f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7662e4b29176eed54e975e87323b0c50869a02fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22e7bb5e9071b9070821a3f76e18397ab82e55be9a2f4747a4488ee665b2f31 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8464d03e24d2d88390b6cd87c30cb82d782adead --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c607bc2b42a8bf2aff745e257f0425edcd81b8fb402f8a2c28a1f303de068118 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37d44aa354ef397e9efdb254e51f82dbae976981 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f6624c9c0ab9c4ed1bb5a246e56a51f6534a7b01b0fadce9d90d0b61d01a02 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6664d8f1426a172e8562bbfa7c60fb7714b4272 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d735828dc7d315ec445cc1eb6b8bd45ea3e8bab0afdab57cf2cb448175eba5ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e63ad772cfeec933f232d8c78f7a653e6737173 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd5cbd5115c61c6e8511f899f0b47384b04b6ad98e68ea106a989de33611085f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d3c3c974dc56f9e4b04d492e0d8e8df799b82cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef308203a1a32230b61787f0689bcaecab1a9d013802e86497eb3a9631149835 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a944b04f4b23aa78eca5b296a097e70ff8353a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493447c6ea2b3e610af5b0f6754d3140ceed10f3366fe5c596192754ad4088eb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdf663d98861dff2cf1570c14207738ff978aea0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:280a3e279a69fe3b8458f0eed51d0e909662243628e85c47876253f026305a1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3381bff12bed012ee7332bb9e694576f022de386 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0354e2c95ab7cb7e7fbffaee38777686a45ccb965ec53104ff359f57b835fac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d7a6231b5071a9031fafbd6da89a300c17d464c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ca136fb9a08e7bb3595083c799615121b64e7747abcbd58f694807d7a3d2597 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a288bc7691e4dd4b1c09921573a9e72d2ed25c38 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03294d4a854f8b00b2d1e593fb9b35b6ed630009eb80d15db48ea575e53c55c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf8ece185d112daf257cd58c1d74652a0cc33fb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ea022a81cbbebd767c357d3a5b23101ec20f771706512d1b64780c47fecdc0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca51cd22227f18008f8f8c4544d3b6e2e27adf2d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a972a9d9af0c3454391c9d2ecea0843f09aca0ccd0c307152861d897034bb7d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a259bf9b5d466c98bfbc7d9c0fff139ec43bd8cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af2fa1dca6f9ee512d7ed72ed3a46fc9e1540edcabf475e476fb9d2d98e082a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9872d0c1696c2a1194455efd265052f51481fa8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8e2ad0686c6dfa4ded799ff52bbf24b5e3ed524dfe3eb92da605f110224f9f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77557964b8af7f05651f65356541cd619c64607a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d896db4949aad03641335a2667f48717f9db62c4d21d5476518257662a5d5261 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bce33ff00f5bb5d6d6c177aa7c5897791298af62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf581aef6460e7b9c2c033be70f5c6b4aff7f422fb33067d895f35cdaedac40b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6ead3f03d86054bd839435e5bde6f87d80bccf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bbdbdcfafdf97735a2ba35d5815604eadcf6d26a08f5d91a21ce6bddb38c2d1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f24ae2fda3d6688ccdd793f8fec79aa517fb633c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80249a481d7af371802634a3eb20039c9bb124ded181dc751a42a002aef81b06 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c16ee51bdc2e889710807aa06d6b116622eb85 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697559b0c41f7f03284383112425f9663f1fa13e771327849730fdb8242a0859 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..447a79ae99e108f137f081cbee6fb12011d2b17e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ed36562792e3c8c0da9469d9fdc274c8d6b48b7d37e7f686867b14b8f415d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..79dfb9256fd010c38c5d6d88246e95d29046860d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c22af519e9a561c77bc01192ec14703ef58267c92e15970c2ed68e5332791e38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22b13b13d549ae38e6eb321affee43626d9182dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d15640e9c9ae95e446996db281c8eb93164368684105dd05a8090d27590ec8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..285cbd04cd2ade424e3e1ec04cf76d0d2cd8f76b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e748af4903fad7311348db5421ae1a2e8e4aaa3d279043f11811236413ef0e29 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55770b68fbe328d09bdf617a7688eb750ff5d579 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:472904ac56eca595c5b7b5bc0f65cbbd1b54bda0e4363832815cc4feb355b488 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fdc1e7b5f41144321007c245f16cba4d7e34989 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b6af7f882cac707c5cd91c91de19bf7175b0c975fd78c07e824c84db7d25b97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b663dff3d4a783a6c407271ccc61550859d8eade --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fa867750f4af2d2c96ae9b59cb35ec32df625a5e5ab469298d5aaebec78c750 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99a64e292bbb6ba6d9a53e1e38cfe3eaa6dd4dd2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e30ea3216fd084feb79782c3884baf2b7e1ea2df0cede7925e46228b50aac1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f2315b75857cac632193fd02de6cee23f7efd21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236aac1180fc46dcfbbd0e2852a8b0df58ca5ad290596c1692287bc2d9def48d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b91fd6bf1f5bb9d47e29ca45af34f8927f355f26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00db870c842a436c33bbaf214130e7787972c2a15664cf888f99de3a0404450 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5efb2c937ae5ab54e2292ac96641b1bc50f3c0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232f143f48afffc2902abd4fc3a691bad384449a523ea4aac90b18733a7cbebb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d2ebc3b026da891c9536d50e037b6a6ecb779f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178ee1809eb3a5761b87845993fca2222956287c2b3fe84fbf43f48316506146 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f49059c01f66c63e2e90ffd36f4fbc10bb650a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07222c2b950fd4c501cfdde54c190951d4ac106e4b80ddd7942f142397380f8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b20a22d4af89e9db350d14a22d96dbb78e21d5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21603c2f7764c2546ee65db2de07f6cb446dc0649ebb82c12d0740d3227ebd19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e697ab83392834d420b75d0a28262fa083ae42d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c38979d003e4600fd6ec2cfba301977a551aefa46c35d6c13c8d9484a9ac13 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3c81a88327c30ed5d29f72608d0c94ca556fc39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1264919af8c6ff2c00b454e354cb7da8e87d451167e873da9c3f9a0ecff92279 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3599685b1c2d914831973faf078b7d443365633b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257f59945c00adb00f0ab67d39d34f733cb21ead0cd7cfa9a028af73c266a7fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1fdeba775aaf55dfbe853199dbe59c59cd69565 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08aea7d9ca1c3402c1beb6e780b34166eccafa7137405fe9cde3c0d31a3cbbc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a61ae72181e3ba9a960738a8208920c9e88edc6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1962aaf4b771d7875a7a3c82a1e5a7d8df7a2e1739857226d8ca4194b7f93a7e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92421b15625cccb395555f8d89a843aad9b761d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb5e8e9e3207ba44717b7138ef8aec72ccdf750861f4c975f0e13c55caa7aa5e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3b29c2b0d4b3f7f21d1dfa2dc2a1ba7f2a88c3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0441d2ce5ece13258f79a08789d1f3cd473dd89934ab970d4f06271795d75c39 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd99cec7ed666bbf46c6425a79c60e5426355149 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01077fb1b02fec0bf135c175270abe65d2536d6ae06bac11c383010452e010bd +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d406b54f0e45f1be74ac236aa94b8b8f05e3b38 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00a2ae876bdbf9b4746975a594f246cbcb2817574c02d80f8d851c48cec2bcd7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f3e9961416e07c1686bb7aa2d537ebfed9de5d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f1c3a43b65f868de126e8402d7b4509f4147cec42e2a3ad16356beb7303438a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da1694f278d020af41575d4823deeaeac20ac0e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d3f2ad89e27939c77e3e58e46085f0d63b2b2f6dd9a1c94b708a1e1b07e9cef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02178188284929de5480b8a65e7ae35d59ced64c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6ae3a41c88b9bac0ba71c88d621e087300e7346a518fa2df17f87bc948c3b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ff19f64006610ac641d2c9d87bc2e717f81b9bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ff63371cc7cabdde99a1a0fa70ee7f11f25119ca501f8252ab5080faa072ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dd353cee569e0a8a7228b9a94402bc4f7e038b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855dad7407263d890566fa2a0d6fc49c6aa88115b710537182e78c0320273eb0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..255f5049393180e6909a5e4960948330c1ae37f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a5bfb2b9f18123a332698cf8ce98330b701f31060cbe28a9a9780744988600 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ec4eb0a955e88654f9cc24ce55da8191534ef98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a02cd8ce5b7782a41c68860523125af1cc330035d2ca6b5148c9f12839ceedd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dda65faedff2a88ac513febd943f7f2c490b24b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06bbb842a49aa713bb7800885a5ca0e0874f3cc44f3ad7a01e40820f4145f19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac0de5ff96b55e7656210f59f7883f35c7188e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d2fbe4692ccf46099c52db5d41dd6d4e017331eff8cfba385e17e16d8afab90 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6afb8cfe6d5314f6e6a441225901ba0fec9a4960 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28268d5b7acd3b5fa4ca0f925f4fe022404587c2cd09d37c4ece3cfd4f208147 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8abc46b11487de86d5fe96e4ece4b3bbea554801 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:390ffef0bab8c8c58a4a19ba0a1acd310a062af1ec22cfebf0c482e26ef221de +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dba6fa1f7c2cb47d0d0fc31c3a3d9359e619d1c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68d430fb687a4ca7d44ceb7f0c474d2a1b5b0f4f2fe3f2c24169f8cc804a7c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eed91a900c10cf71b865485d97ccc243586b08d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66efdfb83047b0fe63a48a8283456ea755e9c286c22b4005804ef4ccbfad0beb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe2c29fda45399d226310b8ac7adf3f91dffc591 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50c05346aed3ae69f50f90160afbd38cc5e74daf16fd847470dff78b7dd4665 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..451b7e39e2930c5d1f2742670d4824a09cc56d77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7374ece5babbc3fa1917480edda0d9dfd69c4bf58bef3edb5915232ff62d9d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13879f88a932243b63e9f3534662516491a090e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7013c19f276578d7066d0267d8350fe2ad2d2c8f9cd904178753b10130676700 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aad6b87ba669039eb791e680a8beb541a63c58e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2eb0373b39b3a3d07685d2518c569288c2723eeeb2013f1419a8357a1fc576b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86ff95a7acbd20e730c26cfa28f3a63968d7761b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1feb3290fb31aa0daa46e68ef47f79baf10b21d373ddd39523eaa92849750dcb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0e54bbcaf27211c5ec08309fc04b35c6b92139 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8160f0d6f5c7c8997ad840da22a807fce3418226ba3f831f187dcf53a5d6d66e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a31bc668e8fe0f1aee5cfe07e1f5253cc03eb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52a05af44872d9def4af9fb3c411f3b2c0942ee5b7cca002b6a9cc4bbf5c5e86 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ce4f3dc32404859a8baa75e10038050b27a9af --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6babbd3c9f3a9d087825d70390afec5627974a85111d5e5c86456bddf9cc62b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..73e6db8706a04796cf203fa3e7d25b20a63178fa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf0a796cf68168fbf5c040789275ef3c0109c881555c89af64aae6e48414052 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65cde09922d0950c1cf626dabe401dfa20cd26eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344c3f37e9d451d6b1e57fedec3cf94a71b23b7760fb63e3b0335ed6d42787db +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..344664f5221caf395d6448afe816a756deaecc91 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bca163a3d5be894493224628744e036c644adf4fb66087d8c67ec033d6923b1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..879661398a3ca1619ce5009406ed6a51d0e7d179 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dabf24864aa487f8ef06cf229292022a5013e8ac5dd9bebfa86e70a6a88fa4e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab48b1ee56f47e8f0e4803bfcafe04adfee3359e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b61b3ffeecfac02c16e4495b0a5b6a87bd3af1227e4a989ac8eb0ac269347ae0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc30f3575441494b35d6c84c7038fb73df863728 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53125a33584f3ff942d2e67b1e682a6a7abf4f96340c365a578f54661225c6f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..287df0eb3ab29e70625460c3b3da93ee4309b633 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c9eded8ecd5f3f34e6a21663a6b5f95b88469b982278f2b9ad196cbec54a725 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ffecd8866de42b566b6607d528c5d6401df0772 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4edaf9fe7ebf0db33501793f82751deda35f003f5c3cae42b9f991c9c92dedd9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b92093dc198246aa4c08505ecdd0f58d383179 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c7217c27882efd81d1074d3c82a1ba24119f5b0d460d3fdbd72bf03608283c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b5ed1e4e3dd396a03ccd2eb38ed3981d22eaa21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947188b12fa47907a9796da7e74fe3273c1e03ab050989d35355669d21fb42d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f690a455781da3e59bb4c56d8ea5bd8ed6f1e6c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b00da9577b2b6d7c1f021da5b322db27c9d2b1d20c4e38356f3159aae968b3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a5aacccbc5a3622204c93af69d446a29f8e1664 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:875b61f90b282deed9793b1c312a361718eae0278b999bca49947eefd5af7a25 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34cec5df02e784190dcaf4504f4367c80ff77546 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac95a7204a6b639de77a92cdd1863e8298d16be00efb5beb052f7fdcde5e4614 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3554460f80b0208460d83c51c68b66ef8f944796 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1b86f6348c311288799a02abd649cd4c05c6e9f1ca477dbd51d309b48ff385 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db38c24f49d7ea736f3fb9f495c66cabfd140abf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c583047be65d3de69854a9412bb9a4c392c8c20a064687af60b88fe7fa35aed +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92ed5c65da7dc8d073a53575cad3b5a1f5a26331 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccffc15e963189c9a24a71943c761dfdb8469e01c412c4d71fd57aa27c5091de +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e467d96a221f2ff8fd98b07551fb2570a2afde9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbcfa4d2915c2fdcba5741e6e8166e762d934011ec86fcb60853b3326f0a8278 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce96221d45971a170878538be65140951c8b7074 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed55f15e91c2b137cf38e4258a97f45c301848350666c7938d56dee3d66fd46d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a4115896a8ec326808a607e022efea767d2c6e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c89283e43e15219a4838aacdde24212a68afd21b2aa878737b18a6b5838e99b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9813120a2a79376de2c1516421ec4ceeb3b5ffea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8cee43ae2763fc678dff738921b1e8d7cc2dafcacedc4dd492c65d8ed2c7a40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4301c5ea1a04841889ad3bd2414bd4b8aa5366ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1cd7108afcbec0d57060326726eb3657bc3036d069d2bd657b18585af18cea3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..09139656bdd7b202e8740aeebd84ae6d3e1309f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327596042622d1055370b50633da45a9f08b532012964e9c19f3e01caa72fe10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cb87c01c30dcb4c49dbb893ad34679b1b3e3e7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0690d782481e206dd0ad7b83c95fae81117f411f71b227db06cd2255e09a9ff8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ed75fc2b08fec6e86e02e5e557b729f6a435f90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c98dd3e6ecddea5dc558d70026c5a309d7b9eead9c90614b1ba364a323351fa7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc1ef9d786ba12e564181c5b08576d1d3ac75e10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:843f1902cf15a9c57a60d621b7b6dd26f4be19caec8534fef8af884dc2e98f94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac542ffc485d2d12fdcf2d50bd613882975871a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe55664abb55a3b53da50721acf7d21b8384773c83c3fbfaa7ea8e83f46bbfd2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90591b0e414de692a66d26fa628068bb95d518e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc0f4321b2b8e049a21fc689042b7921299dd9b63685fdda7c490b1f0151350 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86ce934c28570e4e847b3ab4e989b2dd6f52e338 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e1479cd37c8b1de3ce48112d93ef8601e819b910d24a1902852970a18ceaf07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37be04681a2748b92afa63ae1cc186736c8b5ca0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e210eaada6c50316574f77243c82eb02eb755377b3825609cf444e3c7471d691 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35a2821f195db4077ce7be26191e4c14da761c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7805c57899bade378cdef6afb3edac73d5e2870365f5b0849565a240652436c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bf503d5de07cb8132617aeb8c9266e57be505eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3810b3a36be1738258686b9070321c490ea33dd3f22100f4600c704bf813aae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b6686a66caf838db7e912101b49fb12cf3b848a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1e30d9aabfae3e9842e028f18602678cd20edc1b8fc639faadf90f38307f5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff32483cac3186d1d56d4aada2f2ab5dd9fe3ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:871721f56e11e7203ca0495a909c66c50976aac6c8eae3c0c51cbce38d83da5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..160b528071d17ed9dd493ac5c0017d44ea71437b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aed0c9a8420be2a1516f60874c00c66df07816c0792fdc97e24e84ffcbc75698 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c32f00457c3cd74bb0ac881fa89f88b9fc7c50c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2557fa48cce0244b4757fdf5256e981e464bf72a7670a598d25e7a2e784ac545 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc43fe8d8d0c846b942fa8e7dabe3b59abc16265 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5bc111a9b5b30127fe1bb04685722a6ee91c7b2f71a9ac498fdccc67bce7192 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..90d0da96f458c88a5112e0545da5fb31ff6bdb26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85559840432e5a052e7f6e3b0b8e675270695f046ce78acb668d30d6d46d8ef3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2150c23d8cd81f791bc3993341ca924d460aeb5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65676481523468f714ea5e376c0e8aad1dbe0ab6b674f5b98327c8f2ef6ede40 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e37a4545f5f61192caec55966fa29f8b4e5fc4cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d61f8442569e4bf23aaeca8b89127e513f6a7fd186f87bb32337d165f662d6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6955af329a8fe53ebcfca6834e44e25c384aa8b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3830a135bad9ea4e317c1f363393f3b9fd5b92fa70616abc443b5caff2fef64 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9222abdc93cc6fe28bcc22ee8ab541a748a7f5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50930bcd25c89b0ae445dfade976225cafde890724157d47a77732a5783982e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79ce107fbffae9e2a763904af2512c5fb925ab3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:825ecf1ba70266a54cf743d36e2378fd258ba3c136b9ab6920a6f26799e94b1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..57306e3d76753c98dd520d5889eab5f8905c4a79 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ceaad6e3e9359e31b8a3baa32eb5c9304d54448c2d206ff6a754ac57a78897 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c4f103d2ae07132b5bc832fda327617d73f3ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b90e017c8d4f07011c81aef95eac6f3293e3348593710e4b21b5a998a359952 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e140954837b0138ea10ba522d0419fb0b7bce353 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c107f0871237b3d77a9f8ec32132796cb0f321a3867f10621ba161ddee8a938 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a9518b64bfdaa740c540875364cdf2c5a6cba84 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbab8ab1249490ec935f8d3cffa77ef36dd69085e471b6af693836047d862c97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7e853ed9d480b8d920b0ddb42c1eba9d3d99bb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac35a9c232c138b64fb2cbd9bc904c671844ec9e21b09eeccf94f8d8bafea3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db06987e9d159b318b499a807ba4b10d788b6b08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e71c67a0656b66903fb48ca2e3b5d13bf212804f6d1173ec00f7574f1241501 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff00d3740e855909ab166e0c3a61912e59ec83b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea21d68a70809c670bfbd44c69c04e0e470e3bab29d09af618be3f8ad838f23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e83d701cc3c0d2c2864891f89040dd90564e095f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f755c0852e0a78fb4048f463e1636a758871f4c97398c326947aadd51b7d53 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..930add6e8dfff7e4e86d7a2f393c51652be4c79d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c2c43eb705258a4980b2ee55b3310cc3dd5c28b3b5a98f3eb7d8c060ede76d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..75863341edf2ab4a5a10ad744897aef0c1737782 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7db6282ab4c0b55af1696adcb1f23f3253335cec65cff5df49d4d3ec6c7faeb7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bd5a7a255d8cb3f52a88886387b890b7f7f5079 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8a50c76dcb56a9277d349a7c37fe625fd523b3f906840a5cf84a7f844e970d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..365e9d7fc430aa3858760308c43a38de9e4a1d25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50307429836eae4342345a0c6db1e9d93103f366a007be3bea913676d06ee72 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a379548801de6ae84d9ea50d394062c240aee3a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ac00babe6f5e3845810e36b20fe20e111062d366f8de002c77bfeebd64aec9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05bc3502f889d7ff820b1f031ed8d8f867e76f77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b317def04ed91ab9b3f538d82fd0336bcadcc5043338f030081aa3caed8286a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5e006315775c2ee348d59cb01964b3fc520c046 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c7cfa23c18e96aef8de11b0cd81423c67cc84aac2bb3f35e30e472b856c090 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0456fd569c56fc869773e28c04fcc478ef8b2d34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9339174b9ec5f030c450fb882f092c7aba5ec826cf299f4c4f8fdb2e3f6137db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a8900bf415f262e157873691259880c6c2f3514 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e45bebd0234e491fd53d26276955e8792536a25607c3bc22cdaa6d5b152eb0f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8c817c4eabcaa54e9e849d7c09d2c04bb314a89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6c0d34f4d07c853d731f28c8cf0e5a525d81775bb976c950d98dd5adad7a3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69de6a4c02df483c199034d59cbf2dfd2d5d5abf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8afeb4a6dbc7e68887a0d2e8ac33d910070df3d48b12ab6c626bcab5c2e49390 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4397f29d5248ef0b5df6fd55bd443b536219afab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c3dd8b0836ba35232df6c48209a2542c2d182bba039db274a4e1d3f6d0cb28 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0be6c59cf01e6052bf0e5e2983cb60531c52e85f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:750b4c55c041f4e29ec9a6d262185559bdc13988410f7925fa835cd2007c7294 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43b39e3d270ed0d3b710793fed8ff55721a85f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:252745ca6ba92344b4a9b06109c4df6d5bcb361857f3c9f7ce3356192d68939d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b32021928920b9fa8363a727c113f9c65c2d6731 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0401b704b1956a4b747c89e948a6bc38c93dc4ddb047aef1e0a50d5c3d96742 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc0db9b59f731509c275393b93beb6b44e25fbf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:883eee7595425794d01e4a051113a13923646bbdf04393d35115e9a0dc3b39b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c36d88529400952e327a2a2c3f89db026789def4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4042164e1214ea5caf17f77b4f745d4f8f0a937eaa30d62254f184172f98d8cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2699f066c93486b467ba51f7dd76b28129a2eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f4d5c3555eb5aad80f06659f79e85b2c324d518dc61f4034dfc0f38e2797e41 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8cf0dd7dfe49c6186d1f2044fd12258f7f8c354 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382dcd708152c25e1479da136ba513b471234593478996ec786fe28f97f068ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4b5b96d935e0e8d79747fd3b167fed819abb76a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce6b44b5106a8cd494d418176204c57e6c19a75c10138714214648cafa62e53d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ff6ba45bf3838da41d80016f1b9d11e094c11b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d22c0e01c3141bffdc627b4467bcd80d76327321faa83b4d097b84de1eb9258 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c77cbf060e6e5a18e0534030845a3d804b81bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9380db9a3ae3c6207055fe18f79be76295b0508d95b59234a42f974f96103d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f5590fd7b40a774309871047fca8943bde4eeaf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:878817699c2a828ef65b59711a56f6865bf5274856edc01f74a730c942b0dcdc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d9d5f06ac19327a1947c1198e02cbe83d0887d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18d041220e37688f46606a79c845f1ae730035fec4943d444266ee8d58e2d3b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0797dbc64c370feee8857cd6af391932b88961c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13e3247f03753faccaaa10c760f4bbfd47f6366de003a1e1318439e66aa90a60 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb2ee85026b41f5c06115f19e069fa6c022e2dc4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5a3e28030905a065cab2a8f03ff1219f2a29726f1c8c8fde6b4002f36a9d297 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fd819395700dc13d20aff054f51fba95316cd4f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf5698a125d6305c4eeb4bdb71e607c5f7e35fee446e67a64ac0d903f06e234 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03338c0ff3e40672af1cc5bd79990cc939834526 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc4a22448ef55d157da20aba608d4304d42e9103216f2acfedf1594ca5866559 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ede4d3a5ae79ea0c3a4e6e1f2433a12fc7e55d74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b4bdfadbd6bf57b88c1d1f64ecec9e4b13d7c4d9c4d7a4b0a893a808e59d1d0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbcdfdfcb65efeb01ed36e27b763655f99637102 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e82b89e9ef0bebe92da112997d9ad73358fcdf907537f658a09a08edd536329 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7cb538b44b4574fc00a42ec304cbd7dd77a1bdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5683e7dfc96ca8379e22a16bdbf41592dcfbd8454fc34acfcd04aa2032f2e2d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..61d5f8d7f31cda3e5b08e2e2ae723c34a4c2e772 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7d65baa055b53a260340fac59a2c44fdfe471ea4f0ac9a4b066080e834175f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34e36207086ff211031d4d0dcbe5224c68c3ae76 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5889f953b51a2d7348b1be49d8c465bead01ac205ea9e029f1ffc6439b11cfcc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0c91d6070e049f1dcf0dddd8a0041f0e4c8b72f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957b8400698f088c6b01d6780b830f1183c73e9a5d2b3a54db7cd4352a09f8f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d64c9e7e491abdfe84c3ed01b32c2cc33b8f18b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd66aa44964f7f436c80aa111f88f35ad997195fc04c76e4f1c5fc3256e1043c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb322d7c6ea08c98712030a5255015e403b2df15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f9b2bf403de01a2bffcc2b33abd621c3b2b63042c0f02d15d127533b8627ec1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..791dbb6f7032075d5854c2853511bc3f6132d1b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60645bf931d8e43744113d8c57d3161c48aa5e281d7afd85634af1b1f659b9a7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d053ba37baa4cf7222cc5b33a8bee147f2d7160a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d918c6385b6132667338ea0478f044da2dd514962e37aee7b1df9b1f10b5e6f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5b49b95f5667dcef29a3c229da79648a3608c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc7272e8bc36733726b7b6088629314aabafdcc6181674a68c6b6c2814babf4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e31fb3f6dbd648fa2fcdf8e77bbbaf0c25148bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81a057843980c1467dae8fdc9a285bf332a5b67af806963e6b709571a212e2c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f37a546b6504e429a9a24663de2118c9cda4984 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc01048574187d2f993810a4b450ed0fdf5afdaa4aaa04f38488e121d3e1dc8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6dbdd51647d0b64806cda25bfb5ee4c1140c471 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa8f1a569ccf1f1b2d19c0c78c61d4f2a6807289894b79a92e20c2bf2acf34c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3b4c19a60f5d206f7c04a7af265385c39df41ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f77e659d3d8a13dd2343532555d88fd30883fc2447437b4e119ba06d791f7db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d69f0850b3bd620e30ac9b360043954d90e0d97 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf6efacc2a031c358706a0e8eeab3665209c5931bb497133fb1080f9aa0c8634 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb7b7b0b699b070b5cc0e7acc764a5d064ebaa9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38419cf9c2eac61427bce0bb9d4b3513c5920197ce65898e110f65407fef95d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d91d054f9864ddfb780dd78ca1e506b1b6f589d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f7982df43fdfa14be477f2b6735aec424d2217f45192685f93874ce95a85d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..063bf8d480cd7932f2df9e73453d2d61b78e04a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb97491ff45b151911f8013cf2933283340dd42eab2e32adbda06257b7aad8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc5043d7201deff93828e03c6a5d73968ce89a68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5739b74c6cecd5cbaa4207f72e7248ad2840bd3c523e8f0194ac765b746b6f3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3971bac750cf53976cd159e0b5eab1e96945be1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1fcb2ea889834c438190ea97af0383614e400cdc0af5b1ca5fe81dc8f5ec90f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dc1c1796827329de1956a703b01ab0ebbde0028 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:709c20aa79a51e8b9ce4e647adf2c3a1d3a296453c06e7663411c190266028f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4553555ec79df149d99fa55593b6fc1c0a6d916f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4ea0c84122c70730ee5a22f3c34105eb21305f9b662b32355403180627f4b83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf07033195324ac5832e90bc74a3a9f8175de60d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5d7e799bc0248fd02987bc7daa75b4e6b51cd320cf730022a9a0adfce2f2218 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa7845d6b5cc9318177989c2330512cff2105625 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a07213bf6e52bf53d438a01612f7a7afbfb24da6909db5d2c7b7018a5df78ef7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2308c82e96eed0996483f3b9ba760e60f639c387 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91b7804bcc696580c8fa04210ac973b0a96259a26357bc3a6137fe8727756269 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb15f40d296be31d435ba015bba0c850afcc526 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:495c20a68c87395aba7e91a1a419481b14df6e43bcbfa7673bda984b7699ecf1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38febf2e99ae24a9656b8c29962f902ce5b21de3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e640be564ca5c96da77397ae682f4325c6084f3d809f78150ab48f116589c0ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44364a4e24c7e2c82d4e23a35d5bc67d3a649875 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:402aa7875a0c0a2cca4d2fa503f5b29d6c5604009281236fed9e82708c9a8e54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b910714fc855eda83f95b37aaf38b332a5c971f0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb9e11b81637f896ed733398ef3a809f38f66a0dc0379a6307b49cf19787f8f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0409398831ae92998b2b4be7162a9ff288f22687 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff59b6dd731e1d69853d596ec8a722bab3fc6a80e0ff9434ab482273e57e396c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d283968a4a5b5e256c99e80d6b80b01e464a39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a198388cb2c07cf46485980724e3d76ece7c9f493dc0aab28cf3d830e2be68 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b2b3a2bc74abcb15feb1bc2b4d39c8d716fa72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3721de7480edcf27eca75479726f50c18ebabda3da3b524702536138868a9a8d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57ead27749d35fd7910f6f8cee6245e2a639dbf9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7362d7fb7818d1eeea964d97645e6caf52e06192924e7f03162f43c2c7676693 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9981cc19361c40df2ccf8d2feced62f82ff1ef69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4267878b4456a0b37ed8f8594d0517659249d10e7a19e8120614175034aba201 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0944e412f236729b8be4c818948c2b062e68cc09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b19c5f9b90097a6148736e8b980bf2228f8ab0802a761bb6baaf10a0307e32ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f062e76c90d07847cb017160bf7007c24672615 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41453583e4279ebbc33ce4a3ab643dc60a72ba6bd97bdb89011cfdcd1012ffb6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4a6622729c43f0a7e8e60371ab1e5fe51fe62bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb8393b01c883ad5b4d4b2405039da47c34c3b1d44a68f2a2b2e64470e7422aa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f24b1762b3e664b5ad58fe84139e4ed2dd7a9c4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:744f7c9be7101f59e1fc305da0191a9a2777335a5c2c7bad68d8403fb1983475 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d45226293f3c093bb982c225fb99874967535a30 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca70466d65ba25757f9f4922697c122737145ebd29d0f9f9f587babf8a8ec1f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1cc8feca8273e1689782397ac3278b6925b2880 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab61beb1fce9f2519a243eaefa07eda9174b0bcf663f211839155f871eb45501 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..efb60cfd99e7b072f248ea16680910262402cd60 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2a39dcef1870bb2e98aefd9a0f8ea2a1eb406fbff2b357a3c7528f714bd5ec9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ecc36452d90c4c230ddcb06698afcc77533519d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e45935ee08ac6f8cbf88e00d161f9de1d38612a53c0e990357e6143f95dd27 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02b451b5d02e2f91271bbc07308c1a476500b620 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:723249f42acea0ba891b831a67ad0ade9c4e5bf4b31350f875b97e07dfa9e689 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..905cc859ebb6164b940553225a10c5ff173c5492 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48bdaa53720a19eaa2fafd8f8df1442e9bd8253ba30006f5d1fa885f9b1f6605 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5b8827bf83e65061150427492dc2280545e41cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:200ac4e15dc12bb9053164aa633f8d831d751141d67ed93962cdea391c2090b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75f93facc1cef453a3d0f01c8087933fa155bb00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc693143171d08876825f73e93e93a7614e5f4803db84801521409caa24f5fa4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f46ea459b96c21c54cdfb1fc06cbcdab59a6d50f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bff579b37bb7fbfbd453c2a4135838e704b93d0d554345dcc678383b8378cfa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b626ea6028edacac37a8d140292c5c06d24235c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3661ddc3dd1ab097dc32d1c3e778f4f8eeafbf55214212f0a99e01897d3af871 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5423a547db6e3abfc5a5245d44aa42b67a78dcfa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbb6520eed11d78444096096e6493ef07ba52517765188f74f5ad93d2854df2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5cebe77942c115a999bcea69a32e26edd1a15d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5614ac6f50ba46161795d49015805a4c1b5b22a178a039367d48de76e242f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d53dfbc2519679b804186dd061c31528898af098 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce056d2967cbd9a79f02cfe8b18b3b3ab53d8af547dd4578b10809e6ac76fef9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7515fb70cebbd0f6002737faba90188daef09b0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a4d8cdf0858b699ab0e95fbbd66abe45e62b9bac3932b7264256842481d3b9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9570304ada866d58c5db12c77592f1e990da2f7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e84618c40959969c875923f357304d849b91e396d60d2e97630f6f0d32add31f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f3cb1acd7e9ec8be6426e43dce39aed54746a07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14f23748234ebc584e9ccdb75e794f67363204812e7585ed2a26cc7ddca96e8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eef7758da22dbf3d420df793f60f7289e55c620d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50767013b133386d463d761ebc792c601b84cb527b6b3b51663999de0e26d126 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c123615010e28f048d432c7b8288b55e8703c87 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0f8697b452a6731fe48e8a4be928688cc1fa49a4d0b6c5a180c070d0a6f76c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebda49178430207cb35b5a4cefefb254f405d444 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecfe439325943f9c00857290043eeaa22e45336cbccc45cdc3a73680d9052b84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c934c847d3a86dcb1d8b815339d128672868cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afbc1d8047516d0e1d67d0c5b9dac0b2c65599ecf637142ca0f8f085ce8dc61e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b4c2621621eda80b1d00d7fd080c14d3c4d3cb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3248b4e72b11dd4a502063a23671ed54a7e8d2482106d9a721e30435cc190883 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..107872a4aa5d407332a844104e4c62c22a9d8a8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af432b376afc58cab3a2b978d60428070c3d4c289262cab1ceae71d305a1fb65 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac77ca7360bb4d98d75732abd29e4e811683a21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d63bf939545fd5a9838bc2b059b3a084a5b03cbacafcee6aebf3ffc6d9fdb2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee90ee712f5d7f1fe2b43c1465a33da8ba1ecb6d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1d9386b11497f0a74354a6ac88728da6dbec3c94ecc9945dc834be270de05e4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b6f37cf8aa7ae32d670fdd4bbe410d19236224a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca302ac4a1ac6827ec3d7a1b3f02c3b2178dadd7bb9a913952c8c9aa7c1f7527 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e99c90d3f575237edc19d08b661b30cb49151d31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53947bfaa6c83abb9e87831055fb31784779716ba3f6f2a4ab9975b364983bd0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba8b4e2e6c9e2dacdc8a37766a63e65f770f1fef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98480b74195ba9a8e4d0de3faa9901017b7c18b0815ad53eb556b655ee0e26c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..017b0d72cfb2a8848d3e14c2384a72a3c24fac80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24925a3d3797be10d9daa7d479fccabc474bd4c1e51d064f6f01a9444432f7c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..addd40c54fce1992ff76908a5e40872f5dc5ad6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5460a815ef807c8be551dfc584cf8aac05e12368b6302bf01304e6f3672beb92 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc3e98b9f1cba973d9a01e4630c70d0c96193b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:014e064ca1f672a0e472503a0ae6abc4bf9a8411217252c1df97c515f3ed29ba +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..76bebac8d54f5a7d4ffd7cdedd2a22183ae4fb14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68fcb91e5759579b955e198576f638c1675b879fe3fd6cd69e1a239f9df66fa6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..674e4197e7b38e09c0f2656c3c592a3d842b1b0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52049441b48cad5f1ff6a4548e87fdd82a23dc2dd1472e3dce41e66349f1dab2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0237b1f6bf6d0690c496436fa54230c90e05489a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58803da78e8d4d44d918360e19f90c2a937738d30c6a926bf9d65722dc7feff8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6de9be40963c14ce7053d0452c5885e4bc58256a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a4c7edf5f25a51ace6c6c6c6dc238de8dc030848082874f949922674c80263 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3879e91e878da7436796d9e5acae420f3d6c0648 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a32db47a50d9055aa8a307ee2be97ad89bdade9bc2286146f9bf483c46738a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab1e5cee655d5431ebad86826512b9c9929e33be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75210cdb091d1cd8bde7da27434b7d4de54b907b08759c256876685c5dfbd74b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..07f48831d5d96c2f50c8774ac908fa8ea27bf8dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e8fc91c5a4f31888b8a1f3f0bc8091e88f6836be2491b89c7c389be2964273 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..142ae3a6d11ca86e3baa9b35d3d1202dca003aac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98bbbc25aeb95d41da531e6d5659a0f5c2f47376af12b16414656a137a8b0f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..badf68a6328716c28019e156ab8f5854f015bb26 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3331c9d2e1e0e02ac906cefc3084df1429ecdf4ad8e9d87973016f28d218c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3adbf964a55be6a9c07626a2b2d34d2f0653446 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15a5da3f989287b6ba55459d1ffdd5714bb6bfe1bcbd75fa0d8df3abd6062d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..430605861d8d30eb830244096fe12d4bd8ec11f8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:832fba36f91840f0502c0d796ef7ce8b0e7aeb66861e7f25110daa58a6da065c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa0b942f307fa59ac174b86edb56f85c0490b611 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8ada22d772fb4c7c707e92dc4aaf06519fda2ddd2c403a41d9e574a8030854 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cdb063a6a67530620059f287a6dcc1d218599dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eadce4edd4dedd652867a74fc02a89d5941c3d3d188a31880bdd69d751be590c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95aa6260a9ecac34ee1c080bab71fdd5cdad4263 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86fe31cd3987f9d3e7451c6a31a4cace672133dee7f6740fb3946dd9a513d4bf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c01de7e4794e4126b717d2c3862e4e173aefa590 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954d8b47ce2a54221b8e3f59e0ee474b530de2b0ed1e4598346cb8da172d0b18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a88788b40847ffce7c755c4521b361981780a14 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b28a4d00023b825b99e3b88014d691934339d1f98496d6038c89238253f14af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ecd5b651f2521208764feef8f6d72f1affe5548 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce01c5686f7684ebb9b4ba5c91be4301a3307b0d37fefaab76d89e115ccf37c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1885ac69b804e6e78e1f4195ebfee26d4d5bde21 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d38096159491e95fe507137afa44b46df98df71a644621d4df69a0b727030c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..74ba3d8300b3e7f4791ff96773f970ea55e9c131 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ba271510f0388d1f35256962a578721ef00202c4e67ee99a93a25bb39ab854 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2a623a39f75b005fbafd03a5ea5b4e8bc36d8aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:930ba022e1a3d13c21540cdfaaa8a9f6c80e5217a3f7dbc7281e2a05629a0ddb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..18fd328ff0f0d46a3002155ce52f0defb816fb68 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6ca4bc45873148419d9fed3a70c174c3291b2cf32580ddc927ca0a99a4d6322 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9717fb8d989b3b33e6468f6745b7a021ebc39498 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ae6f3db1af596e78fcb3de4b3a6e9831bb85241e800ccf4e75699d5ba67ae2f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0858ead49bfcc68d613f82414248551a137a913b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46791ba0cda7c50eb3e61a851decb3659781e5f2e7b7ff3a5fbd5b5072dcb2bf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42d5478d713546eca9e7cc4c2835bd2e45cc0f8b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aaaf7a6e293b6497ac073abeb6bf8087def54145aeaf8b26a49fefacaaa4258 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b50456655d31ab25e4aea8782d52899d25316ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e594b5af572682eae3d9b2ee19d05268d76cbc089115b2929a7d76a2e72026e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e23225aef72ed55b601aa33b75301f275728ace --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc8f0d822883226dc4c6a5d6c1615d14d0bcc7976112db8eab7146f5d13aa4b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdfed2461654304a0dc78ba8f150cc9d0597f27a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65ca4490b81cdba462e93a21a3c7e0cb05ab2750b6d8a46c6f74c128de914cde +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c8089960e83e0fc3c4e5003696ee48da11222f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30cb62ac7d4a5ff357dbaa31a56330dcf9500c704e5932c87d557b99ab67acd4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..65a253eef4a7502801cb7580ba61dd997f05935e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d05aff2f625efd0a62850285d1d102eeb3fbe445da215075b15b6b27297516c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b8bff42ec7d0c356a4936b09a79caeffaf991d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4988eb5f9b9de260994549ca8bf29bd470925d9aedae255331477e8bc05ce9c1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0210276aed4fb2717235a3933523ccc3936d0378 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeeee340088c45b615e4a93fe48817b01d6cdc6ce57d509d93b43f5d13e67662 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79fc3d5898a763a5c6a8ae28d885c6db91d0ab06 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:475a23be5c2aa0a9a6dac30fd9a25524724ae130d5bc6a425097416bfd86bb8d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..557f312f68c9a7e9c95ba2275c8c59bc41351895 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378476f4bd6c31db58dfd7c56b745f84bb6098c045ddf01bbd58fab58cd3858a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..181e0585a6ca4305c57d49876f1a05fff3fe528a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35b7e31669429a9587806d5b3597d3c8ef24e0cc9aa8524d34999efbd4811a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3018fb189db6ea5e994deabb72c674ed5f420a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e447d746063aaa049197ef8767d86ea17a1ab5368abc4782ca7735007f0da93 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56f2c762da005343d958667442e1c2a88194da8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f430d7e876633f91605af45d1cc0897b6867e7ad86fe338387c3a95bc880344a +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cd1feb98cdf2a6b9051fbdff6884f7121091e04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb317d8ab7595f56114094107e48dc3ac7c59e83b2b73466baecac4892ed79fb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ae8ea3acb1fa21b11f3da6e5e377636641c472 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e38400af26a59fc06ffd91623f6fea5a4d1b08513a7f9b08922a0d997972081 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d89311e708adaa7d02c57a2011b0716260228c75 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b722d3a7936cdd51d5c9884e345eadc0730556d3ea45dd27ca74cd6e635175f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbaf8074f2ce2974b530d59149ebf7e97ac9db89 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd6ff066a83e09514a61529678f732c0e081b8fdc67a05288cdbdd869a2887f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..691c7d7814822d6f7108e2d277aa7630f74febf6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992d08019e975a593a39abbaa0638ba9b90613ef1ae68539a4746b70bc79405f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d08c9f26318bc24139079629cec72cc541f6732a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c44c5916ba05e22aa82645824c92ca338fd1b9d3df88feb05d932d61dcf5c12 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87cc3252677de627797c158467976ccb43781bf7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e851a73d65f29498f14a25866cbd183c2364f4760cd00206fc6184d7feeca16e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..468d84f032867c24a7f1617a75d2990893e99740 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52dd9e7d22f907cbaae093e2a876fc3851cc844d421674a67db3b9a217a5ffd4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed4ab3331dcb0674674eb186c85d8f0ad3fea0cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f7d0c5d9ae62b2c0b0095d7ecabfb6a64daf8f80a1a8e5890d6df4351240a59 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62a45e434a2bcd166fabce0500f1a551e936d2d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f3906dd040d81fc9b1d442e1695f6cb6cad3762a6b6720f6385c56afb317649 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fb974e3436bc039560d6ea3a134c799c403e32e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b17f8393e582328267020fd7203a1d05f8a7fa81f53657029af6256accfd5da +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66bd21350d18ce6a31b622855fbfccada0b1f4ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46135dcd1afb0ed05c9d3746458ab5a0cd3cc1fd2b3085c6b9bad68b6b7077e1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..24b9ba50fda3d7ccf4e1729f377f95feabfda05e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f13c31004d8460b62709401ff0109203ea9afa8aec0f4d60c0c6bf0799e6f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9866b5265439edcbe03b1fe10d811fc86d4368 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74d084ef3664beb753555691d64405c5fdbe6f7a90046264a197379db6754652 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fd775b4d2e98b93287df0c45e10d0d0cd779a07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:139537c5875ba3f9a8ec51f1f943d95dfefb43b873514d80946ca9ce818af5b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c4b0688c2bb1db0f76eae1cee21fefe9f873534 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f5c1c96394cd9c0c5ac3022720e3989c3d1585d94b6050953ebb7c5c857812b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..00a9bf80a505123ba227e05c4d36b2c9c89814b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64dcb29634ac5f2cc1f07f093b8aa91e00a588fe93079fc09e325e2f6d99113a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84a83a35ba545c096d7033aa5ea521c79fd61ac8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5b61751da03163e98e1ecebb58c721c536e1d2dc7d55d764d387df438516bef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9dcba8088f416563be3841533b5558d01c9b32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b62a3f8711fa4db630f929720266e1543a1d3c5f8e6064100e21496020ec267d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..933c520bffa344e692ce58fecc7ec0b48229f9d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e80d2bf500f2ebf8e8889ec60f1cbeff186530d857a7f962c3666a1fe911927 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dae4d551c83b2130d4e657a470720cd62bd7f178 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39921ad5136196c77a4b92d898d2b1e1300f1b60b7db0c6bb0b1af87fbc7d596 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f4115de2bad0c0ae8461648e95152a6c78057e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b6d4d1e4b80962f54d730df1a93da0d0ba2420924f360ac7ce7a49158bc825b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e06fc3ff34e76f0b2568991c073315ad7b194f77 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ede1189e956281739ed5a95a1015efe6617fcb42ad30a2329718802b43d9cf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3386f4d4c5583fa47fcee0133c7171b04834bf0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f9bf85d29b45a64f6cbbaa8af3b9d0b5e8035bae4ef8faae1c685f85aa80a38 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebdaac72dd56cd849513f70af497f16bef1fa02b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144db7077c7bd3047e98bb303859481b68d9e3e4e22f902427aac1a9a10968e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66a23a992ac1dfdcd5134e37d4033e9cfdca2d56 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d463b71b04cad8059116e6bb64e91b547f8543da788d02169429054c064015 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ba173fd4bc9fd386cdff3fedfba812f607feaec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89b8c4ddb7309c7948c29389c0732e7d21b12f0958bfaa3d625ae81374e362f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a485053b3b029c10b2e5cf8bf7e8f42dffd68efb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6b0b4d724c4ef4c98a491bfdfdbf3d40b6d39175a9e2e091bd216dcf112469 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..89d17bb5ba7b187ccb035905aba57e7e26fd1626 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b78f94c0136fc4c5668505cc4cf90d0c526b1da7bbc92259b36d5790f1947df +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..381ad61f8e61af87386707b2786b6f9abf57b5ad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f827c8e133e405f409993b16f6651df2a9faf4dbd51ee3c03bed90575575b6be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..424a706908d29168248dc776fe64e0cd57e7a3eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ff2095b4520f7dda3726154d329c115e0eefb3c1a81045eea0fa2027d96ee84 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dd392299a476054af28a62de7c765d9484c4410 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2b7c7f764ba8f03078f61ea8afdf74d71a8607c8f269ee5b5d1427657b1fda5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa76ffce7037bfefc93bb27176e937d87670f8b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166ad6ac49b432efef33c69df4af4679f3bc72a8b374a89aa0742f9c03e5328c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca50bf56b18de969b271acf3f4a393774f006d1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_11/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0047b10e98116fffb57e31d342571e519c872d1db680f35a65807c01af08d00c +size 11395