diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5565f061a296395a207af39d6f34c9cfed1eb931 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a9511da3b259146ff19c2420c69b2e6b9bf77e72155c8025770bd97a174219a +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a468e60436f675ebd340325436cf1d51a8d2bb1a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b59cf216aebacd3d79b358eba73f0fbb3fbf1ce5bf0354479353e0e05100281 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde004490f8a2a4d1f4b4f5b9a873f9c1bc311e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621ecaa46bb5198e7a987cb0556a44c47d6349e0051c7c75f0aba6a5fb523daa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0fb197c6ee94490ad6b91a189514f0e15499a0c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb59f3acb343f52c7c12c18be23790ae09bfb88503b0f5148ebfd40d1624fc7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f336c1e6048fbf8ec09c6508d5fc70054029e8e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f740c4915269d0bcd6aa75850aa529b3f4a7e070b930b19ac6073ee2babb0d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..94db89dffb7395c8113ff4d9d8522ed6592b6fea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e704537c6a4d2ba564653745d1c5c95905220aea812f819a836c5cf8b259600f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb2b874a2ec82de5abf1817c4db6fbe201919993 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44fe1cab3a6b427cd007a8aea0e70ba4869b1d97ed4a5d09bfef82f43c8aade6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecf1caa2b618c42fb6e0fe2bb46d4aed28b262f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad9ef3a2459fba851d22094be890a7aef5b26af9ce3abb3a3b1450db85adcc38 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..646c79dfaa0e84fdff3d8caf1afc65350e47bee2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd86789a4604e0c61a4baa3722f03ad43f007ec3e8e5739afc9f7d9c93ca6b88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37aeb8b01fe076f65d3e88331342dbd8d7c7ddce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a1f3670471c318249b575789fec609dd4753fa1926fb5c846a302076b47bb97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7794da5b5020243018ff8018fcea06d24d04942c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8ff208541a2402b3cf1824c06758b4d7763e5c4f610c466eec4d09510af6354 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9c5b81308877319c29dca61d69e70650a1de2bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c80cdac49863cb04370f2e181e67cb9283756f6dbf66aa889677879593674e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea731a7627559ea89b3ab5dc4ad5d9667f09349e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d79124bb599224870df4adf324d36d12b193ff887bdde6614fc32530501f62 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0906bc5a233afd12e5c83d73a4c0d3e2a25f7bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91436fa7b095e225f8690274a5da65769c3dffde4a921deab5a47d641907a55e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31ca3ee9413398c15f2777a916a6e41787324c6f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7a412c6cae6c96abab4d8034777cfe6ca9dcb881114a42a5398e62fbb679be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce7dca3a6b3b9ce003ead90c1478677e7c82baa6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56417683286fc762a110c6680a25c30dc81bfa83b207aace421a7c3fd5d20403 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7065ded2972140c649524e824a6b0ebd3943d02f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b80fde81daec10870846379b85a20fbf14351c2566ee10d3aea632f1a3e6882 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9c17df58cccf3e98ca30aaab9fb52e89aec1616 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a31c0af8e6e62ac12000b96481acd118748d1c1a6f53bc5ce2e665ee33dd3b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce542153aeaeb52b7361bda0ac2129d554130032 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3652005e2d2f30c898e52098a545eb07e8be5172e32d56dd566b02e677533a7c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b890957d63590ed846b71a8dade2692fa088d8ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ded6a8420766b76c9663348c4056b01f0c73a2c663eb12b3b381be514cff55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e1c5d488caaa0d522f024514fdd3cdd7bc66dae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc817a86a39a96580552480752248435479a8f456ab3ac322d05a3284b62ba8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5c7e64d7fccec696463cb3db1cabe364d498bde --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79fe113c1a9a1bc52f200c15913820bd7f2261831a8a517362a3cb420f1b3250 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..99c3fa5c63dac4953c07e00a926a0efd25b1519a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3321a37694d33a193e72a68f44b505c5a6a4a9e46e2f2e95840b2c48b324345b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b502a36ad3e888cef4742a0ff82894647681f968 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:813f1f7e6d075756dfb66e82b1198d1131899e9d4dafe08f65fec08e792b8638 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e5aa29342fa0dc58924639ecfeacfb2339daf44 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e11ad8788f8b8ab84dee894248cc71ca871b478b93326105fe78d235cca9fde +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69cf4d52baa36da04e843217a1675ebc52473392 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ea5536a40de7592a3cd462b1ce7ab52427872ba8994908c0998b786a788a1cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82c442acc2518321e533e18bee443fa81f415a04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c81d7758609ec1b7574e385dee2077e0d4e79da56089c9755f752e9f078d0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5cc50b11e3ec0dca902bbc95310eb7995941bee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c8f5a654afa4807110980996f711bbf6a90d8a2e39a930cbca6a7a509a9fdf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a30f7d1f8aaa004357e141da58354f84833b048 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f530db255cf20ade993c3b503b9b52a1c1bd6817615b8d18d883496284dd8b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3c60f38aedaf96312be3c511d3d44f9b9c05dcf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18a120979e4bf7620fe87ecd6a7000ed7fce9cb683826a75da825ce65e825f8d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ee7e3710b3e1758bffb36c1197b0f460506d5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:758a09eefd692c4c9f4b7072b912fe803619ff59e54e235908f57b0b47868a33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10ef72117bbecc22226dbd9fbb4d6d17efc5d2b1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd6cec0b2e642cf0f1bea0b8c875dd46c59f911d59053f643b15fd1f03042c6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..49888aaf761602a8281758771923ac19da5babb0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b41a1206e25a23d9bdcba6eac5450e898fdc402e27adf1b349b065bbc066ab9a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d14470b155ec03078e5c24c228579ca4a352b8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa33b0f888f39e9fe9714ba292896aab8a83214d2eedadd02bf79948ae39233 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34b3dba3eae2508e248cb343549708d2fdd0568b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d39c4a4af92d91acd60eb7d85384ee3ae24e6259033f9b842dbb9b9221138257 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f8a752e1c2aed5bdb65cdc8b6f04b0f597f9c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af8a9d66ddca2f80a9c9a95d0f14f5103010fc6471f66bbf1e82e53d06d17637 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bde59e40ee568aa6a85c7ac7462fc42eaca3d921 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50fb8bdaa966ccdad05203b85d7620a3f4a1df57a3657027542bb8fa04869f23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..416da6986bccde14d65047b5260419ff731328ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d1376ad05aff70b193f7d8abbfc406fc844217ceb6c2f10d5f3e33da5366b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e4c5f0797dee24e6eec5851260dd54dee506115 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e8181e47e52f8380114b6e34f60d8cb0d05e0f6285a8a344f3cec099429e5a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0cfb3fac95103906865906734ab5780b7281d9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb7678b69280e7ee14a8a2cddd6a9d3a94ac8b6f13ee2fdda63c6288a34942cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25e46d8c999b7749c31ea8576bb893d9905e228 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95e4c34a831edc779547fab7c7a1b369f1fce9c8347b36fdc82382901a51b882 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c63f54695aaba9817066bac7edf5b0795d068c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad74c0dc7a2f2019ae13664032b9f7d73b9bf33a462a1423f7a292517ee77fb0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5013b70fc9d8719b72028f4368f517bf72ca73c9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36c16951a19dd7983e4c0d6ee50d8d37b02af31e1bfb144a921a6821d2a445b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b605389806f7a90677752e5865053a446c261c83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9115f1d92b982b8acaba16135cd3363a226ad4b1fde3fc15275f664ee7175c7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46e302ac2358481688a4cdb94a30be4191e48b6a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0eed169569285821e2c67d1348f98fb1fe3ffa4ee29638e6d3cee0c80df7846 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb8a9e1d54edb9ccdcf2529f1b4cc8fd2917a5ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e9722b28c12e92cfcb287e6c06e250fc8438d1bf39b77ea1be4961c250cb7db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf1736eb6870b2b4e2fd200fda75a25061628df8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:124f43bf760c4d212bae5a4b689b87a405d91d8b21a5c1179cf40c0dc981d6d3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dba0bd64db4f611a76564a1aa5a395610e06d803 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823e16ab7fc164f123a367f3d4eba12e9031dbd60b12384a239f5b4f2cefb5a5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2222923355f5857524e5f5169dd5debac0a793 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e21077cd18e6f6e70a89fc8dffd96a78170b0cd9b8571fe27fdd2fcbfd1f34c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..adb73100e1a06dd92a761b14fe31521745818404 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ff089d7a99336a219943180bc01febc4863ca3dcbc32d5846ba44aedc3704f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bf375fb4ccac2f854dec0c139703ce8dc1ff5de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c93b13c69b982d53851ea133da23383ed374ffd80d9ba0c71595f386cd2c2f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dbcba7d4868a8b05a2a1e388debc29adf640542 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:180221e79b90d7834bb9c226f610c0fd1638d05b22c6f8296efd880512eb3e10 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2709421bfd22ff21cb2e73711ebc862cd5beda2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7012e59a7d00a7429def672ffab98658e4d94efbe148c6617ab4c1ed10f2e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1e53b3615453a9bc44224117eccb442ddd70be3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e9d40f633d9142b9f32e87ae1d7b3d28dfccd3523c3b3cb080f5492c824e12 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1237e2d3210b9960af2d6fba475b536aca27a73b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7252fcfb7e07ac5767fe71595ed2b32fa69e4b06f374808e369123570ececd1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..02f450bfd42f27caf63f91c085a837225d7dd894 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5ef283d5c28cbc4e1ef63c639fcbab53cba76a95ad4c7286bc448086e715de2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..450853d147b75db5adde5325c0f170c4f50b94a2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7449c2ae37970580dca28312c817e6a1fbec61d49ef83430c89953ad69d00d00 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..418babd683d467af6c1453cf75f480c022cbff37 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d7208b024e11428bdcbfb9fdf8395ec8134e364576bbb5ce06b691e2729e2e8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..356333cd0d1c94ca8429ca4ffeda3603031da9bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ac364d44f79ed8ebb8d68727e744b8edd01b4d4219f3f280ade24cfab80c44 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..45d07ea77201f80778dab147e8b51ea6113f5ed5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f02b0e243039e69e9aaed509e9e19a482f20949243bc2cd7bedf34cc249184c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..876728945050361bc2a8d92dbb3ffec6c6ceecb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ac2d4564bff180107fe5c564130177abec8527d14978888ef6cc811173e9c6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e44514b49cf578e3527a8c4bf61fde9d405410ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a2493b26b52138111e8c9da815905d9a5c1e21e9dd45e59b1bdd74d8c579076 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d213e98dde3ce20520a1d9d80a909ff06b1657b8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb92eff4480b9013b6057944dd16deabae4b275f8e237f6ac3e4e69f50c4cc2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77579e170db430ec034bf3540ace479c0729db34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f015587cdb521173679f3e1f90e2d0c1b29780ba33e0aea725a01d6da977ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6e5c89d030f6329097e44dcfd0c61d27a827ea7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5101a916b8e3ed134683696bf661d3b83b41c1579d95cecde4bf8c45f951d77d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c822e996679ea1e176e985172b0fef1bdd706153 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bb2a332a5d66e03ee1112ca30cbd9d620325b0f4df4372b93d3972832f8f3d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e9e3a953aa1a0d5dc8ba574d75681a6bd501c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc622b8f47601d3554af7ae0980c3e770073e8ed2f072691c7475fade095159d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c64318872952ba4114baba0241078c43f2ca92 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f99bcdde5950a54d01ed1e7f7a00a98ed0890ee342d2af9da9ef4c2271ccae00 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda3aed99333e569308ea384dc28464ccefeab98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96cb91aef89279b06d66ac53e4783c7dc263ab8a4eeb3a61e6208b702e7bda5f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbbdde5955ccc4c476a20ee96904cd1b7a346b2b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b182c69ed8bdd52b5ab9e5468a5f2297fd93da720a5162a9562beba3cd400cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8459ca0cfa11f51d17f8e5ab9c367a844e3dfa5c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed926be479e29277f44d35f530700d5a7fe7ecdf2ba3d9d05307c0a232a87e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead4e337fefe641fb0c981e8fa075193d79464fc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d13bd6d9a79d232441fee977820df2210ebb3f1cc31bf67f4f5d8c3371de247 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f45bc41350159ee13163b55150c3d882ba4635a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258fd4827fced8cc7b57768f62daee5b4273d78bb422416b7de9b472674f2d20 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..54447497578bf00d9397384dd0c22d25fa32a4b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b6c5a467f710d54556f12d54f77fb11168181a5be916c6a15177a1dc0a9c78 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3837ae6839c7b18ee97f097bfab48fa17590ffca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4415bb47b9014ff1d61a85285c0c2c6483cf5bdd7c43b85f468b64b303a5f85b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cec7381a05977bb916840d0df7202fe6773e7077 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaaf478b4cc159304555f39abf9f84bf13764ac0d1adf7b50b5b9e9c4c71b791 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..946450a55cd042044d31671206e849d74dce2405 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:141daeb19dca74ba6957dca1a715a41aa5ea08cedf6dc16cc482114c7f6f4073 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d7d863ec9999cffd006b9a515cbf0692fabb4cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe3977715008292fc163529446c0388f0244aeeae6b0f3d26a67db84653ed3ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53d50ac5cfd118f4b4b5563e1b90d166bc50e601 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49e6f666cedcf3819ec04e186bb10569e29834d0635c57fee869d44f92021db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ef3a211b702131b37a72cf1823d3fa5bfb0746 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679bc8ed600ee7eca9f4171b8d15d4c9aab08452014f9048d95225a46a5cda7d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe1d66e954d13f7066626b6b507047cfa1ec2f7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e38da016dddb809419ac883dfe1175f71e7b5fc818164958226c4c381c060ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc872089da3dd8af403d31bef25bfeb5fffb2cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31694c4dd2a1f756e5571da2f8e9ed267cb99efce6d48a74bccab30bb40f7332 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8965d1657dff063592a234a4d6c2b0f99030ca27 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c61feab06e39ee06a448ba795f4a2946468ed5356fb99f3a9e7ad2ee8e3bbe8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ab42637e6d31ee63566eb5b5287b78e19d15143 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4dd9ee9231cfc57ad9be0ab904e2c187809a47082acd103585ad05aa29ba32 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e322bee0e06c1fda63fc6bc22a31646bc254cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb3cbb34c8a3c015d19a30816e16ea671a63431f3fc5614a5a7fc883f8c08b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7452499a30cc730f6d020da4248e0fef03b8b243 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd9ca72a41cbae73af0906a2a5629d9800f8706941a984d239fcdc2e6033208c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2bbdfab93d7e4e76ae699b621a0ee0cba4a3ee4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a704f4ed05cc81ea864dd2a97025f440b0775022ee703b49049b9b723967e33 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..932736c566084d238494830824e0406885936ae9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8daf852607cfe5fe6d98280eff1ff0e229f7b4e7d2e1116e77663da1287c3d9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f96e8753633500f918472a68247a40abf4e8b99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c0d5d8ecddaa577cf59c7476b11fb7daf86d1fbaf6e4844cdf009dc07b4be4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e40c7fa7d41c30652ee737c696b55bcf5c78fca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a2140898c25bd826c737e1f15f89ec9b5abaadbcba797e99653d9258ee7cc57 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a9a6eb0226bb150eb42a7e2668e09fe7e964be8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e2350f455bc8357063627e1ee8116b46cdbc31d861c70bfd303be70576b48b3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d511dfee3fc7a70c92a72e4b5ee88f8ae86931fd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0156b080e1ae3e99e231008227a480363b7ad91806cfbd3f48f367798b64cfc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53db55fe8e937e758ee0bdeb68376f4ebf231cb1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5a054af78ee34c49595c7296c5d12a1ef511929cf41f874b60dfb3f0c2a595 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f95ab7a8ee9335cc4f0103cdf38c7c456aa37bae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98aa73845cd509dd0b3448d9d5ccf2ca0e9135bc798b9416e7293df8f1f5c4a9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..375f62dacfa08fe74a20bb338058f4b42753e4de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c505f724dae493d94b0ffcfa4314d46660b8cd463fb0b90e8ba09aadc10edf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb393211d652cd69588b50ac35742fe6487ca89d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26e18c97ff58a808f3faa965c536466f766234f8b7ad8cc56f678e010ff59c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb872a46d78dfd1ea5c448fdef1fe0feb26a5f69 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ce4dd7b80b74fd06c7729bb1e8bbd0dbaf7ba7cca484f15e9855def0a15b07 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..152a4d333935ff434d0b0e1a4adc751532067bcd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfccfeb865bc5bee67b0f03d82d132068618fbae3ed4f79d8803c5e41ed2a24e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..370d43aa2f63afdb27d8427ce31aea8b03e8f222 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ccd1fd544075c8a36b319f681b43254900e89f6fc065f5c3c828f2d184058f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad28c82895f29d3360540d30e83aa636659a7f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b65ab61899944c5f095ca9642b42ab7cfe3b98e8a6b26d49c3c01716fc2acbae +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82a2d1e9daaaacb7e5eab577dd24a675388e1802 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd18cd1de42913bdff634f4836112f090b2086270b6690e837446c36530f08b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb2a08891edf89b88524467c6603a1944156c4e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b04af7d7214193746451d238ff163432dfd249587aa65090649a453ad084f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22af541137741f8826fdb2ed83283b241378ce99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dcc8864e6357672bbc4bbe5425810b9576ad6d50a7a267c428998066bb3dca8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d34776f90d9d0419a8a0f29a368b6fe2d008abd9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56675149d732a4234c50ef281afb16bb71d8c0ba8d04cd61c820b19649df1187 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c43499d660513c13424b338a0d6784fcf0d09cd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef446f4952dfe68e6778e65ec035167d2ed74460cf9477212db303a472f35541 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f253cfc245ac4fcb3db54c0f68842ca8db475e3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8fdd8f5b9faa7027f988bee3a1ae9ac84677a8850a6e0c0903a3db6070954d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ea7ea99bb56e6c9be920541fb26feeb4d4d6990 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2564b8e4c343b684d7ff8fb76fddf11eccefc0c28a33718a9557b5b6e8622257 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a98e41fbc551c82e4fa458182c4efeadfd07cad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3954b592e2f4978febccc10de537e4d313365267c3f2dfc376362c5df4f2b238 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3db0dcb12e9039c453c0077c8df66087751c9188 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f5c75026093227959764b3b4ee47229b5f6e54d5d3eb0cf0bb1d5a41adaf66f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ee851e8568d12f57447f92faf7f4efe01982d58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d1ceb786979dc6cea2efe865de066b620d0241ed3065ccd7d825a46db753ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a948d08168387c46d4e9e1a88c65ad8111b562 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86866c7b6660b9cd5d7f52c49a5cc9407474838aa562acc61b3c68165ef6fd8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0824d29ffc983b77d620f62c628d42aa710be924 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5c32c96ff38bebb12ea938f9ba1af737434d8ab5e9b21e265ad0c531baf0c7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..faf73aaa0726dcf570a91381d63b65f451d05ab8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bde38f0d6854d597b29e1dd20c2ebb3f8379d0c6e29a0907d9d05c0799591e5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8479253d3c21d6f114c602b062a31aa8786d4624 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51652dacf3bacdf8e6a431c75659c28a27d71afc48efc93a0961818c21a5ddf0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7399d17b058669871e8bbf304f587a8a0e2dadb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed972280e56a82a8b3f1fe23278a88dcaf83c81c160814cae4efc38f3ba89a33 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e4d9e75ff4c9f4a9b073d0be36d55a4e7ef03a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4559922f0d000b63079f8306a6bf4eee1fe09e272777637ad4e42e5253e1fe44 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..439f3ef698948534d1894b522ed21c0764187ce7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:823097dbb294ed4e5ccb2ede41ef600ac72fcfb1718056762bd5cc70d057f7e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de7364edd278be697f82b6804692ed6bc5ceedb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fefbbf760ea03e4741040181936892904195a848a90639243fabad45f22be4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4bb193a2672ec3136d400fc36627b57086f51d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c1e102479fe8426930849192437d2d05388ad477564ca50f7de457fca89bd44 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..108ce98dcbb2c7cb620a9fa292e19b63b9ceee82 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f950217ca70bce9468bffe01d861c33bd895bacb0c318bb2a4f226788940c3 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..feba9e5f0f332ba26592177f018517374615c910 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d58158a18358faf2d039854aebb071147e1829a27291a171330e45c2d262dcf2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42806a4c6b18178d37f9a7dc293169451e13a32d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050faffd563fea6b7559cfba7abc1cf1065903f4b894bb638126de87f1b27bb8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caed65f83780de6eaa3b855d6908db24ecbf8f46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98dd6d2cd6ce07ea1c538506403fc6e82d8abc4b2a8222ce3e857801d3c9c9cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7156796ccabf5c50896dbc4f077e97d066bff511 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe5a99b709313a8cb39840fcf60ab0abba861e1c6ec193cb72805fe7cd0743c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e933dfe0de535ff8a0edbe0f58ba80a17f34d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5730c6d1d928c232e37b73444f75645832a1b63bf9275168a195d41f54a35db8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ab70a1b9b5d11c6934690c5e7204256c5250f5a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6aedd235cafe3b1b2c32349b402e5c0194ea879ab9270135b2bd4eb7e27fdbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d57c9eaf6416eda19819358071732b98be43df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:089c6bd3d0b435a67ba8107fa7ff3c11c218d1669df4995739824be202deba64 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dffb67d83d854b447bd6ebbb71e80ed2e89d13a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d89879e54feeb65764ee341995d69a35f43e33fedcf9b123c3229aa5b333ef43 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..816ad4ed7bd1b5ad3f27ef244ad37853cbcf9bb6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9431d6e4b5328e52c9346f6ecfeaeb1a87c0d2863fa9c992c2e122647504a6cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74f777d71b39d3e3aeb12e20ffabe02644406ec0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee38bfcb535f49a52ccc572715ba9180e1138e0f300dc128a12f0ded805cb9b7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4558b8daa4fbace25be9ea05e95a49f902a74946 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e42ea91bb5e2a34e9aaedbb0bb870b0b228a35af0e0eac9a4edc4770b0640f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59932cc41457b4ea4c08868dba7d757f8a20fbd4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d10bfe3e6374d5cd93ae75e2f0ea89e8204111bf8176d7e41bb7988fba57a666 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a861edcc7b70039003f6b76bab7f9c0d914eada --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec9085368b6f2c9a8011fa43e426913ddd8b377da9d3e31cfd4aa5b26a417029 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..544286a5cce481ccfbccc41f5a9eda7355b9d089 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408e9b4f5f42fbb7c80a70240eacb452df3553b6ffa11b07dabed5ff66d1e06c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ed8674de0fc282d2c23107f2d0ed7458972b9cc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71976ddef9edd330910a884e8564ba5441eac053ab94c736afc9e0aaf0624698 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e824947909f483c4d019003b461e3cda4477736f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eecd9f478ca1c8e842634eeb6380a124f805520155702e827492b55eef92c097 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..571fb23939cea2b767354d576b4bf883074b7ae2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7ce1958c3ab52e9a87051c44ffc2e2182383dacb1e478bd0aab95f16cc42c54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60871d2f485c67ba5adbd3d3327faa09839e2d0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb33d3b7421afa85bb3359c54251c1862c7c4fe6f2a96e5b9e05592dd58a64d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a4f054c9a9aef23ad44c3bf3993235d5063bfda --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9129f534d4ca9ea95711700c8a6e7a03d1b5e4c50d96172b60f0850bfe5cb9a8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17449899b240db0b23f882423d91feaf78800c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d085eb682a989851e5e3128499cb3bbb9d83ace4587afa0514170e22a7f9aade +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e877518530cfff0a48044f5834402fef2e8f9a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59c1580173d5ad0803baabbb2b2a735c1834c0d0cc7f1f1dbfd472633c19d8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1a3f82f9bd9fad8c07ab7bdb7626a8594d3c048 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3450ed133dde8e7486f879f0cdda2b1b11eea5ed77de74acf417d214d199ec4b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a2ac601319ae53d6a7565132a97a4995e2df200 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88a6521bb062d3faaf1764cd18eaa97ba31b266c5a17cadcc01ed9656ca36072 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f39bdd15f46704ffeeafca34b4ec3336db46ff55 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49abccc4fe51340e841d6fb16556f391528c59930f85ea94efd6871fdc856fdd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0342ac99ddb86bbb96cb0e1bc3fb27e5fc1f06ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea2a0351f79abc0a6ea46c3fea301a375b9aacef9678afbabe6a7ffd8ad44629 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..166c8b5af68e32b59d2066c1c24982bdeac726aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88bfeb316263b8c40dcc33df22e1c26fe720e9ec29b9c9ea84e0b3423ca1df22 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c710f6f4385e7cf01a3aa22c49accfaa7c21a453 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe195fccc0eb167a5317c3bee527b710ce6f271717351438715dac8d51de63ac +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fbd860a51141cc5f43792381036392006046ea5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8997a075fe149b72bb081682872fcdcc5a6a80584cf9942182711338cdf1478 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3251bf052ee03a28be1afc8805f89a78f26e82c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d219611c705a8a708a8ef808c04e3af9f062492632585bb35074a82663c7bab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af269d88a7d138c4ed89e9c0f3c867ebfb3f0c53 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee102aeeaa49f5957a56d10defe30ec682cc0af4bc6db65a50502de2463cd74d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd834f084fb4f2820e74fe7d693af56e279ae523 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:796c7128851d9ad3a20dcb7bab19cbae7b7a3af2134bc4eb9fd90be22088a34f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e88f7c61d998207297f9d75b30acb7c3dab3a0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98f0c9ef259a5aead7752628c2f54eef5474d8cdb12d4da89b42d35ef385d8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e2ffc26776dce343e652ffa092c0fd9fa1a5ac0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56a31649b50afd0a6b967f3ca8aa898e55adfa2862e517ac2994297bb9b186b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b56cdeae5979f50a3462f67259b2cab5cbc9aaae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa2a5de464887406cb0b43c215c944fa7bf076a5fce12eea12a3e0122161f6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..747ebe5221910001e53a759b0ce1cdb7baf19da4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc2c3a6cbd837e4e6318dc7dda0350fc07dec7b1de8fbc64f027fccf7a439ecb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d076ba9e4f3c5074afc471d77f67928a1bd83978 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5a099ff8bae0489fb60e96d2520ac20c04135c670aff07d4463673f545f2cc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62a5f1fc013ee487fded7b16fe30e47062f881da --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b88f6735e64744a840d92c0ed3d58b71c4a00f64d8fc7acb97f9e1d22ca7a46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c71253fef9a365d60d331ef3c1500540e452ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0e6212e297da5afa8a9492c08d862f2eb2b8d396275b51a19df995761fa2dd1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f2048449fda60ec15aa7939922d9fd9dc5a2b62 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2a5f660fa8659de5877b8b12b9776f811819c033a095ff46fcefe6c196ef3a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77cd723be1e98ca88dc4f64a11786350e24eecdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ace439e0fbf785b087d44e8a5e0c0c681c2622fd40a5abb0b39cb40908fb3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6a38496696ce49b555ab7f73bb13744d263c73 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcbc7d62415cb97d4e432c4f592bdabfcdfa275ecbfe4f625b0d5fa186188458 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf7909ac54a4c3bec4c86d278a3ba089747a9d2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b61ba466cb93fd8f1a9bbfad3ca86c420970126f0e90289726300005114d4f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cbe3848dc889c30a8b0b401e1504a9447e867eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9b378d1766674802f485af84f270c126f7386c8abdbf69179700fdfaedf4858 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff47890a4f8fa15c28ef62dca25aae73650069a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23478b27753a4a6ce4bb85fc9cc1ac5908881cf75e867144683e8a7576d86e2 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fde7948335668f0710ea46e7dfcbd2050de14f4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4d66d0b83f0c04e6575d6f7191cc2e4c8fc40b3e1ca20cba26e6f7f0e1eeb6e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea4f5aa1b14c552c08715ac63b889b04d08f808 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543071c1ef9ffb9766a148273ef1a4125a5ac7661f90b012bf784a0f2b34526d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d753ba75bd478b28dc56d830a04d5e28646dea9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32d0aa4ccc35b4177eafacf2c9508ac7d2a025af0cb885a54f61d278607ec457 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aef56ebf312592eb9072ee1058de85616f736d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77f1e7e4c11e7b50fe0862c69b46142d75932ac998f7c49cdebd942a844421e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba3c810ca06fa91ba7670f210decef2fff060af0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac5a238343af4219d6749a44fffbd576a830d61bc020066d8ee6075bff3fdaf9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..60a65846c32ef2810d581238e8dd34959d31451c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003b93ac242ed5b49e6c7ee635ea97ae07564c3f2496fb05fcdf4faf301953be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..814caf08ef41f7f21cc7ede1b3db282f613b1e7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cdcaf8d612ee8b4762936d228ce29f7667adc293b5fa54af428c78a9868df09 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dae219d4219984a9be05ed2938fdcc89f50fd1f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:744a9881cfa2c71ee1ad20d085c786f2059b1920166b3b569c46d85802d6f8cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1faa36bc2bc6be9acab800133149972ef01d177a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcf243e711411da424cdc7df9a0254b08e7a72073e42bd23e7d591a7489511d9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c73280475f2783edf23efe248c34e5160d9276 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b9a790da0ffb5c675c6250bd375018253f64f54072b7915e74ab1e39336022 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cba55b1726c81fadbb9cff0fdde8039a7637fd3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9deeb40695897f0d25e8f021f43d984c5c48b79f8ae1f99f7e88dc31201e1735 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..880d45138f1ff7a90873e49228811fe76a725946 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf8c38a72eaff660543129ee6e8ebcf38ca3533f9c27f57b776ba09f63ee0a7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45aac74d7880529bc73f87903fe25a7f581e98a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a527a0d660a71a59692a6a6727abb799cb5dcfd2a23d76f0607442e37812b445 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..77a9d7e36f0c883e158c217a7b64b77d1df57636 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c0be79af3abb743fed7c964613da38e3def1e5913b666418929b26f254cedd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64da727e933936d00721c0cfb9fd2ab02ed2cc02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8372fb83763bf4e8b9cd01683db7bdf5876469ea5ece3a34d3c82cb33c2936c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a307ee18134a741744240c9af53ccfc95283ce52 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f0383d89abc75a7d13ac10d0ba09fde752d607d7d9399274858747db4bc567a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d85b676f1fa14784c59097327844d847111dfd28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35a93992600db7bf67cfc32a712a12655334c42332c16351fbb646ad8c6c3f71 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..66620f3361763a7a3386f9037606e853878c5cf3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66e962e13b63ab23d9b9394a2e8002d13bab9a32fad37576ebb9d162703881ad +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02ccc4409f08b956639dd0441b3c372b5105e8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d65122156dc8afe12020a86de8f74eed58ae4fa077a1d5d45e919031f1ab11fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab197b9fe572cce5c9b8fe2442bc3eb7a27632d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b00adccdcb2e527fb9da3632e591e0b96d656712d9151c1e5cdcb97d397660bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9095f760cb87d67080d77e4e74a8fa2db6cd35f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e82df7bc6e4f66606d159e2ff40cf404b58f9548be6cd3848cf1455ed1283d1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..145835f4c33d5badfb42a12c16e45c55d1fe4b1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9bba5899a5c895d8e381b1241ecc2bb53391da3e8e4bd35642eb538550d4576 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..206c4a3c5da395d706d3dc086b07cf223a3ca438 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffd3de644346fdedfbfdf787d130c5fed12f3f3f76f8ab5a8fd24fd1c54727c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a24b9a0d9b450c0cea28a81154991dbfe03951e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f339265e6ded89391f69dfcc9c78e55733f020ecb193f8c79e6771ae0bfbcaa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5253b0aaf4f2a6b6c38b1a3ef39f97bf582d4345 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca03378fb29512a39aeea07b8429404cf2cf1058024393ef7a7f364c87e7534 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ef1c695d8381dd1d2a9d97d1eac4fbce10b3a61 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18952d582b8d8038344a37c51714e0c3d093847e4477e4ea613f829f1129c9fa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d760035317ad350d007fcd5fbff376624cba96ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b109b59eaf42212bf18c0475a524f8140d15237ad13915564e3a3cadea5f4470 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecda7efb44edc1c3b5fb7fbeb5fdafcaab9f821 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f641e5fb73c313800910c66f4cf2bd3cf6ea51e7d231de5245a0710afb3df9d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b915174cc8d5601cdd32a5ba6a5d13d665761d0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bfa2cbcbb08a2a835f2b4b01d55d957baab6ef9e5ad1e8304427f7332b1f400 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7801a1105784a8b783769459507605a9036d2b22 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:163ed3ae8307e1c304785b9f5cb8c36c85447b41e78c3c5dc404ced756c447a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e53243f38e2ae0a57f91c987f95033dc2139b4c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f241523ac1b474e678f9fbb8ec4d502ebc2b178fefd23c3305db3cc7149135 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..686e29abf5ca292ff7d32e36457f006e30400940 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b07b67f8940c3219f258c984e53610d8432366e3bd6c64bb4b45b07582b2c491 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde36db7ff2b46c78300b1b5c27d77f92f2dbb67 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d01615f83c620da6227e83f8b0ddb5a8fe3bd935f364ea640cba761a6010a8ae +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbf4e96a2c2bd2fb550787220595e6b6c26f57e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b975d293d5a3a5d9d4a501cd7587d9f13722da674d14d674358febe62d4eda7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12ff0445745663b69e49d85dff7b6bef5596f0aa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69db6a47178398fdf204ac12cefa950da558189af79e7ddbdc1e5bfa7650d8c0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6bfcf6ec9ed64799c69b211bc14e3c1465a9e70 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1ff371b285b653cfc929953faad26a7c3c1c61628f43c7d2c71bab89eb01c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bb15e87f96d9ea5d012ba16ab0245971a040c50 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffdad52956bc45b64653ee52c759ea78774209f70e181bb208f5649ef9295ab3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48618372d40495427f3170d07bbb33bb46bf58c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6384dee1abd307775a04ab3a29e8132765cd304ec2d290b47b6dce5fe74de0db +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3a1699db956fd4c827ca64cff64dfb6944eee8a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d663ad769e9e30fcc514a505e441187aab0fc3fd2a14b2baa316a72191c8667f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..646c6222a41ef7a2c85f07d3496fd90d83f61e39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:841bcf36e79150a26761bf16d0d4b9ab20c5b906364d97b389e1b0a97a3737d5 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee6713b5c437a5cde653504d2f59d63d887c8d1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555fc94bac9f570d17bcdf6bb4d44a01c39f92bf5cbaa13b20cd465ea951dfd7 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9da9e56c0243ee80977967bb8843eff0a8d607f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8091dadf6b31b16973ffda1566cfcd12671db5d1b7fdad6adc2575006e85cf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b64775857771cb19775b1de66f54b2d2c906e8f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f3488f3d1d7e216f0facefa4e06c72e9a7795dfad8466d83a0fe5de756e1f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa16134d5e92bafca76fb389ba400f18308be2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8708d9e1b5177f2507a9042f27d16ff9661e53e1356fc890bb3ba0b385016f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdf1118743686b0ca596f552f0ea3d772476135c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7070281a62d25182266f88467fbf9f7688e1c5cc91b75a965d896114ac237d15 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af4367a56f1f7864258670d7793ebc5d3d4b1050 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c821ba7c52fce500813e382ddbc9a33eb593eb02d351a937e51845e194631ee5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50821352e226b5a1116e1600a087444b0d3e9df8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86440a33d90b01c56c87e62884a02b0f9e87eb352caebf92d3d4a98aec2ce8d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cf5f7de6fc72985179334d8ad3d077724605122 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892613a0681a0b9e7973768b1fa730fa528751f5f5c018fae1106f05cb43ed52 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..860c56c1047a3a087aa3495959602aa81a125309 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fda8702a81af183e915c2972f662256c500a8da6bdfb86aaf79aab915cbe198 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2729dfb15b996585a76446c8f2e3a3cf956bde1e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eab42331bd760791f1525f4fddac83ae0db44eec001ea547498088da7a25cd97 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..451ca3f4ff66763221451ef10d6865d550b21977 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a48768200f494a706161e3dd51d07a6f14e9b887ef1f343a9db6a558bdfffff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca71220257b6984bc57c3a64ea3d458b45ccce18 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b595064e1bd642d893c3bd34ad62574421eabf494fd27142ebecd88bafc9af5a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..276cd9c88b292124fa263e1e27db9d5ef654f0e7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20611925614026726c38cccb4e0911006cce39df3197f4a986a18a5313e79d32 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b777f8e37246d6fcf496bb4fd3991645d43c25c0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77242ff8c9d334df71e96d769215f61ec8d907e2b60bbfa03ad2f7338fef3bef +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..056b3d9bdde9dabc47d6af1221681bc5719f3d88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d8e2f8155b0f03d1b4684eda18545e020792a97b03d88678f7722385f130425 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5712514253b05ff5cd61ea0b94b8893ecd7d6fa7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfaae4e041652268cffb40c7e889e0785f5c3c4530114bff368a012dc519270f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8ecf448d10a5c911d81e7c5b5b6decf0090f1e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa1b6e28a63c05b75783dcdbb691625c333c3255a3a4ddbb1f4521393dc904b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a59f9a55476e0b62548eb21c64c72fffcc5b40ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a926289e2f83e2634deb94069d7a17cfae1afd73767d947ec42256a652514f4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5b457dc3159f8fba4be3ac3a74166a28abb69e0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1067964eb6ab1a60bf79d465eb3260f210bb149e2621c3383841531305444d4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c882d3b46743ab47bf5a7cdfd15ae5a943d76016 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1305944c441d1dd572db9d447bf32911cc24ae17bf405c46d1fd7b17534136 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eae0592393cf4bbb9a797ff150b0227e2bad4677 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59fc8a31483225561b1f47706bbed58db66c7c51aa2508b3999fc8dd2d286245 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c8d8cdaa950fabca69dc3babdbe300c8f161207 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e48c18779fdeef2129166626d4e3882502b6bfb4888f075a41d7961ff0bcda5 +size 205955 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..382d48c303457745356e69a5c1d1bc49801deb83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e3b95e251aa2f0e130e012d8ca9d3640f74b5ada907e59c411ae9ffff0e02c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b22ff88a2dc07f5a4b3dba982e979a1624c7d8c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364967fd0469a827560e0cdee0daf3034406dddd17dda6bf30aaa7964a9a5e2f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..463ef3d5e08c7462d07781fc574524ab2338abe5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b40e43b50b60efd9f02d111b15aa0e783ade6b52190b814f0784b3af60ae1a0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..964dcf4814095665865fc4a6c4cad768d373f11c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f03d283cbeed695e92518ed921002ad00be9a0baf631849c3757922ff163ce5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c24436818500561440616be8c3bfe1067017519f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca40e264150ba217eb3edc335285d2b50e55ce5c5325c2da1c4a27884da1789a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5403726a2d041dc78b8726ee18e67c6c4b4d828f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f5874a72188eb68f18ff1b500576b5441f5a5ca8bacc5abcc8582193839cac7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..db9683eb52a9c73dd3ba34b9aeb285abb69930a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f2eebbc2757469d24b8cff180e23659e3daa573a17b1e420c654113e9019ebe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..341b76eb58a52553403fbfdd928e056f4ea827cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a73554509073da065a0266fe3069560f8239458d0ef3220d496080926591be49 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1088d88e4a5d067c0b5cb37973de6becc34deaa1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c5263c3f8c6758387c44790644e771f592f76ab715e178485a25d30c76e910 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65d46d58adb4ff444aba85fea59af91da658c77d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb28babec1883324a5fdb6063d69f7bd3f0dba1f748b24298aafe5dbde0dcc8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5524750ff6e1db3aa1df0f0d8cf137f71b3ee43 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f28ba50f72a65840aa59889c553e3a9f69f6b4c760c81b98684c4c5a87aa0c87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be9f2e0ca9f56a4ea170cb0a8fe64668b3cb4c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6b970ccc0cc1b9a4dc03840848aef9c29c249de6af0b039f97e97db3b20918 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a45b731062d7ad4b56944ee9ec19eb67fdc70e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dfbf8a86d0bd5047f7127ef8262565c5ecb4fa01dbb5d36b01852c5112316cb +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..442b23d938b056383ed4ecb131e407a0096c12db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f55635495f8f0c067d2162ab89b4f424e2aea6254850192aecf847501fe7770 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a1c89c4566bc3581d69e4ec6b9317f473860e12 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc329cc34d7e51a65acef09b169f529512ee5420673dc8cbb132a72e1121c08 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f204264869218784dcec6e780b26615c35e999bb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c074ef19b9cb2c75be3f18cb3b4a4ed1da86e1c746364f7ebf87dd4638670ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..478388bc29867e09a6e9188067789c29f137ef28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ed153aebed157ed729446780a355b5b87d4c6f85cd0cc86c2c35c1b6c979fd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a137c635b08d6dcc6a813d878d05efe897b2a2e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b0c2709a4450c5c8a193b68da87391dbe6b6762f3add3a9d39296fbf5b5e084 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e553d121de11ab6c13dfb1e885e2249f24e13526 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5422e77006212b1cfffd5189776c4a7477d5a9628925a0d83e87da72ef50632 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f690450d9b52237f3b7f3d49bd0e44bc39854a81 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff39933df1772af01ca3e5d3af262519c97f357265a5eb8c4bbf045faff7e1b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b6c41e15e61474eddc5938f4c7cfeaed3bbe5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4219e9241f08dd502652a35a0cf8d9cf2aefb9b3d8cb5f0becfa4fbfec22afa +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e2183eeafc07ccf8bf83f7b2199c9e8b4a49b7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:becb7024c60439bd22e61e691250499a0a4a54a8a4054b14951feaf9f85e220f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..722d5d01832b89cc3f38eb0a56cb6f25a10c2f23 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:589e00cbc03ea284b79c17b5bbc3471ddc97154b59cd88e3b4dffaea963fe4ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7520ab1f55edc8b48be23e595d1ac1cc5b53a7d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b6bda35fceafa7e0f356b6ea696278e0b2ab0cb797a36c8bda0b36e6c1c7c5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06162d604d879495eb7592373b5936f01b1722b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ac5446caa4acdbdb35162421519bf9b3c40fc0f76e9febb686019aa2e856ea +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aafe1b1756399047124ac072c03272d6c5896f2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5886768243be98afafacd47a291fa929fcda11a4e8f51d999b76dc83163e0af +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b376872ac323fe3c0cdf4bc64e8d1c630eb4fd6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d91cbea5971124e2ebe313827542327908d5a62c6ae501882ba06e2021830d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48cf4d6acab72efd7537f9699577dfa0edb68aa2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bead357ace814f7be809158049c4360d84350685c86215735446ec3ab7898f5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0741108974f5aa720978d75eaed08db3a9cc8464 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc4fd0a7c3558d4032b6c9982466495b3f52a15f75c4d2630cae9ac70de59dbe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..95d91c6d70271f9071012a8d2520d7ee2988be49 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b0cd5c2867657d02e36d05cd6bc2232c7df650694388680088a4aae062f7503 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b1461e60912edc5cbc3273619e6995624cf376e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce8100ba2dbe0a58e1935da9f8fc297dbaacfc9861b88d3d963bd03e441f6e3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..769e2559998dab37180eb02f830098c2cfc0780b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70a6121314802717a57425bdb8c0d9f78e69ff1ba1e9da83bc4c01c6f02df94c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9835c436a4db3ff7d7212c7bc70b820d13b57ce2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5783d350e94487ff438eb31e59f3ea1f1087ebeb3dea411dcfaa3613f2c2c7b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c50a34256996fbc5ef88b2d79ae2ac891aa0fba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46c56e9810ceceda6c692172fc94d34ddcb180ec46efaeeac4c0c57116559422 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e330c0cf6a42ac1541f33da0ad052ed437bba721 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abebed66edb77a7c3a334005fac28f48a815b2fa3634762a21cb859c6bdea83d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..249dbc984d1e34b7248fa39f92cacb400bcaa738 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:850efe9f4861f67f3a4d2db8105e889eed750ccc01204802e12268035a785b32 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03c88e30d07d759e278ca380d7746e72bf323cf7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2715b774f303c7aa37543d0fef3941ece870e6263fd8cc51f629cef813fa533 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc53f3d62297c2c298bbcfd17b34ac1a7b36894 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d41f353a1956588def8bc098a422c81a83e05cd0e6304ad23e92f81321e6929 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a2be1d27ac7d4df4cfdee8166e4eef468aeb610 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cdaa0c2787810e980aa74380cf745cc5d131666038e567203b5af5f3b2e072b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b403a34fe1f92f8127203bdb5178419da384c30c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e9897ae1cb9884e24ee5c72fb596df1443b522ec31b5d6474b788cd7428ba5d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28b7a0f340f9fa79be0c53bdf93b72b2c02f3d2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7cb6cef0de97a76ed1db3afee26d65d06bd2febcc36c1366617ca8ae32aa2f3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdb5914c525cee0c4939f2caf74c3ac524c53243 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7a9a3f981064ad96158dafca5f5afb3f1a248f75398e0da9769148d1dfd0abe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6505ac93ff1923d28482d6c3f49a9d13a0b0985 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6e7c6f11204f75567fdeb1affee3392f0010c329366d622e6789a785e28488 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3655ed6ecaddbbcfe60931f2f3313ad8774a7ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b41684cedd11e1c76074ea972632618b70a06829827c64ec0b7e4d697ade1303 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8b612d4d4282134d5643aac98184b499369d367 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e72eb9f594f55f4a9579d15fb4f49062bfab40dc84518b1e822f2b34dd398ed +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf5667ef4c78311f8837e56dee05c6d7f084b04 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc4b96f8e62a4d141011aacf518e4147f3057638a6bf2edbc5b9563bf1f8d4d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2e82629288ffa51f965bc2500f1e332c3dd9fa0 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ef8825be30a4751cc62ef3ea88d875152846768a14661b22f2cf33f48152ff +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0678b9fe7417266b6a7d196faecab06681f04c25 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e5e8fb2924adbab0773346cf43dcd22063b1ae6d397ddac25bfcbd42e20984 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0be272cef99548d0d9ffb6222193f0ed29331d02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:536d82e5199410a6591fd1d7cf7b735d07f0b0c7bb9461966743279d5734e3f0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bf70dfddd7d9eb2057b182b95d88bf24faef792 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0c733c2ac33cd38b2fb38c79af15335daacb3551722ec56fdbd6d0f881592e1 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0292f37f3e0dce9e66c55e0e901b50616aa5bcc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d9f4e60dd73d5ad8b6cb8da4e835ee96abb6f90148bc95614064b8f72fc615 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c4a379f870da5489fcd6df5bf4ae731853b21ea --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9f4266fb4b75ec84883b7a2ee1d54b2519039513560685001047ace7f3f2390 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4024472fd5d208415f442c5cc4ca298ca8ddf962 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2597b4df1c680f1932c2412c7253d9a7d98d6b603b65563285e0286f7080fc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a39bf2264a4b813737bf3cef0e076cea34d4f39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25bf2b9fde1752e70ef655d165ee9bdaf2c06ce00ed7a152d8caba96aaf25d6d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28da5d0ec2dcb0b935f3470c28a217ecf996ff7f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e8f61a07bb67297856b2724290505c2db582d56487b5a49474943ff9d76dfe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6182472340b20603f44785ed6028a5f7cf377a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5a7ea316afa6e5ada46d100332ba3508e48210da4b228c4bfe6693ab0e92b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e1d8643c326b984d0d4678f1b571be82998cbbc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17b835a563e2c04f842f98947166b328a6d117554b27ec6549e8ff4ae44280bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27483f6dd998fd241817d69e9c1d3e78dc18baa6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed29fd30f86157ac3ebffcb27579b7cbc7865d70c82a2e34d3fc0135aaa44339 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a9ee49a4bd0641cdfa8c4721bd2f75282c85b16 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e733131bac4f10ba969ddfd11f289ad1ddc082e9feb37d8a682347a1bfddee66 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d47b70d68d66bb53dc0de119015f5c7c44cfb63c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0100cb9b525b4f0db2a7b28f6feb09a4302565ee62f7fa44124b61f3f69461b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4613ac04e2bee7c9c358fdb6e019e252bffca3e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d59b37f92c73ccbcf7577dcdf4068f5c7ef17f9d54d6b4b13e10f0fffc63204b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e83466aa94069545efe17fa6b66e331e5eeae58 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cfc9dd8279b96536b24fa22dbe72648aaa9ecf4e5ed6fc8eb02b49b856fa4a4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..28454ab1ec8d7e693cc03ebc16de930d59584fe7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee6dbf26abcf798f9fc2935002567beaa905a935f6a23cdfda004cb93af54ef +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34115b9a40bc9f413551f361444f22c7a9acc210 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:155edf48a0819bd7ee50fa3b347ad75951f6de6d3b1529e3f0031436b12235cb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9ae315d309ba206df9ef62be4f121a87c4c3cca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afad9df9549b7e3fed67f940e639c982afda805b702049045a37319a7452c33c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa430c03c9844976c6b0b8c794e7cd929856d5c8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2116dadef903f2a6449803d4ab46dd40f1e1d13ae48f8d1ce626b02134052ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d62f7fea3f6158b87e3b9b7dd04e62f54b648ae --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414a76724fec170dd809b0f6bd6d9aa1109208b91f1b8ebda7c25e3bb0a8056f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bf605dd1cfbe8e0141dac6158b2632c0b6bf9c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdd6f379ef2fbbfab079e653aa86bdb3ef930c6d3de40f39fb9c7ebc5a452d4e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b99037fca3e50279da5a82f1924d669db83cb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf47a4e25dd0a15a05b0a634c658ba83545f4653bf09a2cc3ed03983767b5ac +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c92c1a55ed014b8961c0f6265514ac3646ee9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef047385452f705b613cb1b9bd6ef121936aa3139a6db1dd0a40dac3b12360d5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edf604e311c02c3c29602fdce2c6c59413335fdf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:151e32e9798c466a01a6bccee13eb6c7a5760ded60aa8a38706425f2f2942873 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1df547c78c6a9cf12c37f51cf224ac38f35a2e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2efe5c839362942ab4818b48eebdaee72aea2b799d43ca8c9870f93d998f642 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf3ffd3268e2aad0141647cad163cd8260f5a0dc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa06f167176c7628efe1df9cc6eccb0bc42dda9e5c4d96285cb55f49c63db88 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4ebf45e823f835981266cb04c4411cb43326571 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23308d41b958931cf4d32055a3cee0845626c445daa70ed228d39ca9d891c299 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c12febb306c9f1fc922e5dd437f9091f52906cf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3205872b0f295c3563e1767710edbcdb545ad3e37fa36ed7c9b2db7af9164e9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b47951b3e57a597c1f1e64ead34ac38cd94c83f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e446a789993634f334d4b75cd2279bc20baea1daa2213095c44bf78e78d23b81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..33c45d524b06b01f3f8277966eaa6200454b4e90 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110878b9efc3594edcda47145d2ce46b3ad1d10ecd0e7cc19df4e0ee9788a13b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4829caa9e93bf75b3d16b3e55e51a1e5483225e2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acdfdd15d96ab853fd62415d08f967e84d57ef305dc6fc01362f38377b55dd60 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..08c71212c14181cf4bbbcb0c50a69f72e3639a4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11f56d9c02c87d87fee8b8aca6c29b8128def9ab87691d38ff186f894b1818b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37367ee1a81f8b14bd058c83db510713fca45bba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0f9f727b91a29d5ed539839b71096c149dcbeced6dbb978821a30e8c46ad6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9251120745b930a8801616ccd3b2ab07ed52f844 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a53468ee0f31d561688e9d7868245fc26432608b5c7c0b322c9d37fc9490d87 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93910b37ea7fd2d52e9b537be69573b29607a39a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26d4a34eb99e2085b7196042869d2c0462205e46c6fbe415b71bbf0b4a8ae6c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..133a6e238d6994ba0831f4d5e265447dcc38aeaf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10244d0fc20d595c0462f7ab225a5bab6ffd3e3debbc3dd20baf4fbde60f5104 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bd7622fa2cda43741e0c5ab86e1614e065f4137 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4210286f7f75f2eb577df1ec090b44537312303670f6ae2ed1badc0dbb40e775 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..925df55e95722a0a440fc2ebf8d05df90ea54e10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e16a2347255c899c926aabd407c1d0e43dae395755f41e69f218ef4732d8a91 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceec9280a0e48edbf598e75e098a21de98928225 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:028a7d4f39b9b76161da82bfb95c666ef1df5fccd89a59f0662e6a67e287c70f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..11b28d3286ab8316bae102956d17a0b8c79b2a7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d1bc22468a404b79780b91cdb507e3d34bac72deb9ab7c077296ba8a633323 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c523ccf4b75bcfb643a84c97102b89cf7bb60d47 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31cd7918d296bd058eee9f7451e071fba4ba406c4d0bba46c9efe7fc5633708e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9049d07212358d44e56004ecfc305b29532af6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d71c4dfd3c2365436b1feed3e5f0fbc64f0432a32e45fb27b9f1151e1c6647 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..db4ad506c7d2bbcac7515982e7557afa6d6c91f5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:456e59161fbcd111edf21bd05846de55f5451a5717b7dfd3e1f9d5b400a1bfc4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf408fef45610c4d4d5cd0fee874c48b4a0767e9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc3fa09b2659833fb164ad62578bf872888f23db3488009076ebb90709774f04 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bf7f32d85f537018c3a25bea06f87e8481373d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d74d0fae9f7fff121b28bf0b957f5cf57a6d2641d329448e488c6bfe24095f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d390dd32ab921aee3d78d1cd959c14cac0b37471 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54ad0ceb184a48a3daf8a11a50606ced30d9df8d5eb2236f2108bb2cc2bb7cc5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c0ae42325496b91ebc0777ad92dac1132cb5bd2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac95b25f2621d337be064240df0435a2f78f0934c5f14a18e2eedd8eec924250 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e6643961a7b19ff90abed8701f7e88db0607c10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c47d889a4caabafe4c2790b8b946b8dacbbd84e0b7667dff4cabc44ed2da38 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5320d79a5f8e21052ba437bab56cf2861368a0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:856ebee77c074980b26c58545785c7ea0dff461fff7d2e1e29e587ad94612124 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13b1ebe2856be92c3e7aae037a556523ae101828 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:884bec557ac0cdf4e9cbf883939751f1a943c678aca05f2ccb478f83d0ded79c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19c96d15fe6444020b3d044edce1614161d9c86a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c0c31d3283e8d037a2e3363557b4bec38dd31f3b28c5276dcb680d474df283 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bc39d7f898612cb8c6ead4098617bd4903989b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77028362f2c53937ef1c4276982c8b57ba6149d03f74ef9a4eba7d979d12a0a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae47e795c92caf3d3f4417e688cc27532f09c037 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57540df7cd96bef7bfa811e8e985f87fc60518e57eec61a7a47a4a66745e3302 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9846d4444d764e7544d5b9f23d21d36ec2777ebc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dea7681132c12be37d333f0ad95048c807ee2b2b9bfbec714248b8cace78ca54 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5018fd7591aec3671c59a2b76180d21e89183650 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:392613bfe2c38f1070487300e075f2cf49ac8959e9c7786f48ef9e8e708c2457 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9bc1969d5014924dbebc3c2351ba092853a201b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9d2c5f0b2930621473724efc3768570810aa2caaba297307fe2646493344ce +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7f16738ec89094ef4f2266af75c9388497c904b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539bb6f444b78088d2518ee22f1ad8e02c722d162bc9042542be0ffc6a23147e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbbf85150cc43942e01d6924a78b157a57632459 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872a35448ece1419e698e69800978fea1ab6e4636563b03d78f3b294e8cc8ef2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8b4146d634656166420b02f3f873e6556d67633 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:741d757c883c07bf2436b65da3c516bc94e2b5c9bacd71b5bd270e8a1ed17783 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7c8ebf857fb608a7de88f5e1331365c2dd0cc7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f4795a7f7eb2613242820e6ac5821d431b1d907ebcdae2f12c6a0910060fe3c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad34fedb2f871987923b45e3ee8aeb1a965f494e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc3fcd6522c0203a2f7bb6e83772a7c8502984f68d01181ad1668822da56605 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9666de8dac6e4393b696908e148f936390412876 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ea99b5c62be6dac97d58febd0210cb5c9ad275589f5147b624a47613631b1d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..266dd3c7cf64a95c8c32a09a6afdb18bbebd2e31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46cb93fd01722b496b631a6a548aadcbabf40b4641473e3e1f9e15143823a93b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1fe69a2d955fbe45c71ce28dbca1627c359c4c2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd91dc82e878526ff55d0686dcb82631dd6b4877b10ab849794ad169e0b7e8ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc7ea03e148195b67ee0cf30a584900342f72d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c2fb16fe04470448009a274ece77647a959b64a8d7e85d816b023535893afad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f77004b093f0b35f44ecd7e33e1a735bfcae4bd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b26958c59d685dd620bdcb9647507e902f2a74fb500457ae427a9a1626e47a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dad00a00f262bca081d24fc2302d96be35a9fe3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3fc4e579dd21c674ac67a98a7fc7bc8dcbd2a6aaae4d54544ebc560625f2ccf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0d7fe90724cc72c395630caa353f661a5f440ee --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2f9041de3a5199d93fd72dce5ff54b47f3b83ecfe26ed54311b8ee518a460e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d487b6afd26799983ae6a1c6cf7e0a611db1ffd4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4692a0327dc88481c6790de8402630a917dc0bc2d941848d3c41146379225dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a41d1565550ddfe593f10846a6b108f55740d8ac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c9a01775ff8774dc1c23e52a8b53a83c180ae3daf82eb8d57b74b2e24a37451 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..909d593b43194add4a655edada7861898e0b1388 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d3b011a2997739262c9a0f70dc2077f36709299d9071869458ae84493581af +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c52503fa9a6aedea636f64eb980865b774acab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3b468ec17123310efa20738f5d4a9750ea17f427ac79d71fcf2cb5eacb72f77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..87fa6cbcf537c350b176fccfcf773c6cdd1cbee5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24de55f142f065e56b0ae85cd843383de8f307784e083a594e6bd3f924aa58f6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc3703105d6a8d3538005de2628f225485e8ee6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35717387d67f4a52ebc7d41efebf853f7dbda92a1a4df32e9afcad159aaeac4b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c198a09088a82947ad96e8c761ebc2126d152c54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f4a162d7678b0b3d23099e257cd5bf21004dcf3e38faa6c24305b9b315340c4 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7196017421b7a80fc471948e69e042f394b1f94b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca56e04346eed824b75d079708641eeda11269c81fe6bc4151633dd6b7504f7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1bd22ce08ae0be6199e863200cdc050c454b3b9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77e4fee04e282dfef653521dac2e4db7694c6d965eef353e3b8c58c66cea4968 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..372bd3a572019cae39ee2457ff2e3761b4678b96 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80cce1acbd2f44f0a0462b92ccb3b900948c9407d9c32d316d3c00e4f7cc7aab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..168f4aa6c9d3e0b65ff60244ac8404a8eaf700dd --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71526a34ca3fca8c35a3357a4fd9326fea95868025df1f1fd558f073a4508c56 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..34def261e8afd5c5eceac9d75b3bc126b597e42c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12cde6cde396fcbe0a12b90001b3ef4f3b3e329097f8cbeec6bc4c90459f4985 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..943ad05ce5b13b27379bcf9af4d59275520c4f46 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6005a95932ee3b199ba5f286f0b1025cebf1d1ab5db5cdf80fa59c0148f0773 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3d4fbc8941885e525b6d7134b8fc81fbeff04c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:074fa7e835ee67bb86b91d37efc62ace934138733954d2e8ec95db044af52f18 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a98eaad1c16ec53190c3e0f01491c329c43cf4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21a2b4b86499c9ebc85e40101e327a6e94cb35783391cc45717a0c5f4e5fbd19 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..04d6c1b77c3e112b5c8ca56e2082879c3d76e77e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd28137602d01feea8d248d95b45fbebdc37b2e2bba496cb8acef2dddcdd1b8a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6000b2d52c41aea1b89900962b3c32343121b578 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43907138cd93784426c1af6960680fdfc858a5e725bc1086fda98e70def96bf1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6254c8352ef5551ac8bf7e31706604e1dcac72 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34d899fd1935713268eb72644e7e33d17dd81215e8372cf59ad36884a7272b8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3522710271320bf1634f2d0a20078c743724f9ec --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:253380cff1eff57da97754ba8de69e6c4c28b39c157ea840654cdf5923784bdf +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eedbb6686333c5dcb4b9e916ee86d028b19079b3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fd3eafb6221d9b8fcc0c0f132dda743983ce268dbc4791b0118d6b8a7c3bd7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b66a1e500aa86505604f69d71560df79ad22e51 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:114b0f4b58cd34099dcddf1f1e496e6f61c256f35410666ccad00fee53222f8c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..16d1fbb8572e19ba5d280ecf8b37aaf432665709 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f8fe0c81da34926f5f824a69c1048e830c8e1f42bcc47dc6085e65f7ad1bca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b52315cd5445fbd472b941877ff5adcfddc65d9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91d99ef5fee3cc4e275e39c0031e19f7894142002b68f57eed1551aed259c456 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85e255d639de1941a5b58d9955c74b76dcdda2a1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda0f196463dbb4320fec604c9e92a31550832f118e785ec596333ef978f0e98 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc2c445e9e4745fca3ae793dbd28fd4dd8c45114 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7e239d2008d63595ad7914f615fe4ff399d3efd15ae5d64df8f5f4e6504f03 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0cd52ed991af2095edeec920bb9aad2d9a87478 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f8b33d01e73054da23e105805c97d092b5870ae2bbbeee69333178e3a37657 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..caddb31f088397405405c0550e5c253e1d1705ef --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756146c04869095d8ace2f63637c6bfb663633825319ff53d26b656c05a8a9bc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddf4c3d04798ca2462db72dbc25698dc114fc737 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855bc06e11e90d1e86804b780d559538cf6796e2eef1868d7606170889cc6af7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecf23d3996e0758591eaee6111318ccedbb646d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0911376658f6565b48232ce68c8e092552b50551f9e0080aba0004507294026 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..96cd543d911efab1598ed68aff8ed4efc8ab9111 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a8734e6353548a2d8bb48c2eb4ab1835054aad6e8019e2ee2ca03e806c9f71 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bbaf7407124c85dde82e87758697cbe7b39a144 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afb7806865b748e2f598710b3ce7eac8778ae74a227d985e4ca29233e86ccb2b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c1f4762a0cee45c959936dcde5b0e932c824dfa --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37b9b19913bcb1b9448cb621a7d3c0b4192524032570869e2d9e292a40e08a6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c0e28a8674fce76e9ed28199059607aa6de2a8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c32c953f6754ea7e678e3235c52d3d01f9093ad0e587c904059a27191ce69d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d85f5c48b668a113eda6d45e96d189424fed27b5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e37628bbaff3e46cf65c8b10316508989e2a1a77bd87b66798d848893ae1d92 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6a7fc8efdc3cb9aef3df3432b946acc247385b7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec71995b811679a0ef99caac5ecc3618e1bc3a7fb817501fc9a1c06d327a0e0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..036b65c7c02340b72da618a744560b385d5d0995 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bdcbfc78bb2098053af788efe7b77ca4342e0328b19fd8c35957e28c1de737a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd01bc241510668ee8a7372edbf7c4b22a8d6eb2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a94128ac90d2ef53b83da49b72e33355966806f4cbeab3d49a663e2018ad2b0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f718d3dcebd359be81bec83dc655bfd624ac5c54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b3dd2a0ab968b0ce2b7118cbf63bc69866803053e584be22da9726c0dc0f28 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e559c3b4e461b7a3672a841bfdbacc969adecde --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f814aef3d19ac51b9f592d8c4c14e8b3cad26eea2da764b10b4adde73d6b4f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e14fcd9d306e592b107113ed759670db92f10c63 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ddcc88288d9007f97a57662ebed174e4cc413c4c8e9cf2cce531468e816c7bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6ac4d506e099632cbb5af0532d92c83a7e2b13 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a68de3899f67bf4905a15961cf24bead7914c19688687b0ce2553efa00255e5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..907a0b8c22e030c85436b778f92a0c4579c332c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1f6c1b4ff491bdf735056ae66a769d6f91e6c065a7ca2ec9946bce96000d223 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6020e0ad003cd09fb7fb261d1a94b6c47f408d3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94bc4d4968dde21b8932d2f3e72a7ac0505e5b926f9b06fa796679820960f19b +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..127fae54ee8f2d553d25f527d5b23d7a4f1dde2a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:417cc7239de3b6d8232f012cb445ef0ca1f825a4faefb721e60643e9f307d695 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ecefefea66cd66b9e60a7a269656f1f8a291d9f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98201c6c111b5d718fe301b7f7828a40f99d43624bdb2589f2e0b117789993c2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb823c3e0cd296d1d721df248c60f28c9846b5c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb622410ba834a3b0512c6f420361067cc4213c8b8d8fb6ae2364995f845182d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1fc1f446553d305b447b580a0aaef00baf3c67e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29464d07fc00413605dae7b86cf99f30e00cfbe63a34bfba565376ac3c762b23 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..26cad494f67f4240c8afe4e739bd368211010014 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d6b104196b4e91b25603389a530c3571180ba93ad38e6c5b4dff7e7147562e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cecf4904a02f62fde334351a9ec2fe12df878dad --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:541b7026c5bac3f882686c6608be82c8a854394098fbc8905d532dab3383e553 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc31bbd68cfe57e7fb0e33c358714b62adb9fb3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1c144eb77c947a5a0ec8404056c32138ad7bd2cff5e89fa78ebd94ed844b77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ccaa8977c76945c9ec32b3a49d4a8c37fca702e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b97d87e870f416f89c21d066c753bc0b41c33dddcbd58ac7a766bded11c17c9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..381de868bcffd49f94453783188efac618483818 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a06832598e98920a21246facce1515d2ba7169e399ede2bd23b818abb0acd1fe +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d4537bbad3343e2da52235770cfc37261a6542c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d266d729b30f98801e6432c6adf3cb8daa4b4b38f4d0b0eea80eb841bd3fa2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee1103924eb551ef551e0a5dfea53d81a6443724 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a264fb53ea4083b4720dec34dd18d6ccc8d1a2cd0708dc3cb14eaa2e84205c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3ff04dfe9af24294fd15a966660a621b26b5824 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b077acd26e97102d357d1f1bdfb4800f918be43834fc83e6228237ceda33e5d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..52568c4d08c3f06e9184389ed12cdc7bb2d61b2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94e6dcf44503a71a1642b3f451ce1dc0a3de1b9802e82fe858f957259f66cd55 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead1d8dd7728ab20ac3c6cb05aff36374ddd7d9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eeb1a60b9a9820b0b0c4a997afc266f2fd3c8f1440ccb03d601a853228ebd1c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f70f666394084b5cef7366a009562af2addbfd9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fb17e0bd35b5cd24d9cf6cf875129708db9c6461120cf9d96c281698aa2782 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b15df5fd4721c24f470550eaa3d88ca72af6634e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:309e3afb05473ec094698592cbaf8c5d136471c4bd692852750470d279204029 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1767786b5566f74ad4a8236cf8af349fa664d0df --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:067ee4741acc69e1aba7d7596512aa6ea4768161458e9fa8d153f997e65bc984 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33012ba10f93a3ce70a691d6bf031cc2ad5f3c0b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56adab5666e11717edd2152e97573013a72f04a38e836528b1bb251ea3a67d35 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..601ada92057f5799f159c03d9341e5a9d9d6ffed --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:013d2eb976b5a8c5bb5c4d3c5327453e94da76b1d44212e447fe0dd0606e004f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6badcb8ed1816bafc54586b0cd0bae7e6089d790 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc942d9e320d497e274c9cd818fed074190d582ce01a1164b702e15d0e0a0a66 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..82a777ce7f397c1a050785b12abc8a8a9a8570c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6248b2e2c3527589257c8ab580a0439f861810fca6d10964f60e5d195af6de1e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03877308bc0a121c20e0434683bf411817f4565d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ccc6ac165787b8740198f48b16e003f5ac025626c4d28bd75c7913106a4aaf4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..841f7981de330adccfb897456e3651a2638a8fd8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d10e3ab9c7913e84b1d769f8ca0d35fb0804663ae536c5af70f9568c9d8cdd6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b32156409c2dfc51de084108066e30abc2943289 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb1ce5e4d33f3f4de7b6eb40d9778769468b08ed24bdbcf027cb178c0fe1e013 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa2e9055a747731fd33acae0acc26b5d6534fe3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928820632459ab8a4a5be880aa2bc2fc5f853768b6981507b8f44f1b5bfe2afc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8355aec12d0f03c159c6942fc4789bbbb14ab9db --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59447d75102872dda93d5a9c7a35dd4ed25f59fdcc456a1d9151b8f12481011a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c4e024c038073deecc5f103c2e23fb8f261a99 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37dc8c880f0618d4c45800c593747d4c64288bafc8199522ff32a981f31343d8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0db75f3e28aee2ef410dc1f320df32ecf694047 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98fe8287cd915540b00d37a37924c94038c58f42c6cfd49acab576d8331cd032 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbff8f5a8988a5d684c94e923409cdf86c4884f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:765905ab28b1b94ee1aa4daf2c6fcefaf4143ee179a99ce6904a30789d93bf94 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20946ed1b904663ddf53742a8990402cb3e084d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d8b589dd730920f6d28d2e3e5ef92f5cd5d20b99295ccf98b4799928c1d3f78 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0b122cc4ea97d025ea74fb902a8c22883dcab10 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b5d73fc499aaedf142bebbcf5eb7b3e0617d6a66ccf2a275ed15af96630b866 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..925af28d5708a13e1adfb8c5d39dfddf20fa5ea1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f570847a8221d874585906efe5cbc1c50be64b032409a0aa8f744dee84509f30 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c8d4491f734835ded316243e18c807c199ffac --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b0fa34c0e9b8d7e7ed80f6455225b9b1cb003c9a2105734e47709c98b9e84f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1e8b5575554ca7b67d95f3706ceef78dab729f9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9bcd09e218cd95b2778a91ebc61e0f0ded8a8df0be72fc333fa0c85354d5391 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..239f87f7303d40b5b78a85dc5ddd9f29378cba3e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5e6795f50d72f3cfdd4ce9234aac11b7590b24736aa18eb986af2aa6087f3d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..13d3aee664f44d75c9745acca745b285b9019367 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e794db8a96aec1665fc5d0eb62fa7190a9d41f245f84fca42bc9d8e39fd25573 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8af45cd36ecbe4bfceaeb2136c16fa216b05f2c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a1ccfc7cbcc49d53abf9b1af61f43822da2253d010b914e7cad016a5faf7e98 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..adb313205e3d9e538682ec052b1b056724936a6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7bc845c9299267030f33b9b3002cbfe3ab84c0efea50f5a74a2cb950ef8d308 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..53b1e45a7e42fa72b13eda17f4a2968c8c35e3e4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cfdd6fc911feb0723e0da30a1ec48f985cfedd90921fc505bc9b65184f21943 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..671ea4049b89353771995248a5834ece016d3b7a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b986f21cb01d02e7a1c7eff1f2b03a7160dbd9f7ab388a98f6ae6bbbfb04c46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e376e0bb6de34b3f317ba38d18569a5b3ab600 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24618a76374c1ed0681fc0542c60345c6c5d3ee1395177c3d402bed3b96dc69b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eab1f5d453335336203ec74803fa030a4928023 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe13ffa7581b2dd680c81f13c0452b2ecf91a5731f784eac9f9bf55cdc0662a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e63072a9530af5f22a0c957e5d3959e9871bc41 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab48f0e68cb60b8edccb22eeb3d7119ac78891d1d481ac9135b58d41d60d626d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10bbb41f6af7bc58b754037c20658401621f846 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6f5c0c41c4d729231fc1a97bb08d7eb74f58c9d38abc4bce977fefc1e97cb0e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..576c2eab19c2fafc58b7f8ca106930cbdebf1464 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc5f3b716e15b791ff602f8ca22f610fd7f47af758bd90edf8f3d3b69360d316 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3ae36df8326592b045ac48bb5a7c05111910b0d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca784e1a13d3a8b4e79bb911e033bd153a59091648fe736c0c5ee0f0bbccb09 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e92541abf403c4a08d62cb3bc9bc022613187a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b443f5cbd73148b4aa02ecfdad7c108f5066c84a6f21a092a73be8f13ee65e9 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5244b660b3c3a5d7c75ee7a896a96d2c1538f525 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d94c4f47e36cef0e9273bee0b690dfc7519d7446659f24a74e22c9f44e1503 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..202c04b675599fa7f52f771e1a3c934fb99dc278 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7b2e1170d2ac90b9ebe31c651fd5404946dc501cc56dece70a1f3ce4942a83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..84b7c7e87c7e220ec22feeedded984ef8367fa4d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaa3e26086988bcbc3377a54405e4f4994bdde5e17e692d74b3ed1f9b968b225 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7431f25f51c457e2318725682e88a13c4f30bbb9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c78992f60092b91c9be20924c4da267d6bc172425b69b53b7d5146672f74138 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae1c50aa92e01ffbe1d71b55bdf0df84d12b3890 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:104c7debadd3ee363aa41ac402c1ca49286dca78e8ba74501152cf3c4fb3f962 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46f999f53285390ab7da008e477cac6d398d8ec7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5034288f0009e61561f0f911bcee80edc4539c0dcbf9e2110ba3c91367b4af0c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c32fac80235c483966c076a878f2e2afbde58eb8 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e861f06f6c2173ace2cf9ab5c10d2f18cc6d920a4e1e05a238359ee5dd5acf7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba70865f8f6c3ae029efd6926acd7f95ad091b7c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8df68057d849660a632bcd5c883640acd6d090a576e35fe1a45c58f0c2086a70 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7564ba814d45e10d8c8fc29a1221e189c02cc42c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a40add72aa4fb302887beab319555655ec72b1d7ce1649406bc3430dc5ca74c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7907463a073e08c1677ffe037804824a9d94b970 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e3ef83d89e5bfb62ebb6d30bc825b3861095f4e3b7fed1f0a39a5a37b56fb46 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a3842d1b63fec8ffcbdb3cb0d058e04244d41d6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa94ffaf41a29ca8f777b932e599c2335e74742df2c56e8302bee844ca79de2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aac8475fa9fdd32ae19b1b01c3826c337952623e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:419424a3df919488aaca8f25e638698d5733e75a696b53ab5ba38bd0881b9004 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be0776dcaaf5d1ef780700eb825593f697d87c09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d9443918fbc312699271bdeaebfa8ed6583a20aa1fddf1aa54cab010d503f2f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2772bcae89517dfc9f2ef5ef2189e8cc11de9033 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5940b6f7c20d452ff5ef9e07cdb087f23caa4f134a0910c819c386c66a3fb8ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..040a91e7269f621713064cbc0c1595193f43c06d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb4bf6e33d8b420e678e12d50164a030863f389e7df9c653fdd68bed9e07cc6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..026a5fb0de25870ad401f852665e1550bf0a41be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eafdfa1dc034ec1bb1f6792508fbd8d05a104777ca724968a02554264061ece6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5665c66afdaf4a822deb5022eb1fa22505e37ef2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8136bec59a26534f2dcf409e8de6f64dc454271709b3005b4db5487f6c681bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e425adab5fdc5d7dc3f741dca3f3819d546b56a7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d46648826cd222bea4f27b6ce76e1391c1e163c8ce05d29c47ec1d1ee39cba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..48cb11495f4d5d5da70612d39e255bba08f5e750 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a766b0ec7f8002d0c1f07bda860176620714503ba90371a1833f28eade833e9b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d6b53e1661cc7150cef3499a8a5e22a8c6ff76e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b6bc7b0f63317bce7e550eefc223c84e1eb707e15bca10b19c9c978653dfb76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d935bf9e7b6df1f9136514d0d99cea5ed465f94e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efff9fc5e8c79f91c27e8ba5ab76b964bf3a1bd56b564425f7e03490ea699e77 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..004ee4286b6fcd0fa33a49602204c669b6573b83 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c05dcb1dcbbcd95268b5191ef369993bc35d3a761f34f7882d2d5e27725090d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..04c13507b9d85b44b9a74aea9456d155f866138a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15b2a6447cfc412aa1c94ae5138a7a89d2f576e65baa1d9fbd829b3d6eda1835 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bafd80f9a2db3b3e622a620c9ca28d6eae7aad4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9744c01a674e80c378df4ea396a713cb419e22735bceda5e511cb61853323efa +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f047134d7d00907ab9801058c6d90607e259522 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ab058f480b6b8d504ec9faeffeb601a52967734f7dc9723aeefc1f24b0735c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f5eb996f056031ca062aebba028dbbf38c1864 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e527438c58904dbbaa72a6e1f6eb1f35b64d754fda79f04ae653c4b5a1a435c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6616ecf48c90a42fe61babfbc815383cd62e32b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6145cd86f6b51fb6116eb904636a2e69cac8dbee0bfb2d03f5ce9597c7a821 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..abf939caa7064e4dd4e5b743a274d1b2631d7d3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e95d191ca75971a080366c1e5893b3187baf1ba465dab5a7de7f01316b127089 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9c977c452641c382f73aad44e7b450e323e48bf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee439a1163c35950f138812276cf559100d7f6596e0d0a87fd7066315a472174 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c59ce387f4621d981fe7ec9a0784c19f30fc6abe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9bb44f6972839616b56dc211f32aaec773495518c633e5543f47ffd50ae880d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..20126f57e2a47f8549894265b062d62b355090d4 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2740bad0f1bf217f2ec591aa61df4d02343c640f685345ba4ec887a88e20b1ca +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a67e8d3ef305738c8f8dc3d62332673d791bf1e5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5362daeccf6a7e3ada154921553cf64938f2ffaf18d769bb8f5564eb578ae119 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9e95b2caafdaf4b756f1ba858a691895c7d405 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:242aa334094fe125fe8c35bb42564ba824b4eb27bee2067584291958ff2a34ab +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be6f4ab9145d9b08b2f1b488bcbec5b487d612d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c71a8fea7148aedcf81f241df27c99bd9e2f6fd114d52269e7f19083940a786a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d321541279cfb6d2c3e0c2ae7d8068c6b19d445d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7f37e169c0729b161511f2480df438cc81b363b1b2cef235ebf66d8c8006dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb5c39f1cb07dc5757f11efb74909fdbbc9cc42 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b75bbb875bc69c95153edfb69b4d3efa2117bdc360b4cc58f54a2e3760944e +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..586f149f47468d3c541deb10404810e311e910b6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb821f17fd91dd650f23bcf61519dacd890974efea60a97bc0f622002fad7c0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b43904fb8a1da091d339b76053e5328aafd42fce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9eebaa23e2f67a8eec6ca891323bbe1d5f371572613868a76606954672c5381 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe638515dbc3a098b90f77596894eb73d95dd0ff --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8ac204aeca08da038e451110ef04ce214738eafbb5002dc51eb3b8f2176335b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..88765a0ad494e28f2d7341593ee12ff5256ea077 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0564a04a190e8bcd4272623350778e062602c3287d19c4812d76a9b4c8a8d646 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..018b3153006c241e679e918009e8aeaef7c317eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:159b10a494e106220ed75e82569b6c28e9ab12fcda86af390fd85fd90fb1d7f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3bb9063e4aec2d423810cfe89f48f5a1b60e98d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0c4ed9629d4b9ef35889d24ade38e09e4321ec77eb2446ef93cd718634e1c8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e5702c7f82f54186de2b682bd889832d27fb2b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45b9ad25c045e5972aafad7561fc262433ce9226709956ac30d67edb6fff33a4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6008c66823c6657ce994ef5dafe94323c7db8a39 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9b26fc4769bb79e98af1b61e5593a81bbf55941212655bc599e78a2a326eb81 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3451831d08322d0ab039b9de181d9d2fcca7c7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c175919572ca865d42f097a85394d31d3d65cc27e52793fedef98760280788c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8957c95b5d4d466de74fff98fde299665388635 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab7b34b317640c49fef86f1ea56777581756a16dcb0804b3b7eeb92a152c14ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae11e0dfd95504339f5a0969e00fb8dcafd52aa3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbd703d2302682f9a6f65fd3554f66a7aa89aca22b57ded3ca4da0d9adfad8c6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a73a28956a285cb1b003101021e2c32c919c901b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b9fb54eefba3d012796e9c5ead6f25afa4773d6e520a77c44e29e419b309c8 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e39637e7d6c24d361baa36b595115324508d648 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98d4813662279dfe0576d6f449b9436fe3df7598f69e3019c0f2346f5703b60 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d400e302aaecde7cfd78bca01714c95782f7368 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c44c11fcbc1b31e241de6d17573267445868679e0dab656aa48f8526e325a62d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..726e1c79e2c28800882fec1606ea57bc925c4c8e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cd520f14766078afdab58439209898a528b5d6b6bca39786a32795c0e2ae519 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b137fd29f74dd3a4002d24bb2f75824a8c10187 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebca254a1c6838fadc469b11907a71cad4202d1fa0f246b3df00d2f6311a68a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..029202ecfdbfe5ee9f5772e90396669c8c9ba0a3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afb690995b2c8a0620675c1bb35a1ea6ea4888073366b2d92d01be6c6a3e85f0 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f53392a6dcd59dd9cc10ef45c97d663d596ad079 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:411c79c6872e41cfb1575937071d1c32576423ca3fef57b3f764b21cad9ed2a8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..539f8abb2c9db73d40051bd3ea4061b67365b383 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2edd4507ec43bebff168f1e66da4694cfc1a3bc1a90664d4b95f6e2c5d976eb8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c5294160d192064d460a4f6a67a4a5b3ab68b71 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a064e0cca6b1c9c08833ec3c62087051a8fbf006d44aad6f3d455308b46c433 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bd068bcf1f20b834f87c658ebd3484ef22c89a9 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:211a8f19dc0a79d36c50efb2884cc7b19ceedda1691fe8dedf6f10430f6f172e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bdb167c360f9bebcc1e2d16a23094141d9d9c3a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c0a3fc769de34f0bea16de70462c4bc118690658f037373b84e978172e7371 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..193c02574247cff6ec416692dd5090faa3269a02 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baee2908e2aa35fade1fa52458d2bac634f7943b58be869c622dd861f9ead8cd +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e1209ae4526cb68ad93fc7dfa9deff732c1b5bc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5a77bf2f031dfe9cd293104feee95b8f43a77f54c6eae326ae1b5f55a25ff0 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f749b0fb1cd02d22d0c18f6b27491ead80bfac22 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f574c128032a2e5fd6e8d7501a5169f7f790bd5d6222a7fe58a07f1205fd950 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a4b5b3aafd77630e62557d909f171e59bb5ac74 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dee221af8bccbc9783dada4292ff0e40ac5b789291eb3cb61d8c36ca6e179ed8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07287b6f223f1172fd3d5236c2f775945df32313 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54b32f310bf9d3ed0236b8891966959df5d3394499f5727b4b9ed224f4a773dc +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2a908bee401397f27d7e688a02e228bb851ec57 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8dfdc3b57f5f711bf9160ca2323d76ff31b3a02ea92d20434aa0dfeb8c1a15 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9057eb70b6303c8d96db1df0771ecdad34f98043 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92c2217188e2b7ec5a0c3dc30888bfc109b7e4e7afae94d89164c208c6e39ae +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be705566c692b8140d7b8ac02ab171f716b3bbf5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f846235735193ef53ef64334ba66291e471b1a531049db393dd309e34bc2f8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36a6cfba177a97c1f6c6a63829e310818afa9955 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896dbe002b32a3133a561f7c4da28a636040aa33a54574f6fcb63e48e5554c6a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e5bba6dd8a6e9cde2211b6f8bab8b7ca6a8a926 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33623ed72fe957e5c0d7ff2245d3fd565d8a019414f67740e8de5f5f41f57740 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3196f702cf24c0a782b9389b8c61f292c1a0677a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326af07309518dbffca1f1341ca34c473c23b3bebe8906a886e48637b4031fe8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb9b1179c6bedbc8359325cc94735395f7fe1cb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43f9b2cb26e306899958e7e0d2e274f3993a571c5013b5efe5d546a689be56ba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c70ce6e88392ace0e0d7fe8b9d4c4a1b9af7da3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690aebfa4a0bd6cbcc2f97cad755e753296602271de5603314c6a9e30d80826f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8fb3b545d0a1cbadc74c2f970d56ce388df5e5f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a18a7d6bb858e1f45d0042fb53b140656b75604836e77c143f4d3957d719468 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edbb7a5c06799cc58d5f8f39f28298e614d9466a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ed1ae62df89219e07dd3d7d9d5c586274c92e96aa88f5d72cc641728e9396c +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4dd6a87ecafb6ba1ead56b8703e9c0a613df31e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54069558f1896c1a6918f286aee3855a0f9590ee0507b9dd883aa12b0325f378 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..441d7946965bfceda39964c2a5e4b09c3803949b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c72e762a8371902f88cf0e930218b5dc9919cc4fdb55d9e2d8fc2483e1640b5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..393fb6711feaefb32dd707edc5e2544752b8b92a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a92236408d7af235dcd690e70a705cb944b265b93585d3082ddd73ae2aee14a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22be72e5ce6241ad699c3af93df2a561991e74c6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:940244f19ca9ea549cef44557dbdaa5bf50c06eced5de669da0e4aeda8b850bb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..998b0e2e61072dd9959d0836785e02628acf6532 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed5f25e2d7034e7920e13b4adebe848e48dcc40f279e06872a7705684f32dcf2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be3b8a6ca7b6833682f0e7aa69d65b71e287b5ca --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e623c6c113e59d5c287f74f9bed182fbb8ae315bbc0802dd9aad675018e09014 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca84ebcc44b7ef820fe59f59185e2869ce3c6b3b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144408bcc289893fa48d448920068e65903d990bc05c7806fe0218c7eb36ef7a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca494581aeccf2facfa3b03d148e8eedd727cb93 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb822b6fcede49624cd712aae13a7e02540de073901a65fd5b2bda91d7211dba +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2fc9bec5f35d1a37bd5a95d45bddf6fe482dd54 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa751b0b5e67db112bf4bb84ae1387aac013dda7d3de142337b9df3dc5e90c3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c39b1b64404079d700c51c035bc907caf877280 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098d8ef7584bf049ed019ef4f93adc9a8ab35ffcda774e2d72879e810c6d5e80 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d646974b129ee77f0331ef392e9f226a7b7c0e6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d031609431f583a25aec8fd0467aef6f2d0c34dc6b42c26155666d7f43f342d +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c95ac65d25dfe71633702caa885374485e4fb680 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:522927ea8d36709fbd1a0f1317ca1955ef4f64827c507563de81d54e10bbbfde +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ad716212ec909eb1335fa438f942f54193e017 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a57a1dc9cb7f6d3c3e0aa67f05f467912cc3f06040ea442f868ad4d21b558e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40d3c6a78499812a8dddfdf15acf127cf079eff6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c952cb943f21cdb3b4ba367ab7c96d0545933ad4666bf09fe580cb67da1828 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edeeadcae19c152c330dc7a77be89cc793280fd1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:788f00dc98ae5e1b96f128ef1f0d0df3d528892faa8d53876bc7c611fb08f5a1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf454c76df5e9df7bee3110d34bf03b91d1b874b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23634fc3aed8e17d720d278730d660876e538f6d81a6d08db88a918c0e264654 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e6d0376668adad754406a1718f0d5ef153fa3eb --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e5fd5bf3652a696796e2667d6a4845c9dfc424ba92d2c30f15d91a58797902 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad376b058584c3356864c09f3ef58df3df9e3f08 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08f887549bea36d9a646303df8ddee39c092791b5f0e280aa2d979e736d4d28f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1ca544293711b5a909efd7d31050c81bde125e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798632ca243f082e62e261e733fdbf8a4e315bdec14d5d8e1d303947b19e522c +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..edc032c20ca37c2c09a252e02049ccbd09b68397 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02163e682026e3b316b30c64f6c5e6d8e0f79ef508dd6f603cb0b5e1c6c31196 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5c25628232702f75e8da8152798db0dd1fe055e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d187fc9e81a9de68b75cb076e3a75749bbc9aa63f24d5a2a8e1e88603090c396 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..83c331b328d45428c072bad3700281928928bb1a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778289ef1813bc3c8e9191aa79fe859d27bf83cffd448b093c61258ac267c6b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..662ef2ba7d7797e3595d40480669f18f490562b2 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b69f2e59aa3c6a2fb2d0357279b4f1f78637937ed07f82fa20090869e0b98dad +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..62250c6e1e2bdbfe321ca6dc383aa931cb610c3f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:593c7742473912a543f5024c632889991132a502bc70411bf4cc3ac8be277775 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ded631edc32aa8ea1b22f3c099a88ed98e6b7283 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97859f2cf493797e95d66678a19ab9e852e347983a8dd0af04d244a280279d76 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..193b06d14d1c31199c74fddea54d50daf8341e98 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d28d7a7fa44897a769a98f2e71c0205101dcb60a4c33bc74070db30afde609 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d612f29e3ff5caab23c98a4dd6cba889115b99ab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0306ad136e8422da0c90f38a14115cba915f90fb9f919c37235974b12b179307 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71dc23fef7173ee05947d561b844edcd46507a6b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a328f08fac7baef4f707237e2765950b6686770bdc1259fcd7d382ba580c18be +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e07f00c96031af7796471460ef54295fd96a28 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc34de2be11b1ec706f04502318244835e2c64d68233e7cc0e16f1492324615 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c5424e52f9e8817840e13e2eca1a9c1312317be --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a56f81bc95c96a7f210ade5b0a516ace1f0d6d4ee9a314a0af0489df366c519 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8e8b8b874de613bd434d688e560e1025d05920e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee643731c76b239ffa384589f826ec236ae53ed6b883211735b81de457534d88 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da6101da5ef440eee3a3561529927b2cde4ca81 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f73f7841e5d685934d31ac836b36b8d1c21f1f0aacf721963ceb11a0f5b4dc93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c594f69d78e1bebffaad3a5efe84980503c89b7b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56d68ffcb649675aec76f24bf15a018bea346bb570681abf88c36b664aaa9b9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e578d0c37aea28f5addeee907ffc29109a863116 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe6cf658a0382803a448c9d6284933fb4d6517b4ed350e6ca0921dfe2719ce9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3da26d683671804b7783587896001671319d0044 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909396567c5ccf7b9b598f83f38ab49b7c2a1d442c304c1b8c03fcee7ed7c8cc +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5352f91e81b6a7aea07efb68b5f71f6e73d48bb5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630238d1b1f7449ecab67ca0550aca676cccd5beab4c05045caf53e965468582 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e6108900718a02e790fe183a78b16c1af9a5706 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9613c5f7a9b20e10120e3ad4ce5df68f1812a9e83662d89e4d166d2be7920f91 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6455a1985004f190fd7210eba70fb8047e6bd5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d937cf2f30b1e1f9f7fa042ea6fd969042444a80a05cf81d0136971cc6e0a28a +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46c4c8ff962180f7984bbf59aeac219790965eab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a79bdea87c414fb64dfef0a4f2287c8ebac97db907454a928b9f802b30b41dbf +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7b538cdc858e4efba39a6f786e79bb78c08526c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67e508222798dea42549c90e6cf35edd865975016cacca57943d28f5835c8520 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..70a912f9baf256b211f3967310a86181677d4572 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42ef5d213dad28040c59ec9971b02b60f82be765cfdd67e50ef2a073c551d3a5 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f71f661e92a5c90db700b1283af7fb0f31cb1b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84ff0f7f75f08c798745b2f6f1aaf87b1c87fd3ba0ecd5b1798de7bccec0432d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c17723dc6461d97d552ea0d04fa85e999834d09 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00694be649f65d951bc4524a5317f239d3f4cca66ff5b43639d6f03b43eb37ea +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63666a7a2a6a3c1d0dd56eb2a83f04e46584a894 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77db6232f799b1a7616a512ea11f5b5754ca7f9054b0e3d0cdd5383aa186ba24 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5931c1dc5accd970ee389981615a978a0b408b9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b07cbd2f9a8013bad37b39fe21432af7fa128c5119adf281dafa3f0f875db7f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fd6579f8e978d209634061579aafb6ef0a0e679 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6629996de9f44da1908ec9c446b5a7e9feaa3cf76cf52c6f0862b3ce3d96fc93 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba1e71291aecfdea267da365eb15278246f5d764 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:237c3365f2166be3136a3719fe62aaf74b30215723be85e2401d69f78737780f +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af6435005611b049c16508e174d1ee73b52d0d80 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db0a223e53acf01b420e5fd33989cead6d00a0cdd8b1e23a34a52d89b7ee1e59 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d24aff6f32bc42261fef44734ec8617eeb1a078 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5713272cb8cdf3e67c1c3bc1dcf06cfa2770d7cb8d7a07b1734346c5e150dceb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed7971ed5c90691c64979a19c57c04c702c1f20 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1f4546348d52ef57d4764e998dd778c0a375281da5f9f0877712f660781e3d7 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c07120be94e78ca2eb7a9b0b18219bc6661c1ccc --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d908fa837c577b79adbb8596e6f5305abc37a528b6af4dfd9bb7d91de492af83 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4293f8dbd5ffc2768a45e929600d3d5d9ef214b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6caf21d1712f7d71f61f793f90f7622547a8cdcfa1cb0b0b617278e128f471b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f86688b5f238aea7b90baed97c0cd08b450bc88 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d39595ce90fe349fb2bdd12762922b61c1a99a2b8b2d95c13b99b58d11c0e95 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29d0ca0a375c307b2cee0b8b13b591982266b608 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34eebc5495e5a7c6cebe89b1e697e1484ac4201f57afc991ae0806881a97de36 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cdee8d67e0d7e1c97badfbbd0a409bb17967492 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c88fb391f6bc0d3f11249a406b1b4a9b9d85d8c079a419ca0189b35f4442f1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eab359a6e88f52b0f4fe0b7a73433c86edcce94c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6038124ff7d4811ac0163d7c842d0845184f9677c6203a82815dd7797b1e4212 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f852552612cddeb3e5ceb953da03426babc3bb1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef647ff64553bbefa5c0a64e98183760c2c8fe61c67fa10010457794a7a91b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7a20a45a54ce04544e2f1ff14ac3bd7c35d9a00 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e0db1c4ce39cf85ecb15798418beefaf4690662e50915b77209af5164c7497 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcb78dd75dc0dd8cd04fa8444cb21d6b0aecdecf --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d78381d287947bfbae0a287a1f37c75bd4022f9b40fa049f774067102842f70 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a5bd91757afbe98157376c30a86e4f3c52ca4fe --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6d8ffd0c83bf0254c0efd6890d2dfe958580207f8de4146ae5c18030abe280 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50a1b8857da944eb43358aa1e2540feb9f0341b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a82fbf634b4ff2b0c398ed3877724d80fa374d328a22e7c5e2fc14d1f8570b4 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b60fc750d5dadfd1fb506be9c8fc80f835012c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:952c7f1ff485ebd1ca62f4ee5452317eefed071772ec19993e37f3efb90f07f2 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce790968d566aacf42977ed44a62986737b46c4b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6daf6e8c9d62c843f78dd0caf4c40a3681ffa30528dad2d7c0715a5f719684 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..661bd79de0115d572b1f85a328ab39875277e94e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b544f2e7c17b5ecc2e968d344a09d7294128324b79ca3ab70fdc5757da9d4623 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fa875206cf4f846aecb02fe07dffed78d1f80d7 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e5074d485ff05793efc45ecbf8726efdde70164bce5847fce6183781881a40 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bdd817121953fc314c030e470f06d83d38c3b32 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4aa670e805194534dfaad61501faa1ec347ce1c2989d7e7b292015fe2ecf4da +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..682c0a276d501b71894692b0a7de21a30e35b72c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc919f581bd787f757de34a15b97e128908328e72d46b5c46aa0a275f8ee305b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38ca9b0ef982064b740761e2c70d3f3b0465abf5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91bb01a35290e972ff5be708cd20c423c3b84a3e93f6447703a86686e65a0428 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ea23ee8128abfe020e2209e13b2c00a0a5c1196 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52977e16b77a4a29412cc7d01f5af79f830fb456020eb9bd2dbe06b9613889d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..334ee2778bf5c0073789065920843e1873a0ab17 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c170673cbdfc9abbb99aba815c036881f95ccaab96902b5558b9b2bce6cd14eb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..98940c262c1613b7fcfa059d6733d00b60d5c008 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba1972bdd1ac47e2ecb2afeacec2732720c032a1c52003a0f0cbda7c35b9936 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..69e63c6b0dac8327786956cb7d4f5666b2328a34 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6cd9beece838edeae738b0c3b1a78e6248fa9a5c59294b248ca4f5a3372c8c6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1616e5c31a5631501cbefb757f02f4c9edfe66ba --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d3a14feaafd4c4cf3784f40be9b766f0c97c90e75e6779bc7fad4cb5c14dc3b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6020af787640c49e764db228c4cec23a267281d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7c207143cd0d3a03f3cd46cecc3d87cf02ee40964d8ea4ff726fc9cf938643 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac8e10d2c07d71042e30b519d4b68dc5e8b9029d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7774ced485e44ca00715dad97e1f7705053040d3d01a9e29a74ea2a8ba780816 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..217a496e7ff015bdaa6ea10587e3f887cff88d9a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f82b28503f58a42685224574999d1ef0d351d4dafcdde54e2cdfa5e840010007 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54cc489313ddf094f53d660fbc877ec27e8599ce --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c21cc38222bf0c6d5174668d696c3b146be3074a07c32235e554b2df6114aa06 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d36282de8767e35e0fffaf093b40cf66d4c5bab --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b7fb76cadefa5f120f2b82d6f4be2b38ceadb35b5638f98a052ca572b3cf070 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f33a94e7f64b3f284804a50fe07fc653c7cf1748 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25c748999ea41d45cb14c61ef9bb9d32244c98aef14939f0148800d0c0a93cf8 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2d8ad2fd81a699a06bf88ddd6cbda2103f6b324 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95dfb30f7f708a66e9f0035143321de4465f4872554a77d0196fa9feab9af688 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..43ff0866b51dd319cc94864f0f6f815b9dcb106f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f097eb19b3a8b1fdb31f92d60c117fc485a6d0594420d027e7a9a10eadcd227b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead11d9ce3fe211f0202ad9b00e2ab8f9f2eeb59 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f07fbfa227d8a4eda4c0a88ac7da434dd4aac052608df1953d0e1794490beb +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e65cafc2ef2d8a44253bf19e3f5dbe6e78a3c3 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a714565c754df0e1beae21a406361bb0a2c68a8c6139bbfaeb0d5f1cdcea8b36 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..12598ace51f43b79ce8e9a987ac22249399153c1 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51097d98764454f71f47ad49b0269a9da284af292a0cb9d20dcb7026d7615d71 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..921cb87df962f9ee34450393e533cc548418d560 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5479ac01ff8713dc7c054e4bcf3acda6aa06718afe69f097876984805fbcf495 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..65209d45cb71e7675e32f2653510eded1e33d11c --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16ece854942848bafc53886d95df17fbe5e72c221e87842e9facb3e8741fd67 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7feb4762af251f3261fde868291c4d79027f780b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40a0345edf15c89354ccba175ca81804e411e3d0092d1d908f719cc3f5393ad3 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fa78df9ede8a564a44e12076152508567d6b833 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4676037a9bbc1965836008c0f0d478ec90e2ee048d9a6de394215a9528f4d42 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..558a0c6beb83c26f86ec18aceac63282f19757c5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce7d019a6214eba1e813f5ef141a2b4ac3b4921dd5e21317613ef4d14af24b39 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36a2a6aa19e7b60b69c4e875707c2e69a14cc55e --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00d98ef6cbcf895da12c52a0ebbf603c21e345bd9a91054c8fea53092dfd062 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fae4222e7fa2d602ed8b0fefdacbcb7aa9d11f07 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e17e5c6baa8a88d97402c45ec1237d0785923fb932c352a1b48a393834b896ad +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da609d0c66b7d0d0d689b3b46cb87f2677795e15 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:850fbbdad8a2914512795baa6196ea77feed0ba7c0673444eb648960b34ce643 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9740017789e7db52ef320660305994f20727c348 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8736eb97bfa39866879b341370423a8502db5c622fe6fc93dd899f4baca1b6 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ff4ba764c1bb9b7e30d17f41419ad79af7f4524 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e00a4e2f05bdc1381c5d7657d1f7b643b60e9b093da8a4761f225669a795542 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..857384b7e10bb4ac11847b2832d544f433c9ee0f --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:013ae34b229fdb53ad38a473d60f69aec7e5bd6528ddbdf4424fb96558ccf7b6 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a16bbfcca8984e7b12f5e3880cd198b03ae1a0a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ddd96c3fd9c0fb3de744b58e8f14b7e2ede4952fa445be0b34e2245c4113686 +size 42115 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7bd6b959319f8c9c92a265f5a5636165c542d9d --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce0ef05f870a8929fa5f852549b10db3a025a9ca669b337bf8e163fc4a6930f +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..34b226e34c9e07251c3f8f5a78e4ca88bab7b494 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4040ef861373cceffcb7846ecee9a681b2b7810b9f4c52639d4b3327765cad9 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f88984616cf6e35001ed5e65ca45c1556d2556de --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7958e2d28c80c28b695c09d1b53eac8ed681500fa1cb6c5251a16268de88b1e1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab8abdca0a92de34c341be5a44616665505cb4a --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:484bff5dbbd5bda7762bb69559712d9dc7a58980f19de6952738cf1491cab8b1 +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6df4f0f3db5006b513379d92f69137f878dd550 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be5f020b9c020c6970bb8422bf630c0a3f001532f6ea00acc0d1abaf97d86c8e +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2effbc9f5274f1e13022c6168e5bcd2832bc88d5 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cac6f04433ba94733974380d2ed7222f4e4ccd3d97cbc9af7920708eaacf10ee +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e011e24b2a9d00cb1f13fa3c2308a3b211b3f31 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bfff402ee4d1afc83e3a70b9a1da07d7c675ee0d5391021d674f8294193635b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23689697e7093bcba0c20f304a1e03667eb8ea9b --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e44fb1d55d56beeb7e09b1b20f798e73349c645b349ca456ce3ca39b710e5d +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfe9d6368c89df8d11e4f5adace3b4f722158055 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12450422835b90104ae85755ce4945ae51dfdcdcff9afa5b8988a3e72b11e66b +size 11395 diff --git a/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..904bf68afa572c0cedbc3c4d770d98bb0deca4f6 --- /dev/null +++ b/params/phi/8/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:321b5b6be98cafcc295987fca7f8906ea3b03ae8637374d6373ff7aa6ae9b1d0 +size 11395