diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..400e27e9d670a87b1c950985315fee980e98030c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c29e156c1ff233ab1d70419ed039b29645b55825ad507a9e5af986fd4ceae9 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3c2524097167e7235f18189986253a616c5240 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d346fb1868be25e65a36c477cc576c41073e90f91355004b4ece08f51507ba39 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b973855c488540058219f9ca0051850ec1e3748a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcb5815c1b18a1b2b7e259a35ad053f0f92cda4fe7f4aedf842b5b7ed8b808a4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39c7155b04a32a590201e2f191e81fda62c1f4b4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58251e8be6fc242bb11338b4e72059d1c24225a11e81011f089157a03475c84 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..05bd2a2e3c5eb904f7efba2d9b52db2f29f0b863 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8670b7161dda66e877fd697aa19f0ed6760930a209cbabf4bba66000da82b96 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c15cd3bb4388c877f007723f151d3656afcbec9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a20d1c3c46f99d4a952058d675574c2d376135c84c58ac18e10eedbf7c6210 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd973a806a1d9866ca4ed9efeecb505135c8b5e6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9db98c10b45da156a30cf94cb0ab116a8bf76c6977826240037b00cf661ca109 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aac264e040e98ee46584e72db79c040b24142cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98dd0597bcf79ca1adaf0334008170bb95a9677bef86cb2c1d8e13fc0614cc80 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f452380d5395a5c63dc61d4154414aaf6669fe5a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ea0b10a2e63b7ad75c1ce375c8b042f910e44049224adceda5f101c1cc8fa8b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccba8a7dffebe2bee6e4b066e7cd6a229aa73c06 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ab01e415b5f34ce287ed7142a21f90fbb3cc73d0a9e70274a2c1c6960f5803f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a94b00cd15617fa7ab00c05e90f18c2c8d4a6f0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae62ff3dada06fe225f1817368588e6b38d8f63d4eb46017832e7c461fe75aa2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d43b0dc011e5eb9a569b04b6dcec86b07e2a720 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f645ef58a615c7c1c06e89b3a45e062b0a42e90133604080512db48205f0c83b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..44fd0b01ddcb4309ff9d566d646e08d111f1c2a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65ba868c6018cc4a41523fafe05a90bfbfd3b3a64732a2ad610ec57fd55621bd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad5a71777278a5ca9af83732ffb39319472d6aa6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f263d72134d900da89acd3b68e4b4fcdd391d1e23cc47dd083d70404efc6d48c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ae8a9458ed00a81a2606e05e62e83e12e4b5724 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b2bb9b006a2687fe8d66019b9149292e3edebed2c1e36a99227f5bb2d1266ad +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fcec441b2fbea3e218de87d09d3b5d0053543ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d5a200ccd415e8f45c315cc038d952973f4a324382a750c3716b62faf39ddd +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc412c371247d8318bcb7a983bba8372af951717 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba127639cf89f2db267418e4339129bfd566ae9b48fb2d0898dbfe83c6b56a63 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d96d8a94e4098e2a9f2a778afdd5dc120e53086 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ae708a59af5d5f044a3bc7b8fe22721b39868bcfad64844a2c2548e2c1e6bd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae15d76cdf8e880e7adb1794a8f82b0341a53085 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fbf53499d0b961d8b457a5642533af6124febed775b2c340f1b1dc9f9c0a314 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcd9c016106d6eb3143c15fd93e54036a3fe96d0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0613b6730998620e96bf6df4ffe630b399618a846115de6aa07ca3a4deb1dc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8a1fa2e59269e3b63132739ce732e72ffbe560e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166d9368b7dd5e03c086ac6cb7f4d61538010eb4946d2ce6e0edc00d5cd4a45d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8026f101ddbe42a6712c22fcab88bd23e31df794 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16686336e2fbc835e8ab9e048cdb6d2b1f2c64c7337ad7cd2ba3ef84dcc3f49 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a9faec0d34238d390e7027014187bad08e31706 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a4721bb786edc811afa4d6dfac898c523f54ceb56a89d0089294a0691b322be +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f345bece72c60852058a2c63fcf9c2383052486 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2280e9ea433302c05ac327510bcef89d58ccb687846388d35f8b7d8c0f108ac3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b143db1273aa7a6f15945c2916aa844263d1d30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5c9efae0456f2cf88236e3cfe72a5c0161c60f7297606e2dfb4ece03b7a4c4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a7eeaf30a0b0523564a43b193d61fb7b8a24490 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd5d14df4c4ef9acd22b8734e928b143c7cd050cbc4dd595a42964ee061f2d79 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..165af206d306010c7b7386d2b41df869ecac336b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36ae0877845c22af89536d5f170183b92829cf538f22256d356229287df522f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e888b47f8dd1c6c89d1c3bcb44c24c552c9d8c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2031a4a649ba4fe64e717dbb035e8c720146d356c71e0d99afca695ba8839b88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..703e0594dec9ea823ce6f6714ee3a7ad650c7a97 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c71b49e954ca6219d6dcb4a80793d7486f2f094ac822c7bf88e1b51f48a83b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe73a307fdc297568cc76c5282f46f3055fde9f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:090ae87bca05f307b84a41488d4b89b2cefe97961bd0466e6fef3a5617bc9a12 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba662852e4c3603b0ddd5d9e0806063bdbbda415 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06c163cd43d7876b8c49b30ff6f08841f59b9a50260b52523dbe1114b8129565 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f54b6d30936d496c34368ca9a2b0e2868b921fcd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2a39712623c9070dc47dd547ded64f6518e0e919250f2a470bf5c7d9d370282 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1151c80712f21f8d13ca42e6d0f11623b4bfe8e3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a3b8c9b49264e82953116ed27e5e9fd9bd45be972975e47b6ec27edfe61e74 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..70512128bf37a86e7e6f90b4b0470ea003b2e1c5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98cc3accdbbdec1a0680375a54b8d107191c952b69c86368d1c2b8bce671dee9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b59ec84324f684fde53e9890cc80edba64bd97dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86288984309925d031ce55aecd679208931648b2e4b3396a0ef9fba6c98a1edc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..98c370a1d3c503474b7fa4d952e24913f66e71ab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b64f4a444c6c36c86c298414602a03ed88323659110b91f4445b46f8ed9703aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ef0ca5ecace251bb7955475835a8fbe7fc7224 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f44b4a22fe2179e31665b577a606c2ba0a948851a9ef2305fe3e6b6435b2f36f +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8acab5dfbef9d4f07dec4043b0ad626ba977034 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1783ce80ff5c90f0d4ac3f9ae49d643f17e989727b4e43eeeb2e38359026491 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..370f6947cceecf30170b7dc74996511d0e1ded50 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a496c89326d3ac07a5231d9fffb395764a3e4c6126328e3002cacc8bc668bacd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e96d92634d6e18a9e22ae1f6608dd114568e5ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac19444de3bfcce1e566a6ccf04aff3e8804146716e44694430f248960aa7b1f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9714af9dc48f53a34b47a5151ce1455865956943 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41e38edb8636814862d1ab3aca379f542e655b25c30ee6bf97251b5f46fedcd3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a1df4882b6f3d8dd5f7565810ba55f72d39fa13 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c1e3f9d2ae3ce68108b38ffbe955836bd4c15ebecd9bb07ce4ba5b7f140f4c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..709c5f9f7a1b462304f51b785e17bcbf9dc12f69 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf579fdf4b213d79ae847883ba3bac2692b5d3a8f5e4f7a6a535fd948d0bf49c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e96c89fe2b7b839545ba7f022aef9c84f1f1e279 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4089a43894e8d941b5c1f4b422f67a2f68ffc5e43f313bf49deee385a597745a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d83921cae43996c7bf2d642b86a32b182b0369d9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbeb469fa01bb4b52c274353485a7196e06ae703686fb7e0cea2ec843f46e110 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..372ac28deda0ca10013e3378041abefb746ecacc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d8efad1799ce145a7a9248fe5d42d7ee17b03e8b33c639e7d36d123f4378ea8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e1b340e9ebc25d905a319013930b196d2d8b084 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a83a3cc595ca4611a1f482bef6b791f9e79085297d7b00e8bb6a09c95507c365 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7099c4c7ea72474fb2c548254d8259b287ba9781 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:025537805c4027edf17819e7e8c1a28477dd4366ad18b7aa46b6dd1596034da0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa6505e2127d9ab4925354f24c792574bc394829 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6914ab02de6a8ab14a24b446564f89163442fd4bf96a20decfaeac1b7baa51 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f22c1fe839bce8adfb37292c63a080218df5e200 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adb032966c51966d26024ad8b05722b2f6f3cdcb8d63115f78e53bdb8e8e6698 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fc046e12265ff593b08d9f44875b050d0f8a237 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bce4880fd4361b3f281f1ae733b39bc0034b436be6292b16ba7e20ddb7e747c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c73d177865df6e9aceec8acdbd7ab2dcde2c1098 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e5222e69c0bececd4e46ca597759f07cab909c15bc72c6b2ebdeb18fca9a7a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5143868441205b7bb8e70f930cfa828288332ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35a26f43a36ffcbf49418d4020a5c3948b372dfb66cf0d9661070ff7ef79627 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f399a3e5f0a95de984e74d25d780695413f64a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3949149edc9f36e740b3dc258d4839a65f0bdcad5837cbdef0e38da7b69f0346 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6dfec9a5cf2e93dfaadf99c4bc00cfec8e345c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:548321eb887c10983693a522c915d48af055b6a1c2e39adae6c5e2ad8feacd0a +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4756f877a6bd4c840d8c065613aae9352ec01d0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6b48437cae937a164d24dbdc148e00fa6c3a445f98800be748460b56cb32bdd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5630f6b47cc21be45ef7f46c7149630c3acdb4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5cfb7372a7b9849c735735081e3d295f3b685db69b6604bd60d5ef254f0d71c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19aef3bb9d38facb91ff4b95be9621ceec3fb076 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91f8b958541a826724a8d76267f77c0ac8017751e8e5868730e84174862631bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4d135a3326c8c452fc42a948fa893aa5276d4f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8031e10086d80d07a4fdbf6636d4c35a3f6d7c85ba1c514283b445df293940 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..355b8d78526fdba9cbfa3e1053a6d91fb3ba55fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d53177c429beccdd982292ac57e326e7b659b2f6bbb133a2294015002c50a9d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a40a2fbd0e12059faa2f0c0d02098b29a811e2ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe55e13170b8b6b8c8ca078b9753b95369bc1c5f8dd0aace179f94b1fdfb67b4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..03eb82b70f58c78a4db6e226647db8da6f0a8e97 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d70bf975ec0690ae8516da065f1a4823f81bcee3014d9e7f7e280ba0a7da82a8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..356c414819adfb4ac225e582e7978990d57a646e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e9d02abb1f75b22e745c6eda4ad6f85abd5718117c9e873ee75492d984f69fe +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0e691f7733f1094c118296bc4277d0c41dc6d11 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73acdc4351e73cd70a2d95f3a3e64e95cfadbac7a89881388f39d8781a2ea058 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29bdd4437cf62cf5f358a64f1db23302e3ea4a34 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c6cd3f90615dd1e1e90a2f02b1eaeebf2d410e22ffe349c76c220eefa8cd7d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ce6aea0aba526b6be51aaeee8b15c226f0b5a8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b98f54845bd2c4fd49029a933daca7928b8306f01db4e6285ba6d2c5b3ceec55 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b2521f95f8214bc61a3342a770be5cd03ff650 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dba4c85bcfb7780165ad5f4b53fa1d00d1065384dfc766ad0e2e5fe7fb21c2e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd9e6232fe9380b09c2267baf27711a1b992b2cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a24c48d83a1d628407e89a9eefb722ff697b7771aaa10c0f6b65c6e13f87ed00 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9469a7f6e54dc7987608f036d915d33b5c138c65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:173a71cbcf13292855e2c132799d8c4d294c72a2f6995580ed577dd2ec3d8562 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19bd69ad69a15ffc232b0748baa9548e0c184e37 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:442632029cbe3374dffbbd936ab0d073a278049d4252759cb3e9c01e42d33051 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1646e0bf2a1a256526bc823eb71cbeda498d3639 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37aeac91461c1e4fa14fb4b0733bb130a70e5d3e5e0bba251a0d71238c6e59be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab5498afcd063acc2ca231c869afa617d7888f9c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55aa9429bb7bd3eb06436a445e3ed4ef6bbbebf6187faf9a8772de6953cdfe5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a0e1f09d2d1b256c0475573734c827013e11352 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aad40bb3deb4429554cd13081debd276bbc3f6db52a0127d878be7df2ad9c72 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b661b76d9d3d4a9367594da0628521d816b20240 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98157e1cd4b82e8705fb8e19b5be2d38581dafa3a3baea22cf3d6944735b959b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b273c987983e78cc5ea625f0a6887036880a776 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8fe23beee6f09839ae0119c66cac8a53f594ef34665f6e8419b457dd9c59369 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e11eae78d04c16781b98deec3b521baa14a3c210 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce046ed2db81fcd8268d7091824e1ee23fb3c0074114d9356044350018c056b4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3ba967878af6c979156ca4016cc9206c08b9b55 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3e9b698cfa2e240d716797388e90d8a805e81804006bbd222863bf227db7587 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5c1758e90a7a5908d82bdfbb279c43803a3cbfd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab460190892b22b451ec3b61d3f46c3bac50385429fa9c62452dc7ae522f9f2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df88b4011cc838ba4ad6fc508364f39a493c8941 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:669717836b41c2ae3be5c1c2dcfdea2af70105464eb9482cf7d53b6b6223a508 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ab642c8e652e7e9673b1eca929d80973f09d25c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f130193c58bcd110ce8cb7fc10aeffac02d5866b827602be14d227111851fdef +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f845d19819c58deb8a3711f69411960f92f239a2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b92bd3e40628a35ccc46a239c65fe16397ad1ef3b30deefd2141a1de8ab34d0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe08a499f5dc4221e75532f4ca50c999db70c309 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0389abae124383ab89afb1aa0e8b751a7bb8f8d2abd7e858fd1a77ef497ab6ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d60bee7ba90d84fe4f1e4fce978a0061a445821c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a456c1733c68b8357350e50cb9129e3e77f523409ffd2b6c9110d4539af535 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e277ba61c95d3693b8819caa560003a7a78ea195 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132ea0f43b6eb89e458463b8220cdee7cec9f9f5f6e516e8f55467765389765a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9cbf95dc65db8b9a3884932e8ad76dfb1b679d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b904bd020e1b802f68ca6df963c26c2b47da5eeb5ff21321989db579f3fe687 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88184fc6c82dbdc64e4974585ebaed1b47b63c1d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b3ec6d267b4fe47eb072f2a7b90fc2d5baf6e4c49e61df87f5bf3d7db43e74 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc9b1dbfae87490e657879cc2f1dc632ef337ad8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6890a07290093875f85e1be4b87f1840b086b29daa3ed11fc196d5baf9820010 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c460cc77f6c469227b217cb77fe44b79e352ebc9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b656bd7ca0d80044667d791fb9cc69a51e95d5355ff9c793c60c5a10896e67 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d1c6b317b739163f69156cda86a4b0402eaf40 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f26ed9ddecba2a952f4ebfb7c296ab19fbff083c0281908829baa15e33c9ef6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe042ffd60acad683bbb788a4edc8ba78b2b256a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01796cbf5a9cb8afec0a5fd8dddb5da7f81c2250139900c0a46b29e13278120a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8c56c5d652e98842160ce360a1d869b3b7096d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c02b113a6fb173c29e0f0ef959932665c7c62adfcf691e7a8131fd08843d6dff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4389f338c4eec6ef99e8b828f6fcb423ca51920a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6077a0a22a3b38ca77be7a9ee292c01b9970b0bfb817c3c450ad30f506e14a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f612fe123b8a359d0f65f1a41f89e0a19da95eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1785103fd6e1e8a1904b6de578c76b46605fb487c3fac8c55ac054803b0b9f3b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d808324e26fc0d80af6283acf48db4b9c9d3c140 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8233d193c335ec5755f37e8e89dc5352029ed9f6b844a8622ccfee383d18fbe1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b565670f5250d553e2c1c076c6905baeb100fb3e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113b39d436e73a6968b177fe5bdd5e66a851d0d9e0e72b0ff6dc6ba38742cd43 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..120669d759e0196fa80095433a3ee84ef579aeb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5aafa1ff8cd0dcf1949d6b25d55ad1d279a5c97167ada5e0e18223fae6a6207 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc45e58622b919abb89bbe28bf992b2754f4db52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0753c47367182216009954585fc3b6b59fd66889bd307f4943a09fa909032c6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f052bf0a13a64050a4bab4ecbe8aeb78960c866 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:259cfced05de9c87b99542a119742c3e21041450f9b900fd338c54ec7cc89247 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fd629d8b409ac918cc8251042ea0ec5197ee2f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1cd4d0b4281a702b2d27244b33c5ba08307a95feb1eee56b47e3c1aebb6992 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f52d943a6914e0d38503bc807dfbb3f3daf5205a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a3bfe90e6360f04bffc026529fe04acefadbe073794a40263ed2cb1e5eed8db +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d5afb86de00ca0186362b1ca555c2f22718894c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4e7f3808f8062d62772556413be6a0076ad03d658388c81c13b47c5b8a42d34 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ebd5e8951a2dfcd1ca6e9c6c6f9be08637fb23b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27a50bc972a7f13e7736220a17c865e34905ee77d9692b1b1ca0b1bb84505f20 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a6d657a93ee9ada456e9db52d01a10158eadb46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3662c02f25bf372dcf6b2de13ecb55bc992b363f5515830f809e688ff77eca29 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a987bb8803b4aa2c519f3a1fcc1f4e2001b3e2dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c6481dd6a02444bb04f2b2f0aebda91304b14b9dec677435320e272c8c61a01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bc0eaf3cd71176798581ff3c0057edde93c59ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5505795e1898f6dfe59f42a29917cdd6de4f15e6d8518ef2b60c70f6d97bd314 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf0b492da31e04f4d984a76d5db29e1c88ce3fca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddea9bb14bf9f90bff173c86c52a63d487bef3874efb75f507fe7ae955398404 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd8ee48ceddedd13f8dab091d35854c18a9e6dd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d52d4876d5b434790fd3907713de0c18a97490389f729a5c679d88283e23539 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..810a0a35c6ca0b6715b1b37face871fca751d880 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948ec075d32cf5cef7dcd4835d627d455c28079765fed8a6a443711e51b70255 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..92b223e9f0a236bdbef8e9b5d25ea67aee20caf6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6639a6aa514be352a9027362b1c16326f31fa4e90add4c8423c5bedf652354 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4811889d4bf5e05179e680f4e5d4dca736f0f172 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a481e98771326ec5c08a00b2b244c72a3b80cb9b8bd1d67d45251a04b1e21ba9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a353d654efdc854eb2dcdd12b3afe8828f19441d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbcb0e9dc6b5fd648a0eb5ad63ac916d68d86acdbc37a471e5a5c71665388581 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09768dcb5a63b9676daf550a91db450e3a9a319d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0719fe2480c8163d6b76b8e82ffa426fbd19f48a4ab12f45cf26edab96c18179 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c7d3c13c5483ce00df40f8958a868671d4e426e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6990934d640aa2044573f06a04c457a75a02eb2c804db41384358268ed65137c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cf276f07d265f8985e8200f7686cfec1a417d73 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2cba79db54440d492733593276553bb4a2eaca63bb67c828b5c623a870d04c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf782270d2ac1e69b41a1223a7d5f207185f9ba7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d45d6f49e11f79a45d05d4c592b724789cb855f0fd59c9d7221cd8d28737bb +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ef5c856b76f44a8c8c9ae14bb883b9afa8a8e4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e43b9a17d8853773e5a5fc6204b9fefb3cc9e15b69d843a2339062e62333704b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bb762136da418e2015ad8f2245adffb5013af52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c49a3b33ad42fbba60cceb55c75c51ebbae44b5c9fb391f9e8daa5f8f316e7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bec26a1c6df8d558fe1fe92d08fc8709e6da781d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88925669b700d2040ca8254dc1d2de485497543afd3518734daefbcdb0cec156 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e31e9cb3783a34781605859c1550b8db00ddc69 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ff796990580b9eec0640a63cad5efa80b110ea2020ada1a6304077702bb41d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..07d2c97c5c1d6bc5b7268dc3abd4ad22bada241b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96db077052dd1eccdd4e8e29e1dc6f7803ccd5e647541462c8c725ea6e528664 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2c4494a7f18d2d0c275de7a1713a460b61a7ccc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a526cc57fbe8a32151c69f3458f6926dd32517333a449a70c5330f8460a9f978 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d92df20da7ea4b3b3da0628f576156d1d7bf31ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63a04177fc808d1af37611837c590e9e8639999c49acd0974c0e1e3de76c7274 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10b4b4f5979c39ad813f77c058f8926e3d84e4cb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c9375787442cd15e46416e7e580ad9a025fddd47c2c23356f44f8a859bb4c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0318b02575c5a182c3e8f745fd9185802ef7600 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a2ca918952b656999f821f80eb1ffc34361797225ca979f019ab7b55a325a0c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91ae1eeaa1666fa34f0934b921880daa98ec1d54 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b68b2404f7907ff32a5ff6297b4d391fc69d2ddc12d9bbc490fa72f3f16afeb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10b0a725341b9972eb05bcefbef869f3cc1841bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea085ab4f6f27304c6478b99212bc2e6127b773421ce7c389be05fbbc4798045 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb55c8e985146b3428eeb442de01e20158368e33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca869259706f4b30d2831f215b11c8b310abe4cfb2de9af59c53e3db4cf16761 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc36b5a9107c66338916644d4d07f60ec343a066 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52139f7add459cf46b90b49413495b30f337b1d8903d9c720bd448a43f5f8df +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5220620c79d30460ef162cf8a1821c6af9488044 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:694e59a0acad258c70bc622f59e424f0f8b795b8aaa2f5ddd034ed752edf62b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b4eb10bd45e6d56cad8ece9a62d4c91cc12df8c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a15c25a4983dd36523a5db37098e5af7dac68de6acf2162328e465910a652d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22a0767194eb89d51b341edb3144e0fe79afb59 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c145a8b8bf86801d85975f23630595a3ef16b9cf4e7581004363ec6cda3713de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50441d3b139bd0f4cf6fdb2dbd10981187fa4791 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b68bdf66e89ab21ff66bdf5c08e9d03db2ca579434c8e062c33c1eba1c655ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a8229e37f5cf98fdf7723ecb9c89dd1c4712e01 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6130f47a07e63ffc43aead1d050516b5770e23a67d8d0cb1409971e01968635a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8108ede08779bd334db64edc14dc13de4ff0886e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac23cfc9206eb235d787d8c8c0b221fd54432f38317f690aa54dec409832d3ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df06b470f5913d7a8bba4c6c2f0b852bdc82abb7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:630c9d350636e7f6bed96d13ad9be89db8d3cee40e5539d0afe0e57b02dcb3d6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b40048677af6418943a77f8cd7a55ee372e76a61 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc2bbce47460c2ff07f4081907777fea28e1c20b18fb3507569c732217149298 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0049254efede3000ff974c619893759184ccb81 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6503a3bb1b1ccf24f41ac7af8ef929be1a18cea420a1dca22b1271d8ad0d02 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4170ab233792335b455830863fcbdc2e6f69d9e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0d122f2ebf533ca8a14954f32d866b6be8059e82fd41560d7a62091867c5b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3fef3e4bbbd3a0f24f767936f3bd9914eb2de8c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee62d42eed9707f6f6387c3c4c3ba5c2a9b3cda1669534ce120e66ac2b12452 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bfd13c5351035d7fcb2eb3b94e62d7891354ea4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100a6e9a4d70075772e953996b956bb6c88731134add793e2966b827c0a412a7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..965a45581441073b9a39893509a9109890253ae9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798b2b188391363f6692346a6c1118ac73ea0267510bbcdebbc42bbe25d5f02c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad67eb76e4ca0cd593ebb54f19857b2b1dc4e97 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04cfac6209731f986206b555bf4ca120f90a0aa0f116df1902c2a795ad258f9a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6872294d68d5b6c9cec036d47bab75b1bd176104 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8673aefba99cb075535abfda3517cbb8a3ded404783af4b85161f54d35ee9ba8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd849b83e2bce2eb424ffb28c2609310338d311c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2a70498d8730ae33b97f2ff983c9ad80827efe60131ba98413dba21c6fb161 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..53e420d0f66477537fd5c5e48f766e5ac136d915 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a80407e296e143e5f3a778b615afcce1915897e26da4a4d8d642596887f8a57 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d94191e80f7138a7b676c14f77978d7b78764102 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6595f5820fdc28a39c665dd4e4317df79786bd0ad52de86c63ed7fc0d6e2e929 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f45d715c016391a45d5decbc18beca808a5843b8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1519dbea81607acda44d9c3d672917b07e01ee6f74de0fb16b864b196cf7a319 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d00fab6619e6180128ebf78774838a49f3d2ac8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ce5150a7f8d198753e61e2617a0cead1533d324870ddc84d5d4b237ca66fc6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..909c311a190725944d3a50ad1913812713fd9836 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303b66aa0b35882a2a41a6b2d87c9a093563ca162129fee4049f5b1ed6bf4fa3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55257d4469831e55d363506c2f4ee4904dd49144 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97dd291ac2474f41a462002004c306ba86329ab99ed49308a9263c59b7423e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..200bf4f34d42294b80f960f3843fcb67638a9e47 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c751016b081472a177d6b01f2f7aa360cfd9ea8dd69f7d9cdf4852f2311dae8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa35c185f1a7613b4030676487a172a65ddbc39c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb1cd9efa4cefde690ee9851d435e9ba118de771c2b3b81e932677fff69462d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7af297d6fb7efe84342670ec6f3655d369e848c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe4bb2f2b893a3f523b7ab812acf633da39cf5ab13c6a013130638770c9dce9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b975d6784bafd47fe899c38442f634df0db0448b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217cfb859ea545cb41f903739bc11f3e9d3662a74b4525838f7e449fa29c09c1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd698429bee940e83fe55aad644e0ef54e438e2b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f41b90f55f5d03393fa6e0c8a69e92c0a988e132ba7f4386ad1878cac265203 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d1de2ef2ef0e7a37f0f1c12558d8cdf4857eef2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:380523fee556ef065e9c5c62e0cfed2ca100f9d1fa16bd23778ab20d2c7c7aae +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1149a8495cb97f61e92ac3ea4076ddd775d0c8e0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5f06f8971e7aaf3a4926c4f712b89fd1da3bdfe673dc182f0d30cf09a6caf0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba53974db6a220ab99701ebddedd6ab9f8a3a19 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfd20965688ab4469449ee0a1a41f0b8937a91e1c1d3a0d83d7a1ee01417b285 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fba9a8f6672d78d0c5a4e045ef165242139cc868 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:398e4c809dbed50be602c35e3cc2da230b36eb81270c087487f7277daba3d500 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ae2c52c2c501e02b5247b228960f48a8bd7c14d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24f09dd7c6438a08abe02cfb9d646a151d12d322017269bf1f431626780f572 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed33eceb5c552b6b03d0c4dc5238a84278908bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5906e21ab435a898eca28c6f4d3a6056525604abc7e003048acc78105ea9869c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c6c254707f32579815b457083a449afabf5d7ea --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b63582933986fd036ee728c12b62289262cc3a3402cd80b0bd68459610f00f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a3657fcd4ff6706a006d893df6b288fa8be4eb9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e979014800d22c6280182c84e4377820ba6652b2325a00576db2d3cc45864566 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e52616a7e3144944d9e8de3dfdabe68221542d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95a0bc6d252a77d60656ecd5494bb563d2bedcf506e9df5d9a3625572703f04c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c472efa722b90fae8ede334a006257c1e6ddd06f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40831768a56e76a944c3638febf234cde8b8ac7a522eb02eb8f9be5102fab2a4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..523562c9b4ec97568f0ff795408c4510515dc56f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15269de5775d9ddfd47c09ce132f6a8d5c2b44e71d96376af832d977711369ba +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2163b5d3261b5ddf59c9474f93a223fc14dbe495 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57940bb13e91ab006e60402a373609164abd71e670700fd19afcf1d992ef67d0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38dc9171235079f2fc7f4dfe605f995e3d283594 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85be944846d77f32db3776f3a1a69bbb3d7731fcc27131ea106a07adca406adf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..57ec3342d32fb6e1c4903bfe710e75bf612ece6b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2fd6e90320379900fa020a27037132db16f7e35ebcac8e78214f360f6125fb1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e0fcba2944c0285234b783db1c7664fc759a523 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63a3f169e7b6b203f8aab490b4fa05f42d54f34b8af8e374838609e5a0cdb610 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b520a5846a591aed6faf8805a6cd6d0d49859506 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0fe8d82d3365a55387efadc32f3c3ff607f07fefc2284961703e3a95452cd8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed9f1bf2433837d9f60f0abcbc5b71f22821c71 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928fdba683c2f66f1b6de3d85d97a1a509940f0e57b731650c4a7f85e81f1753 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eab9ab0a5cb4ce124ac53fbf001c69ed07004b7e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ccc712317679dd278639ac9460606f2635606e3778e9a1da468277423f831e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e48e0c3672ba12b45a4d372f2f53b57f641cda0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dbb415e8f1dd151774796234b4a033f013fea17c037975e8bba007bca8c5e63 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..13c9fb26de5ef271e818a1af300d604e0ad1d6da --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a5a31bda1c433f3e9266442c0af4ef886b8e13a3d1784dc7ba01e4f5090dad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de871e15f2c3ba9522ee30cf40c7173c995748b7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71190e739f2abe04aef7801099ebd9ed27c254e2fe5cb0d78b19158478df080b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfa237206443f5297e817e6ed43d9f32ad01dcc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd77d3587fd4514656de0559930a4c36665e3f6c4482df3fecfec77fdd03b346 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ec1db5d99f52950444a2996713641f64fcbbe7d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3253c60c043726561f0d445fe3926675e61ffbf75bf268dfbed7d12e13c643bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..083a09027ec0ed7ac9845d3a71dc78fe99985032 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbc2e5276ff7897ff261139f64d14833381740ecb0c2b8d775aefa9cbd55e7a9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3897bd06d0530a31807e5ba06531afe5d754678d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21f1ae70eea2ffc1f8c6e91f58a767a042fc22e339438785d00f5fa1c74f745 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a93f706fd6a4462dc602f7761eff178eb5fe0cc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c1d38f81713681c5dad411937e65319d242d7947869e01888603563ca76cfd8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..842e8532536a6099ff2fa3490c50e41a17d36919 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1bedbb3a22f9afd5a57ca8b2aa513727af86c8fc60be870097121e417b1a9cf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1d79758ddb1d36407e9b1178dfd17fdcd316dda --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e59dcf947b72df1bb68ad15c77a22b7b91a4e10fbe8aa9372c7febc6f3b04f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c829053cc57fb12c613a2bb81a307f7089d4575f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8957e0ffa05d6ec233552c6518b7ba57ec729abf9dec0e5897e9ee4601f69bed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a07e1b2ed79250421c69609373afebaa8b898e8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3177b8551cbd9f67c5d4312fc7e8cc8f891c3ca19dda66e9794b2cd9e39e33ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac72cdbd5c3df13d28afc374b1bbc2baa7e29e20 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113495a6fe27aced5f14af250578730a89f8710cd88669405aecdbf0cd61e6cc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55abaf3e50b06875af4383283091d6f70de6b3ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d5ad6ab62fb18b239455fac7256d7fadcc0ca36791adf870ced729d866ab2f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86fdd4087e1019870c4c04ed7f170a1d59ea0d04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce106152689ad5d4c1b0e68785a36b088a706c7a48f32ae467e4e3485395bc8e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd1f5f99ba9becb62e377f9f459f4dc6a9cf7ffb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc2c916d6adb5863512b09ce542ede8421ad46b14fe515c0827f4498668d435 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bac69c8f7c41b9431b9d20a9e5d3799a8442fab --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71bdfcc4f9e043a949c7f44a51d20e1b0b230dc842971d2ab6ab52295fb35346 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4be3f8ed32cf7cedee404c18838750451f9d0db8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daf0b5f80bdffc8852ffd43e395e088c350cfd7f1e5e5e2472d8d7790f686994 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..124c9059b03bc0c235c965d4214f3942cde497e4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6e9575a33109aa056b19208bd3f0ab7df4d61eaac74bfffd22e642a092087e9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd14cc03962f74612e2e9ca41e64ac94cb42d35d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a3bdea8571a8d597fc047c46527b1f47c9ef58b066db0f3afdf56b034231ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3343bf8c022eb74b8607bc703196222ac7ab43c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfe1d0ad08a203bb16791f3d81680c51f9ebb4647b3da0f05677381528b082fb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..55f900faa1461958e7d661b66f6ce3429054456e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45fad3ca8d08523beac4672c0d80af773a77f6c199e52e575824a62726a0593f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..77ac40cb6b694afc769145e304b2adaa047cebee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d42d414a0b6babc29c20267b4b24cd64e3185c7e7fa2cc31d2ae8b567a9551e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4813b679a3741936331ed355ce518a9ed28047f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc62112e5bf1cab38758323f6f17b9a604dedceffb3c5cf57b317793237a6c93 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e15fe0913e970aefb86473e943f0b5a3082fb77 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:918aad4e8011f7d13afd92b82705c92044b98b37b26297b5b0f2a1bfb7ae9aca +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..43f9be9419788f2ab264ea0127aac4730d888425 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b11054c1b8a054da45194e02175859a00fb0840b537cdc44203d977308663c94 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..521bf2eab219f2c6ee61d479a6dd43827177d073 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06c31579b77f627eb4278e0c8390528ef70147c50b6d1d8f8a75df5e7e54137 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..397a1aab0fdff2543676a067ec21fa2b6f01e462 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7090dc6762633109eb3f2056beb6ed0bc31d85d2b7931571e8513834c69103bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9343cf6a9afa2fbe8b758ae35c3a316385686273 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ab5be78cb5d89dca1eeb2bd8d3fedfd9dc66e3d183e2d3da5050f02b45c864f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c92104e71d9d287c273b06f5b747cd3228f7a4f9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b40c542183963bcaa88f5b1a256ebb4dce85e25c10b19f4ec709a2a13de3fc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fa2d1bdb81fd1ea3600095e50b9fcd37e7078b7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ef1e082b98c28dfdd48b4ab7573f94f29375967c3005a96651d25a774c44db +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3a404aaa50dbd9e3da83d8b144df715ac7bcfbf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6feadad8c5d9bf2518f4fb134f7b2422618b1e4b61d661c7a651825054cbfcf9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..323342ed075f2eff44786e35bf9512a61bffc0d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7908f74127afa95ac88b841a511ad228968920679aac5e259b9f0baf97d91203 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5045a3f91aab2b92797418ccba57789f5282ce5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04b024044b70acae9785ff8cc54023023608f0a7585cedb7cf50eacb985a895 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6600e0fb0b2a380dc0137e13b5e4fd1866c487a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0929e89cf9d749626e3b05731883d15f8ab4823dd1ecddb85aff3a97f3874558 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..307a3a04a9940903f72072442fadf3a725fabd92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22a26f5025f0586880b55c300044f549779eb3acb0cdf7f73da920102ec61448 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..da64869ab5ac1c786f0fac87f741a74346c15c02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834a1177843042d515138acb68d0db01f1b44a75ae8f6a68d7a38f121bf7fb4d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a8350d873cbaf268eb8a62894f8869ab5a1df36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e3d562266f337172b8db5e8fe376829987b7b9fe3cb0ce1af61b3ae355fd2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac31629e66810beef1aad8238bff75e38312ff8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a25665fb4a27ee8b19899ea03b2b85024cc03b2f81a3f01a1ba98c13ae9d0424 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ac531bec3e1f984cbc6da2072275eebedcc848 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aae49663620750ef1b42b31d5204777eb39a1af1f1e7ab7f27474ddd4803198 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b5c57303bfe47f10713f63b3e015a5caf12665 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe783e4323581e09e2ffcf11a22ab8311c5082f5d9d17d1f5e64f39477c56c31 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a74df1dd8a7263ae35d386de80d319ff935d1e89 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec9056a98bce9499f25ea88a500e36a40a6db1bfac47b28806b76c30a7ee4fd4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba7285d5d9af4eb92a70d73a1c090a421c4723cb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382c38130a622bc5185bb959db165afb2433afe32d338185db7551c33e5011bf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..762bea624993ab94a294c690698e36567b0214bf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd12ba5e0edd5d791a6054fb5a42ff63af5521f977c071d13f9b0ef90d7afe68 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09ebcc7925fbd39a4ac6130d429bcccb445c31ee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c6136928942505a213147dc5db5edebeea9495c812388dd9003c45c5c6668e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b1e93cccb805ae11fc781958f0b52c87aaa315e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89e6390fbf9313243d9513823cc3fd3d3284b169efdcda9be2cf093569e96767 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2152222b205ec1f811c4859ba52aadd06e0d67e7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0bceb649d40ffcb2ffd5a2a5644b187778c5ae78f283cce00a62621ae641c9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ec00ad8c27091f88a70fa09166d8fdb56e96529 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203d0c0a9aa7ee61b5a3627781e4a624952823ae33eca56134e0db4503c60465 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a56f95307137aad2501d17e0a58fc61496201077 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f952506ca03376f4f42edc2cbf702744335aef7b308a9c2f2faa5d6e006f3946 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..36e3b313b2515f96465b2d508ffdb1950d7edfd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5295f8b399c6c54880dfcd6391eb9ee3e9732ddc1de7506127ce9f2c28d64a8e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2429a9012bd3f88fa6a1a501f9af11ec2ff905bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e1a9f6726615e6e1030cbe64543f1177103d98856a617e60b0fec1a05ccc555 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3229fa5266b52448d2e7772e6f254355aaf7c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2b1b81be653dadb8c34e6b2d62a5e32b1fcd589ec5804ba6bee6c85e37d563 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32ee18bf2f25e623153f8e8e4fc5f1257a361dec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f2cf9d8508ef8ab0f1fab002987be0430f7eb52b87c158492cf04b7033c1d2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3f8ec947cadc343a79c0e588ab757e26eea477 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/init/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2de2e9f4ddd3c5abb9c3f64f8db0fdc6b67925fd8f55bbe2f384dafa6e8e254 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e49b70712d64fcbf53e2817d1a25b65ef9245c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/lm_head/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d37eb8dc96d7b089be6ee456d8077da7eecaa3670aeb468e47867dcd9a72434 +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84b1ff8684b3c2e81ef0ebe1324f87f7e55a903 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/lm_head/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b318d588d65c77686d6feb0d13ce129ef7f0679d7e41f9e34a01a099d247490d +size 205955 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d6968952d4d5fb7e452cfbf0bca2f6d0f80de5f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28ecb836531f135060a1382f3031292c930be3117bb1eb4ae9239c688c307fc +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..25d65bd318313f582e9e0d1ca6cd297161170103 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60b3c746fe1ed3fa33a4c9470bcdf1089a20ddf6f907c2daee321cd0e6da5f71 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..60f2fa21a21b40309551464718f373e0ed17af98 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f6cab409c17fea4e1dc786b6d57ded795ab72b6ca3a9605385857f0227610bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50f74ffd390c1a94ddb4422d5946ac88ab39c54e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:528fad1f590a6019319d1f77836fede1611b1447a8e14642fc55bc5b4af26272 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05e9da763fed8106ab17c4ed076cbcb3adaf9d52 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f280ec0699009d5f2971bbada4e528df829328fa5bc5ae164232edd4b815c9a7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4a2cadbb9d56fc68c2ec782fe2559712fd4ed92 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7e3b52930e78365c46065e0192f644cb7e46c8852d68a38e60ff3c99ecda1f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4b23980a1bddcb8b8f200dded53f9df40d330ee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5476998efb65f520d91fa699ab8f412c7c35cc0f6f1968fe2e9d5a5dcaa11b1c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af70e786862416ad68611b3596507c705057cff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117eae4959c3d80f82f67a8708154cb6267672f89a270a52f18e38fab1cd5d25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..485595aac9c3ba722e328890d9061627e23ce8ad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fdc225c228c4ca318d573efbf31da90b7e1eb4b6887c1efa44f72cb91b35344 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6bd18f720af5efdf7925a6628921c666cd17c80 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cbb5a262b70f946ea1493e67ecf9ead1b2069b122aedfe51a4bcf446c7bd8b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aaa4c0156924930c1d81ac423104fe85716e764 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45f83a941fe4af8938b6623b9408a436688b3ee5693eafb2fdbbce7ad161435 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3c0920f4f39bd44dd47f048f18baa1f713d6ffc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.0.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3069fc5b194d2ebe74c9bb8544e5f3aa74ccdf29b78d4be8a83408a6f7ea42a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0db29530f811caa4e274ffb55630537386dcfa6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61db6a1254b5efd47b0dcaeae81051191e2493c7944fea51c11b3de3de5b0b9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aec162452b56367a3ddebf46a5973762f663d8d6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00621d3a1e626b362cde67abe4d31507d04a4d03744fa880f7ca7e8d0aff6b9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1edbaf98fa0a4d2c997bbe5a4f7f7df378231da9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ef312578a50ed00608f90831aca3633bdae5813539c2c7cfcd1da363f9f6c5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6748b9957c708877fab14f551bf93c1796711f1f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9605e1a563ac59d837cbff15752ef7210d9ce8b616fd0ef573a4e38a228a4d10 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e59825b7d316997cbb0e5dea30d206198e11e50 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:662d9e38461fc715e512cce94feac78e59374507751d3396657d45672f8a0c35 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4eea87ccbc5ec7331b3ca0fdd1c96c1a728e38e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bef39ccb1118c3d6908ba2fbce30d5e3e802902236c9c00a09848686cdede3c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9484fc17a88cb101084d4aec64926b5cbea70e24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:678ef4c68ed1468177898870ff0f494b17363dd7d930f315a6d88917830e5b27 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd14ddcdc803eeb4d7b163162255c5e4fdaa3ff4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8603fbea9804a67896d2e7e3a5c477d20d443dcb8082707ca14c15bccf794c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..87d8aa8ec6e28fa4143cc6b1551e1d66a46296d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8297c21ece51fbc166204721f4e44f3d9a15a671de6f6e76cbe54050ced0b28 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aab69d70a4185c017f41c41acdc818b6f6363dc5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0036a637eefaafca017350aa67ff486163b37562c9ece2852089a771d58aa728 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f61623229f1165b59f91aca771797d75b87b948 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917007312ef30413c7f486bf4c7b4ddc07cb917e9c18a45ff76f02f7ab407ce8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c5be9327429e259f14acbedee196dbb1d91d74b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.1.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe796f2a708a95e11713874863e953a690ba397583918c6a223147f83cf1748 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e2a44a2d4c71e6bab1f173acd1a5ad9b346c3e3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32f2bcea0974bdb786fdebf7990674a2b54f04438fae2bbcb1a7ba81aeec3799 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81a369e6d6ed939bdd30d45bd701e2be4d674165 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db746fd53ce7969227a149f629830301340cc8766112fa9b1a1cd4b65ae24238 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce0180d1ad56cb45e831a62a551a8bb8b8589e81 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56f00e6b2b96a0d6e3f1af82519f6657423660b32d04669d28811bcf6c9b783 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e682f15a0401dfe0642ea73539076aa8219e8b3c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96966213860910c074300c2901ec059ac6809806917f92d6dae00a3c0ee155f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..abf67333c775ac8df0775a742aee28a2ebe641c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18bb891a02054099d411fb681a0f98757e1b5faf224848bdf757b869a6a17210 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..59efd7943dc8ec6dca5a9fa43563060a58393e2a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e42ec55630a88baf961f53795b439dc34ae1a1e53dd18132c55293603e1359 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2e542c489f5f0463ad7eb085fb7ac99ec38404 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0537d570c036fece20534ba060093db7114db986cfa80d43041ad088fe3170 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e86fbc2598aece8a128a52ad719beb9e1b0f009 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d87e8cbeb3f25ed0308ac72b970f7e5fd1f96dcd243502116536373272bbabcc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2718a99f9198159ea5002252a8dcb09f04379529 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78bbf9b90c693e512b22545bd21483bdba8b806aac14af590de55c195fc39b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a43cec3e253f8b4440115cc4ff2902068eb20a35 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15c341d08c477ab46beb4bd08efd7356d981d62ee964f6d316695bddcc4f431 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..968286040657b7a87743fb3c4e07a26d52e95dd6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7677e135fd84290251ddbd4c9667e0c275aa224f98c011c99c17a1434a79cacd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..50d7215a81714e63420ff6e4bdeb08ede449c1c0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.10.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf352468702f57cb6df88738a8fd35bf293731be0d2fb15311509b25ef0d244f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7926ddd518dd310a43747016c01b2cfe091265c7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6760f42210efbb2efa68f258507754b93136502762762fc0860b1a88fc91ce56 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5afd7cf175fcc7ecb50cf6d838fb75e777e8861e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1f24e9a37d62e04af05f91b8ed0a971d22785b11614554d8294fc4026050e5 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93b61e03bf224ef96951dab56dc11816b07b76bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f64c4f16ba7372c7638fe6c7dea81a650cbac1d45e9d266d6a5bda9bb105a1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..40595be9dde3ebce1b17e977fdfdc94655824578 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ffbb627cd3c5da77e8c0ff04b3d2a71af03805453856dcb81f407a20d76568f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9ed596871e7ef57dff917b824ddc7a8bc0f6b2b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aa0caca07ec73400249e702e6f5d5ea209753f9ba73d3a2152b4e7068981bab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c885a9b2eee83e0472234f18ad1c13a655b0d952 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc5078701a8de545c007bd9bb3db60185f4f2358dfd60f1a4e236e92bf8c281 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..382482cfeee9ad4f2c297a540f0dc94eac956905 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766601fa64243e21698d38b844a990ea04c681840f57efece850ad79bbf24b9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7ee65e9d263c13ed102f196264e062c98d5f14 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88d983de23130d02a8ff01855172aaef36a06866af469cdaa6d59cec368bc4b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..af8f1c347ad1a6a0c6041867022bff7d99306363 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b2b23d5f0bbce99e6e3249429bb038e8d844ec2a90e14f0c0a8cd7b6cd68a2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c983e8a3a3b13176215625036959434e094b6dd8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80d290bd30121f35e44980db5d1fd572c8b028b9f00de6edf1d9360c4afd357 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfb8d55438508e335c1b469b636c847ff5d329bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28a7fa2a38f8a6eef4fda8c132b6ee0bf32345d4ed99f59913b19312449a3cb3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fedbfb226047bc47026f8cb3ecac846ad4bf8df --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.11.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a339c92334860baa5b2dfffbe013a16436c8283de9078b86650b3b8717de900 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7f12fdf3f1b414cf30c6b5d6b84425437d5b44 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8773b86c0e6ea17d9f8cdfd912e0bcc65cf0118c4b794b279e97cc27bab9cc05 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f1b97ce3028d9e030e61d617b9004ea6898cafa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8569512c215e4f904ab59500911c12bff76ce2a4dff5838639fe9d35b46aa10 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b892a794f49385c3b784e2a4692a16ba8fd16e1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda38efa06e4337b073a660afe7e0d8666da5f00d112099a44a71f2f62c6f336 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b5928a42868724b1d52bfa2f3c130e24ca512b1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a2a0f97086adbf9676b5c321d56effc6bcf0fd58bdc0aa1e4be218781732b4b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b83c1612daaca1b5ff49b005fe14ab93cc1f2906 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab97dfbab0bfc711d02e8307f30a9be81fa74d882486ecd89c13126e2311e642 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..319c09063da19b400ceeddae02bebde28db7d07e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfebe0dfa1ff663bc293cb4e7ba6793ef81660de286b711e82a76f1ecc0ac55c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e2542aea6a7eb5adeacd64f1b3148b5d50bb455 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a1cb7de7215e1e357cf6b256c77b206b400f7446e8578647c4b44fbe240f210 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31662d97c1c246def2f434d93ff7ea376092e938 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2379c4273fc425d1cb01c31822a17b57624373fc6589505a33503ec9f8e5294f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..54ed7768c1e8176f4903163bcab1fd9280629bd4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67b89c47747ca7003d3221a322612dec6ba36c24d262578129426f9e3a88d6a5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f92123867464d910d356b3cc66213aa3cbb0d537 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:732e69ee6d73050743d49d64388747398300d5013d698760f8ccb05f08e67660 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba90b2b8eb5e6b8482c662d951357abf8dbaddc6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4894529677b05690446ac7d72ac638e8a5078826a1da412b8b28fbbb96c8d2d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf91ec899b2ceca4feffd23ff76bf3e74aecb1d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.12.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:819e96ce319c631401cf6b68ad795b617421d3137b9ccf7d7914bd8a469376ec +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e08cf447e94b759c9ff2994472573ad169c382b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02aa646c2dadbb5f4a2ba46026a1837f96cd752d51b1bed0ef929b84ca0cb36 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c49a2ebec9ed0f4c715cd17b2c28e7c717ac420c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdaddd86988144243e3d6228fa84d32d45c533813def227a561784a8333d6779 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ea1c8af6af5bc81601a1056b135cc7d3a4eaca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48dbe78e107dbcebc68b9618bb9800eb5f3c7ea024ad4058ce9578c8c8dd1a7a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31f24a2b8e269a403a43d18439a4c684303dfe7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c077e00e773403dde8be4f4de3ed81784774a56bcafcedab26a423a9210847 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a76e1c5cc1ef778a7ed22aa871e337754141ed20 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08eb520997dcc30a0c079dd9d20b5146c674af552b7dd414aff32f4de4495fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb95030c1a5893b5950d0ed60a357339ac0abc0f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a9cdd3399dea6d14371089f52fd937c342e22238139b05c8ac393275df9fe25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..524420f0765dad91a87709021ce41b9a679cf5a3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:081d1cd6e370a94d40f92f35df9c41c25677396b4a656582d675e923fb6b539b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b18bc9d1a896e42d91031c821e9b8f1fd33029 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:134450eb3da02bf8de921abbaa652d616b0f5dfb8450a741c1fa82b0ddfc6a0e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f48588507e5ce64bfce71bd2ecc470a1e016785b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee1c6a0139d951b57f98af7c6dfe5b26f3185a5808121ca74a0f22b8c378463 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9878a7b8ea35bbdf94ebad67c210d6c4c7a911ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d77303db89d97eee91c1d4dea4a464907abf44495e73a9f696cd3a17a61cf871 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..840ff6a0b2c6820b5626dd337107a08508e0f1b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe6001c5c9fc58422ede4fbfa3f338edb6e1738a6c41fa9080328de0f589aa88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7563015a8b0f7175f27d4cadd7e089e30d269383 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.13.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24350fea3818269689b0b63d965801325f8d609109422cae6150ce55d4e62092 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f8c53e47e08d91d423c933a497ed8b1cab2239 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6647ef58b70d0a7235f9a43d53d64ef998dd2469dee0363442bc9ca103f3a0c0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..29e4508e02f24b560e84bc1188e126e064adf734 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a20c91bc5fb9142af18a2fec11a2a9ab6f83baa4e9370f82b17d776457d5114 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ea901db9063625feb29574344744f736a010bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8afb66e7fa8be88eeb4709f626938a43e903f2ac0aa785cca1b00a149c661042 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac65a17c70c2757aa3461929c608653168ccbf5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d97b0e301a5b04f16c8f39acb88e691262e0fa23095427c4c2ca80de0d7ccd03 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..73113d337eadac23b9ad792bba25025eb4066606 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba16f66272a02ac1d7018e5c21dcd7bce9832975a5b563148c4ebf0a798c39de +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba76a07920ede69512f2c5e06c2d4438bbbaaa6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dacd0c293f2ead4d688ed3a690e1326b0f8ebd1571df5dcb4226da3e5fe0e5e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad0ff66a4b89fc67904b56fe2abcf23dc641004 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fc360f5715fa45166d3b27954e080af2dc375cccd74abb69bb2c6c0b07ef147 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4329e60fb710694b8ae6c6e87d2ef9d0e3ca83c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7263c7bca908448100a07984a6a919fac68e70f45edec7631a94105a88f9ad +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b72f037388585fbf89f459f7bdd1025999b688c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afaec974955128ac503afbdd50d72992ab24a22ac027cf4bbcf0c10ceb81aea5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c89da5f6dde425d84e958a91b7ce0020f780dd9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087f8d097f997599109d19e829da7689decbe1ee355f2e904f549ef88b7888f9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d8f9e2b1045dd0bcfa7212c6454a80d901b233d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740f74bb98be43c8533a39bb7f16ad8cbcc7c0fd95e0968dee4c83104a6fa326 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bcd2cfa6e0a85d582d11486075e6d0f2719f303 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.14.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ea64df521606d48b24d923a9c111f400879d724610c83b7c1ee869faeea3d90 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8fa7167af2aad851a40231822ee38b4df924f8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae12b2172b6f63640dfb704f12c97d1d75afdad25842a6e0d9fc4306f1340c38 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f8f9937734d0763616204f69eda6140a5323a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbca4e68bd08fe8a1c51f04f3ce003f125995c9280b41e8cf2cb87236442ec3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cfafed98b2e6a512030efd64d4ac2fd0b9359cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1cb734f1662897af96caf6e335c622efcb4536bf5db4edbb2fca375dd11a63d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e5e1610adae53cf312e47f241a5843c0622fc0e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be79dcd399d29c4960c02b86ca0ef6363ae58131328685af1a66064b999732e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8991c7f35dc9daf5cf6de96826227a24abfdf98 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7c5932dd45c61b601d29c3753d34f6a95d0384d07255b85d26cd38d00e7bed +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bdcced6ea5071a8bd77b3d68a9aeda189d3540c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2520c148320feb15cf577dce694e976d90a02d77116550acc2ee6f29ea2a8a4a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..76c03d40eafb69a1e57695648d9d9dc12153dc33 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a1f21616160f152632f3a63127c08c66b93b5c3da947f883eff1ac0c3821c0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..17d846c5dd84aa05d7e5bbb345af77830d195f02 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d98eb425974162e6733fd1faf6d926b401ca1d45627904d12fe572c0696bb396 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8dad44b66b92308d53d159be44342737e2b45aa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b89eb879bb3791f1d143403d5dfc3b62bcade73fe0232298ea37ac19a2c0367 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa9a5b14d1eb30f15343c2f91354e4ad5a53ab1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f0a4a0c538d12d056dcbdb69cf9a354cd9989f061de54b38e0ebc6c17fc515f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15a486541e843eafa6b0aa4a2ebb40112abc83d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e98f708283f5a09adfd4ba89f3f231881340907be2820e4cc9d19890e30fe83 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa125504d63473659ba7130c7af3dbf03d5b926d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.15.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e78010c69079fb2b7d0180f6789512b20f833ecb31a4afd4e726e3590e4648c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eee8ac65546c093d26c67310d0387b9bd968df5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7dd9553f3deb25878991856ed09c5e8a16636891934b1ea8b1ea646a1bb780 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3f68e84a8d837402a72e5cfb35a39156f1f80e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc16a523a1804359b2f644e018ae8672c2f3e60270fd3290d7a479958748acc9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b066e9462e4b091adc62d19776b8c7c770697a4a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f0828401036b1f49dc7cc0fa441b2bc34068084b432645b6b33458eac100ce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..495f9c20f496d6f1aabb37c0fc10f5f67728e058 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e3bb7973c877516e427edd966b8722afc59c12181d2984354d4f3d630b22232 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e48c0dbfc8bd883ce62f86e0f557d24e8571f332 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3d8a1d304bc0c0401bcd63db16a6aac193b10b028a7fc4c5151c1b8eddc2166 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6525c4b0fdab4cfe19558fb8afd73c9c45b70d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5932983aa595e42574405edba828301e5cc8fd3c96aa0c17786c7a4dbd6f6108 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..41400e39cf28dead5843a39e8974cdf6a4c0e297 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f7574130bf3fb596af5a125422ed1b239b5773172ad2b387ed7394d87cb58e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8dcc62dcb75bba1d9bee194c3574d109926fff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568ac1760e000d6040a357b9c2283acbe54ec1bffd31fe10773a7454b9ae4f28 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f72e4e45f0d5cb64d38b360120683d23d34d640 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76ca6e280147c5970731d61e1e4a84c2145ae428488a7ed07047aac137a11db +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..67133a128f3f853f43e317bf85f40a80b73bfd8e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb4a1c48c5f7c905fbdc56c4366e4098f3827fdc7e5ae7e14139ed4486c23157 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d04b062433c5abea242174ad76b429e7be645a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aee7c91b60f70269c5445d05fbdd78a574f73089beecd6553b8e1e9d1b8ea15 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ece882e81711971c6263c9787daafb2d2586708 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.16.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beeef765424806ae272d21f5d03405993b4f728baf9985ac8c34a39232b10faf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef6ef4fb326d60bcc8564d866b111e8fd1ce5d64 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43d90574c5c4a2482c350d2e4f636b8c86aecaae7cd2c8eadf5185c125b59538 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91e5506b025ed97df7a694ae4a73b6ccf8ac85fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2175e8aca7965a3a10c4355613c4192376c8a9697124b6c88337f1b0647ea8bd +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e305023f758a5af5ea3f8e3bb522686c823ca9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27edce21c65ffc59e79a05f9ef38c946861096f7e6c14b621f08c001347a7b27 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3f7337496f0990f80014336caa3ad55494a2125 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09ec71745ab6c14fda032341aabe06816d111eaed086c20c48eb327ce4cd8f6f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4591bda4ee41d58cc5ccfc797d5b139746a26d46 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4f72f2a0238de1d8a5cda65e6c23bcf277badf91187220a283d28ce1f6e16c7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..19f0556e779c32f113993a3b3952d151dccca9cd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47a186ef3c9536d5955694b2564b7a1fc2b481fc412d8a7778779922f8aa101a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..765639659b305eabf954dfe4883f1760a99eff36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aaa493150764734bf0ddbc280660dd63507b29a7df8a5130f236b175f8869af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ee35523904714c55d65df317553d00146b1ac3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c277d24f851e220ede9667539d11a1e1981eaa2deb99ac1b7855886cb70477d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d70c7f544eded0173fbb00a1a218ba92a27d175 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9987140c9bef48477f98e99c7727501ba26cc9a1a87dfcbafc1822521167aca7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6303cc2024262a29235dcf7b95a7a2f05272c881 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68fca06b88080ee3d95052e7e65782ab00114afcbcaf6eb857e4a5e9ee855ffc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c391241561a53f0503e64d897c70650cb1721c47 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bcbe944c903acab875765a8cadf2a6bfe2d79f48f05d77254c0ea29f6f4ceab +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c7154a6f41db28dbaa4628c48c67515c72f701f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.17.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23fbc8d5f2086ef5a60b5c387c30da3ded05d77cf25b37960b24193b2dd645b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db7db7a9c38e176625575db8fae6f1ebd98b20e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13524379dc291968a6df8a0cdd6cc6009c71db8278d555726207c55cc41b78fe +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dbbb760bf0601f54f561ec31a37545e63f6714e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7cd38834fd36a865f3d6d83ab93b75d78a8ea9e114eaa7cea219e49d90f8ee2 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc0357055454aa7637fdb1acdd1f0d3915d957dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e2685bbc9bc59095d3db76397b162c4cc061f55b17a03075cdf9ee080b172ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe7e107c8829a8115ef5ee1774feffc5a8e0892 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a771312c1555c9a50d4833daff2c2a437caacac99d66e941163b3a1f32754c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..933aa75e93b7a1cea0454edda03ab713c433a205 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a06e7088f6db38c6b90e9ceeb764ab921834cbb96784c295c1313f9aab107b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..770f59074a80e52e7bd8416eb44dc8658a068bd5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef74adb0acc343740cd8fb94a5b729a349936a6b38a1f7d360ff57926960599 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..edcd9c044bb83ce5a3bf6c734ac636ec2874afad --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0c4714196e38a8f72eebbc85c1c10c74e3328949f4a5e8e09dd3d6d214742b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6d9fcfcd62753293a21b65af7f4dcba5866603 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2989f3feb6af1d1bcfe35289cb6a41dd1a7c9126e60527216842b06ddc768b43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..02b23648db02c5d566a687084d33a9104ce7fa1b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad5830f4ee1922ecae0c2a87a4150d49142bfe2b65dee10943ceec422f625b9b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7181a07c1339fdb43e18fa3e9b69224f046a4e23 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b971adb01c169c32b875b25865bf358726fb988324f03936412c3d85fbc1245 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdd0ecdf0d6513c83501ce4bdbbc44370a18d971 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0f734215698a183498861012aee9f8cf85500e70b0b834ec9adcbded0cecf0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cb7aa2c5bc08fc45e43285628c35aae810d0c94 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.18.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7487d5519f901094871415925c736893e760569a67e9c8f7f0ebc2c73311830 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1084e4bfb559b0e090f10a7a733db8f16fcc602 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e60c3971e7e76cad3a9d211ecbaa0c8b2cf82d2ec21c6dd002a49bb59a6b6f1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9be1444fa4419f380ba7c7da517cf6afc3b01a10 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d7a6054c372a3c8ba6a288e6a5427e15797d060dc0c7fa752aef21560d05712 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..690276f3f019df2b6570166317ff718bc56d2320 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8917e531645799ec6bb7c805f40828e933fad08a25bbca39450bcd6e322e0aee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..76c18026b7adc7e22603a53942f3b720f045339b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8052d5e87ff31fdb69dd0334155c3b2f361f77cd2a11ae33084d937929047c3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c863ec69dbd77eed4cbbf9e62f0f74c65e4fa74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e222e7512f5d804fc3985277326bef61e6db8a1bc49ada1d0ec509c4778ed162 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ecddf4140e53b2c25172fd9ed35c8e7d58a480d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85f7032595d8de1bbcd2d7532cf61256069a18a115e9e3fc7d6af4610955a2e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bef5d2fb42ff4cae670a5d2412bed745f8ead82 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1175a7866bac710bef0f9b0b2c3237532b0a7bafc63b8a562700c367822e8fe1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f12f302d33b95145567a974e88d5477fcc4cece8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c02857dad2932f2563c8e51077bf6f82c6e65f7ebdd6f1e8c6c23fc097b40f92 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..38264b7d496bdd92ca1d8edf01691da7485f7fff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:776b454d3b006921fef9f367df1beee2e725666b77d3c361a0ef1eb19d92443f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..38a3efbde8ca79bc9cc1af0cc237e71feff331e9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d445af2ffff1d1766ee71eac3907e3fbb09857b7d92ae5282f5a0d276fa931ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e16b3f215c6e84cc6ede99f036ec2329398e352f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7240fdc023d40ccadcc32fbeeeb1094d0bc95aea8a9836cdf9ec7ab41b26bb8b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..46743466478de324cec5178059d8d5d776a0f4d8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.19.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b177c4c6695715ee3c413563bd95543f4def9d400a0f630ad73210e3d2f719 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8bcd498b1a657ea8a9bcf88f7648b8c67a8faaf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebfa63b86c82a4313a81634589440ca34dc66873d78b80a8bb7f13a41dad608d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e19c4e96c2fd926dd8188c9159ec158011e35afd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ad70e94f886732576735dd6679c2f6f51de5da3322ce4e5107414c8b4927f26 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..85421046013ec3416778b52ba9e87a73c70d36bc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f549733125d05b49c6af6fd7594d62f93f66639322f932ff55dce9cc9e9d84b9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd5f585dcf447f83bec9186325a2cdcf9e7b128b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24cc60c5a51d83871faaf76387da7509c866a4524f9f1f8a39b6a265363672ac +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5339ad6d0d4283659204fbb9a7c36fa6a5f36f7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515dcae77cd672d40f597df3046d32a0eb59220775445a6c6e8343c3e9ef1f8a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..74a2bcfbf4a2af36040acbbdbecd807a554781f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b891dd31404b5d49265677d7800c90568fdf759b78c2fbb88fe07c47322275 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c43a67e39d20c5734c0fbcbd7bfa70eed1d0084 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59b90184f5c7a3ee95b7be4043adc1711788fc37be3a56c4f6b5096621c43af1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad197ab01ebd35dcada3cd91768ec309f046ea8b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980c2c1f2cf3081ce96838f9a178eb76a3f4324bafc1dac11a97a7a2e46b8a79 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..879b42346ad94ed6ecb88003b03fc9837a2d2bce --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b9d81b5c98e230509cfcb2bf85c68490967ce1185f1fa8bae8f7f675e92f1d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cf50dadc7b72284b253996d194c6bc8ed7dd122 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd416f91ca60c600a625b716fc69dfed22a17d0f8a9df9d7f110f24e49fae91b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..575c91142f659cb54154acb99bea009b05071880 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ed6f7796a9cd1f98f6c35d78a390bc0ef14ebb93d6b9a4c01179e6fe8d64eb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e362ba56d058bb931a8edf0298e2d2c7694cc442 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.2.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773b4b855febb6e19214805227df3453698f1be90a416b03a041fdc32fb2556d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec2fc1163e3d6cfefcb92db77417b972d4249b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b97d0c5abb230e04018f37ba2449a9406f7a3e4e247ea500eae3d0b8326ac7b0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..06f297508fd7fddebf49b21d42303a844a463cbd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b58985c5b7c6cac47bc5725ac014c152db99ffa48b96cf20415511685155bcef +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..308cf6fd99e3912574183fbb579b33df2dd4091d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16eb43a283add10a8ed266f295fdc155f155c42d3848201bc2bf854ae320a737 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6bd9229f0768b0a32773fad4e9719e8659dc89 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fac417fada2536351fb222d45b24bb099a1a1b99c2988fc287cbafa57018e15 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4a00a9eb0c7e748b86f8bf6b5befebbcd6ad0af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142488c5038c6f2bc3a1ad84e165cd8f08ea6e4e747bc7f9e8709e2a78d4b820 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cd334ca4b0d7c356fafbc5fd425cdbf244f04fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800352e59d6b0ca2032e553ba6268f6d96e56061c144c5a325a23d131a80c2e0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3518b8fe75107b83aaa319aa84369e9cdaec09c2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1673249df6a364cbbd44a148d580315924a0d3ef0eb8bb11283af695e7da8a1f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf508f6f57058647059dbba37f4f48251ad9914a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a95e972858b1cd6a0826574ddd0ba68faff01b3846a787017dae0619fad18492 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55a155a1b83c796b498401aac67a3914d8a324d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a918d7fcc2473aa27d8a051b502e1df2ec514163e78f7f6b3e1abf094488e48 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f37d4f18917755a4cd98dfab5477fc326cb614c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d61a81d12ef305e2a505787a1b177c14bf4be0dcff20374526886d9bf3b6dce9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..49d228cff45a66b7a7f5c8f13e5d2e905dea377a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed7bdc32f2fe2176bf9b5c28f027812bfe2ab0eb7f6b9a4cd602d93a548a8808 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af3ccf0b1f6c4cfd5838884329dd39ee47675314 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.20.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3445df2d224a955d551ae22f07cd557e32e668f2fb17885c8a8d292256cbaf8b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..14cdf9d855d483fdb2d4d5eb0dc684b398a2064b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6ce8ace448ea851f4e795700399995f1bede135a99fff904fef4e086d9e1c6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed2b72aa9b3043ec8afa9c069f5b25d8084a6f69 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe7686a8af5a725bf37d63cb57f9dbf1ed96a90ff649f7f9c6a3ada79d9b9a57 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..55dcb3145153ea2b10a6e28b99c5ea0e4c299781 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ba4c8e44ac1e9ae4792a8b60f04f5ec0765b71733a73a0792fb4de0c8c525a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..68ebb801abd142a58b2a587d2b557e49226fe7e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9284b0bb4f1c39ac420084a02bdd26b4d8ec5aca00b03ef9279c98c162dba80d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b52c609cc01a7ccb6fa1df85256190c7b4c2b24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0fcb063aa990fef83c989d760322c51d6d2923301e60e7bb83b2a4fc99fb8ee +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..15ff33d13f8a0b4e51fe1596f10590fd49b5ceb3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7098c89a9214090f1e90b9eb380f9ec79758ddc68d0118421e89f55becfbdc42 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e561658f6fe5d38c1729e66a71832716667897a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1cac8d00fda9d10ec138ff39cc61f29c782582a6a5e205fadf010fde21fa322 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..266cf3513026fb9bee22899ac0b70420a248c2a3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85dbc829fe60e144f1c6586eb72f1addbc447aeabcc295a38422a668a842750 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab8dd61749efecb1e39878ca41baf3d52602e3be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6bea36f30877bea78226b04d13df1b7c76518257e32c8e566e9087f8c33167f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f415df5962edc65704d41965790a26a073f788a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fdf8d8ecc45a02d6c14bba5829bb30cdf05d36563dbde66d3ba3ee8bb6d06b7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..757fce31a777a062b542cbd7fa2753de7caf207b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4063efa31b7edbb3c4bf915ea272e6fd5c05c1be8643d1664698dfdb85d33544 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..03c55100f6925648bb15ce91bec595482695b0d1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.21.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c73c48a8e40688289874490522bc1561198325913971a7c00fab8fafaa8b149 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7b258c50b2a1d7d7c0b645d7b00adf0c911467 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386957daa3f195844189ac14b59ebda33ec2c402286517972710e6680359b017 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3366b5e553e1d356c32fc578be52ce035496a30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46a93ff1f9cc61b3ae6900d3dad37ffc99ec155306c9071755c23da9f062db92 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a52a6bcd2cfdabf102fbe11c74f22a29a467d0ae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5f36fdb16fc1db6f9b5a9db2713c47c29364074974043d8ca3f1c19d6baab8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa131bdc0eb5b0b8ec6a913f1d02e411863093a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327ae7323b710cb10f17e8218c8c25190bf02754e28e713452db6c4fd455a0fd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c441e41aec13612535370434fff99742ff414c6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf6cf7fb25d9589303378a2759045db084a685d706d9d081452d70d81ec649af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bbfb0f02c15214ce6f03f170b3ee03b45a0e8c1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36ba4d3a99571554a087ecfb061488c0d56bb0c41277e51b6a8998d65565226f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f84237e4639bbddf4897e63f1f3e43a8b6b4c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02d26b550047b546b667c03b55daad89b2eb3510a517cc5a926e39b4961bd52 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a7618cb1de074c29df1445a54a4b87c4e66fcb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f469f6661ff6dc347482cf0463716e570077cd20c297cf3fc6912424cc2db2b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..730cad8696d28b61ba64b2ca8bb52825989cd601 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c72ed86305c2c17e7f04175128d82df01ec9e01f8f5fb3c273ba2fcee7d88a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..42b6d55b4cdec748cc97008a338076f70e0ab8b6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:195e12be71568c3b44443b7e856984af7d13c3fb166e8082dac5f6ca722cbb63 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5771b17f2ff932ec06462e829ef3d7a2d50ccf7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70fd8970db0ac84adde2f76d9892e224e934fc83a6dc45fa5478e5d3cf86b0ae +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aae94ac8eb6ca5201ce96efa571cb8a91e535a6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.22.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c72b8f5d9de438ebff2f004ddfad92a7e639753f9943155d0b16ebbcc18783a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..316ebc2b17afdcf8a146e742601840b7f6e565a5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9439f6e94d03e96329e53e2a2f56979689eefe99b6cd4c94173c88a2de57d70 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb9bf5990ea61929b2ade7718a9d644581b2edca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:527922a7b47c60802d262b6b93b4adfddc895c7f7860f54b9c39d4961380dd68 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff71c7838e90bf9e7649cfad580e921127c8991b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0c7dbb0abdb75298865943e4c1cd778b50302bab1852725ce264d22b0b511c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ebb37ee64353a2eb62cfde16b4c6417ffd7cae1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ae214eb3250dfc4159cb487ffc5e7f145c6be488ddad59f3614b5ce6beddf1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ddec764c58cb4b4507e22c4ce4f9d01388503e2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9206857d7258efab2ea3b013f981264755fd4f31fe22ebf67aac4b83244d733f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fd9a33f5669b712168063dc6cf55bd33a80a842 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d47d46b2dabb8371c91677dcd81c24dce0fa235cc4a770834fad986fab3cb205 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cfcdfb6072d675fae4a0e76cc5df1c53f66875e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7780af696d3250e000c0df7f068c944b39a68b9adab8384a5fcd670240e8b596 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..37bd5e7c84e7d03d3f88fbe5f4d92a88f9b25786 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9712857f1cf976986d55e99d5d4bcfa6e47623642015613d71c099168f01be74 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb8ac127e5aa65fcb5f5a6dadbd0b9c1c6320c41 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1693431e496e2054468cdbbba47ccf08576e075888f3f7158697a2489e7b3b5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce2c9261175c7eb454dfc96a2444f910aac05036 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98601fdfd8640ce8af5a8aad18b9e89de5877143709fc99c48278fe24e7aab7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb609f43b702b83341b5f09b3b8f37bdc70ed889 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701daef73e560b7b8f67e53a907d886c00132a39ac13d69fc73c4a477c9cc207 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e605b86bc6df68899c84aada3cc89b40705bbddd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.23.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc42a6bd0dec3f0b599585afe86338968966b2874d1a791ea90ab2d9b53a4af7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9b9254a18d298d7301cffe068dfddff42446e56 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49b1f7e4d50677b2f4a917be756608cd331b5f112caaa0f28d15e378e5a03d19 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..669e45ded44ab054756beb5a31e9993c21889d26 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:294756fb24beb343e8be178079ed2e5e45f1cfcb844e2fec0d205b3dce3b0531 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7f2942ff0b4defc021cd93f5f5a7d5eded85d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8538808c9601856d30b7d15dd029c837bf2cf83aba65f698bcacf0f1d5c432d1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..809b4608dd05b544d7d7caa47b44fa92b52dc983 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a371b492828c1cd368ceca8f47a458a39f9e9ceb257b7f277d4afc82c377a231 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfb90417cc173a301c4810cb07c33b55eca795d7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4632b17ece1a3781618c508223898ffb3388a554c53e33e4cdb8d9cf387efdce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa65f673bedd89ffa0810c7791a795fb5e85939b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4428a9e3f291f444d8e436409d4a2e510b8617c2550da48ac41dd4942238d275 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..05301d68fa524b6621f7649f528b2e9d53c1daae --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06f6402b788344d0b7cb3fcbd789fbd55c233c79d96a5d91a2bb376953ec8523 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef65c87c1d98278e470580e2dac547d75cc87bbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a63cdb1f65ea5a9978178a3c431c7bd093cd3e13859e7537b928bb581c91d880 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..abf47e29a31653d42f666b7a5da4ece341908295 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b66785bda7074f9f60f4b38e9fd3944118b95bcfbbd80fbe45bc71141ffe9f65 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..64864649afeda02e2c5219edcccdee27b245e6af --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9fa0d7d2d721f8683aff0afbe969ad351e2e30cb89da48d279e4fca617631d7 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..446ee448e0c254d90cd9311e0caab492eceec2b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a098717b1f78f89092d9644c233f426a7cfa906a08c8b7dbc59ecca6dc6de4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0e559232dfebd04c8bc96899a53fca32e8ff4e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.24.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd689f3fc581e8025108c076d870b431a63eee54809c258bd2df5c9fc498dfb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c09d09ecab805edc524370fdb2d8c6422a5d5ce9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d929c81cbfee8bb12415dc2df33b74a86500b56af16cc2fc130ac18c5601a715 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aa7aa122fc0fda25f419aa4ba409865747c4fd9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36fb81fab84cfbc8218d11a6402a7c87c0cfb71428b9fd4b32d4e2897854a520 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..76d7461f61652772930c7c9f753f7285e6aa476a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c9daaa0a2e7bbdb06bdbb473beee6726c4a7db52007832bdcfd322be012c01 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf5491841bf0bc44ff0f005752b97bdaed49d12 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667f4ce1b16628e4f93945a6d0a2c9a16741b79cb5ea92fcfd6f5983b54ed9a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cd1ebce71dfe93c7a4167490a86fa22627bee1a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f619c04f1894e8fe74e9a8482737751aa6ad4d279b23538d9ebe03f7d0bd62df +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf868772983ec1d61e0842fe2e4f69724eb80d4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd13b38b893f6825217a48d8152883dc3c4f355dfc171b6b95b441c92585538 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..32f9c17f65702588fa8fda1aa0d67db9f6cd7980 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3334b711ba1b1c821e88a079f82d8b480793b00ca89e2c1174f9c935e652c4f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f69d26d3befbf34b639ea733c9cde2b0248812f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9ef0d993f5041c7783e1d8556082fce36df58541352a1dd1e14193c8053617 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5aa77e1306a98ead091d7c5e95e03c3de04e1cb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0495dc24e0de9cf866e738bab5016643d2d3e3505e7ab298c593a74584c87be9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..510da2c7f20bd8cace7866338ab763cea22e36be --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:761600daf0dfaa240985f81aa383f47a14df3a544d44c60296fed38b77296cff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d127ff90b30410322327228d8c01d65bda485ff0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7138d61c002ae0351b4582270b2dc29395b65927f01e1cbdf2c9c9c5150679c9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3267c5205303f73cf3aeccbd30c50c4f14e0e9c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.25.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e6203bcde6b92110ed25879dc90b65c8be553c0ffa3b9041030006967da2c70 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cde90e9fb4b0834d36db0bacbf905fad184cd2f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0ad379f768128ab7f428764d9890dabe6b9359229c3eca836fe8ff244fcb577 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..343f25a7408fffcde5e46069043e2371860943ac --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87f556156348229234f609941e411406b6dc23c1e6fa2a7b73013c000080e1b8 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f7db0be82d6f3656b9251abd795d5740ee2fa60 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26a6d71981089f4f8b2fb890abf4da67806dec57afde364a09088b27df9c2bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..92ae41b09c56c32687daf8981be997f0c45f40f1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71783dcaf7e30bd3413894e6f16f3e6d49e74cef0d2abcd10bece474eddd3555 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8688435d67fab8441f0810c996b198abf2190fe1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a333737b8afb3e6858680eba81d36a9aba2859c75593cff561bcf24efb1cb36 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..389ca01d28519ac9d09f82d50a4bc59cfa2a7171 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e5a56f1f18912690f9c5cd907e911f1f21616397ffab3ad87728052464818f3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..da1468adc609005a29fa5f0ad3167d6464d9cc9a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:279bcd3a06670030336079b256a99062fe19a07a68ee40c76cc23a3a83412e4c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..75a67b56e01e8cbed53d52cc6ee76d7b497a4e14 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5ec816d4791708d59e351e0026e99d2589a545ab9ec3618630fc0229f375f6e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc614e9c8afa52f8a61ff9c4298abbe422d0debb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ce1a36ef7ee0e216d20c592df0a0ca9a4751ead65ea84cecd3589e2045a56e0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7918d11b48734baf336dae88085f67040ea1f53b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329d4e2fd8639d386903041d20dbca228ec4d51865feb11fb3beaec7f1d3ca7b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab81cda04f9015c5c8e3bafe9905d7f6842586a1 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069fa91bcd2136b06c47669aacbb2309a8ba0a497d5e3c2cce1b723c834b25c8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..79d5f957c6b6b7658ce8daab941e4790fcf73b57 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.26.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50a97a8a392df33d1b427e3af970ba9f4fc1690b5c4a361ee0e48432321f3540 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5611d8c2d58fbc823a24f8de6daf01154c431c36 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c435147a18d73df88f763e3fe6da96f73d87a8261eb0f242cf09127880d27c +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..a578d765c90e4eb88241dce3b9c47a7ea903516c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c3b61171a2e30349c46bee52941c33adf991af35db997765eec2fb28855a897 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..986de11595467d9e5bb0e2cdb6edb2b873bddd45 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6d6a29e3742852f8062e6232b35b259d42a1182f487f71ef2a132db7b3ac34 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba1a327fce0db7d42e9e37693b149115000dac8d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de42fd3aa4edeafb28f24623ded450b037fbdd759dbb4336813e32dd71be4f5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f180ae1f38809716df02a86349c1748daec889fb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6357a0ae5ed5d880ad9cdb31582cdfdc83ddb5cda8ae8c2107cf41cd3f2cb4b2 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0b3ea8e1218d24cac0856696869422113cbcf30 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:719b82bc99fab9068e623beb1994377419b0b76d2fcb27e959c05c45fa7b2a3e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f62a8d6fd572abf98079c34cded7cf5caf39fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4925d13afc181f8caca541b52b2576d5e0f1f56a733ceb3510ee9a431a41b1c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9c7dbee2f8800ef391520965ecbe91833f2e7c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31faeba3067902a5b27e37e3adcddcd3aeda8a9c086a04c16879831aacd85ca5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a19b72fd1b685324d4aa9d50e39c1346a89f512 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322cde19a98de54fb1cdba944f7516f5834b7859093b2c9159b46a2150b33950 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5d007e59176a940c7158f1525336a2282e7b24 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6412ed51411560ef10ed821e001a6e1668301aad1b5005c50b1c7ed9f8ad85d5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..12250ab29d0a6afe6f4a85d008f3faa6e00fe2a7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:769b911f175c586a521e2e18eff393320d40fdbb75f5eef36005531fb3c54c04 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f08d73504f7575777fcb5e18c9ba3cf27d794197 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.27.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ae082f35acf86a480f23c544025a4ff75d11c1b1ccd02c97e477f7a5525122 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b643678b69acca5b08a7334e40f430d57d7186ec --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62bfd29bff795ab9c7b8026f66754fe2974a0fe05ba4d20e5a86f556c040b3e4 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7418beb21074bf19003ed43dff3c7d92030e9aee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d173a337667955ad6eb1c17ee80d7b59e66105b7fbe4b1dc93d489cc13a6af6 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..86ac8acbd9ae581d7cf921311e982250d80b896d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30bde8c8e782ad54de6940a3724bab9f9f8f97caea42f95c06e4b70b85f6abd +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..63147274345b50bfdf73db80be5c975736e92992 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1653d8d7f5cbda8f01ea53184afb7672584d94e63760afa8ce24687f593b978 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1a5f90b6ea560d0416ef30f52a5deaf2b9faccd --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9510f115517576fa0a4c72844caff0ef9a59e6d6a783c3a531d088d84fb42b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a55762a60816fffb4be7109cf0ae265de97f948 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72abc7af823f4df1a759d4317712da36729b53f434236419bfa394ca25720719 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8b956c8b6cf27d686735c15b90d0f67f0c6a4e5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0acb37f32ac3754f88c1b297df472dfc1fd1aac1b058bdaccb2aab4010b32d8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0b4f27e394e2ac8e2bad7664a4b94da9698c1ff --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3d2e16fb23446fcae576c5da55ee09c4c4022302091038a1cf5de6608127a6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed424e36036b610825a72e1e368fc4539d8db463 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bdf2cedc60e99d64f10c8273ab0ab9b5fa0a5d3bd4b3d1e30dcaf72476d402a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..074a001c93e3a6f50639162c9d297eb25d3a4d86 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853119336d29cbc0f76713ee86af134ece9dac8a2fe608d645fc5c0e8e8d1f7f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1117fe2295968f6e86d62c8302eac82b58d70f88 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b33b4744eea3a844f1e9c5bf9f8bd66fb1a4267fa1f7fb1978440170af4f3f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..df8298277e2dfabb391207eceac9b20a5ef6d799 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.28.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651a6d0dbf3bcbd2bee7aa7fe6793fcf7b06c7f0b624c48b54ceeda11978b43a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8f64d29d9f2f403477c99c3bc0b2218df78285a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7cb7bbff5301aaa2398bbf0fc08b733984ede5a6fa641af29b02bd643e49ce +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..10969481262958dfdb929bb52b33106ee8cc0a04 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b563ebcb4afaf0427dba521479788095eb6fdc8804cc667a004057d504ae3b83 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..826048fa07ae790d05d7526cfbe767939e142f16 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c4e391f3019ff01f9e71baf615804444805aa56ab7efa75cfc6ee36b31ef4d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4b13baa6e94bca866ec109e45172e82219cfbbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3bef694c10b9f285424b72e62449ec315fc95d6243763543eb76cf14248b605 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..691c0abd0d3e7fbcb4a517d20b6f2cde29a31892 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949c249c4eb79088c3d57c723f8a57823835c4ce77aec4c4f35b65855df2b942 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..017cd4c12de4c0111c2498047901fe9a56f2ea65 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c585e28c1136032f1d5885d8c020888b765d1fa3860ff422ec10f061601ab0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..35c0561519ceafa1ed3809c651b519e9af38d0a8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e80ac1260e588b5374d594b2c89267cf65357ef307c62f84764c0c804202c773 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..674353bf21f4fda16e5db4f5ca3f0d94cea21c99 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7a177473670d513cc97e86a6d58e5a3587cd87b46b76858a6f89551a4aef93 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b475b857362bc202a99b795868f2f5bf663f08e8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46b64a10466cf79e0e201bdd304f471e06bbaeb6aa73d47aea554fb04dd0a013 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a11442dc279bfe65f3d4e819533b69cc3b8866b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b4c1b40e6ad1724ad8163eb1c699e6596ce0bb99f88fc56549469496b150653 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f34680cbfe0b4ba293c4cb5164f7fefc810db67 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad82bbd913c96bd4d39d52eafdaf9fb92fa5db9dd7a11eb965ed15ebbc049c1c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..be316b8a1ec03ea71fa826bbdf2656198140ac39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.29.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7174ed26a6a19b5c3881923639fd48f374dbb3e5911bf84f740a44086b82adf9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ba3451cc965c4e2bbd4308ae8618d4816278d49 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2555f759c3ac8b07ec8e966001b6c6043ab1ec9ccddd9c01e5c93848fa9e86b +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..39e9be816737ef39ea7a3cc7f5b13794a6a1a7dc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcce76c02e913d4479a1df85a6c071a078d88da14268ba02d5fced3adbc89913 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a85522180829167ce19d11652c59ed2b438e7e85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94159cb2308b79dcb7734203dd0fc6773b475b57903951294a5e591b8b67b836 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..855b3113f44cf38c9b379b2525f83465e4147985 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c159b36167a4a7afb19e420caff6e08a7d7143f5f34a4fe8a5e2102159cd1c43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2ddee3b380c90cfcaa3701c813b526a889ee174 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc39a911009393039bbf207f7768987e394765f5d5dc042e1e6d49b907465acb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f11b61781e6fc2f3aa072de34fadd068009c04c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8471f23d4c17b3bbc89cf4bcc8318f9040d2f87f6e9306d70413ebb454fbb13 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ab05f354a2fe9a13c3e1efd5dab49bc592eddd2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:624e741f40347a3405e3064ac52843f20b50fa95fdffafd1392bbfb49a6322be +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c5fffcf6ee2db11ae80d682c89f158916c28d2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d02c7a4c4218c3f3e0143e041b7567a6f16706a8d97bcc0123f4dda414f5a8e5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e7221b70fc3b3c3483370d5c9c75d332b9762cf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ffca6026fff0b66545e786a238b5a0d3eea257c4af2e9dbebdd5a638bbe21e1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b9e9c0c86483c293c7f6066bc5c06b5ec8e741 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a5b2f4bd197a064782aa5ce83460f2dd15352d96ed26318760404e903cad414 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..abb361c11405f306e5520d77c10a8f9ee82f36eb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52bb43565d78179b6d74c6bdd3126ecf1b86f83ac059ce95bd0962bfca26e777 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..56669f847e6be20f8dadfc8415018857de37a1b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.3.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d5e3ea2447699fc24a560076b576b2213d0dd5bec547bbc7acb4d1a1a491bc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbc13c548e0fc8d8065bf115d47b9d20271afc0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f01fae1ad3acee8a8fb42da7d6f673b0eee9525fbd523bb86c85025bbf7d5464 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..afc54436f6d4c8f6fc357a706524ec32349a0ab7 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41de393d1b1bb38c536891f5e421c8698d61cd468ca22f1dddd4a075665c2f45 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6876706e7a05c764061e8d7fde8f07a255a1c0c8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a765b1bded581654a4ddf06679844e1d3a75bfcf7a2cdc98c480a237f05392e4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4696b7ead490da4f6a2d11d84ff1bd1641b0ce9b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:661ff3b7c44a130b4ed69d206f349c3ce68780c8c56dc654011fdb7b10b89f43 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..368aae3e6550fc14c9544f96d0d2a9b3091ed6b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfad2bfb88b65c5f8acde22d74d71067afc8de6a0010080989c7e2b3206df0db +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..de57dc25b27c22650ab1a1f2ef13b66df41c24cb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae8bff97f2bfbe34b8582126eeb37f88f73c28d8ece316094e3956c6171a808 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f4f5d970ae8aabc08e282b79b9451fa0aa4c25 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf54e186b6432cca46be93ebd91f3d245f963da1c4317af1dfc730203b4a7b1 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..86433679eb8115e01ef15822f009284838b6c771 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e7538b359f167038b5f46c277922e5a5a63df40f831be9ab374b669537634ff +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..36325e2e3ae89abffe282487b332753c9503909e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95c7672ac8e122095681a6460e51aa66d8e37f04bf374287afe74abd0f9e1ce3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..23027aa5d64a0512ddde4c545f6adc5ded32a798 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb4483b790735f7a761585206f2c04e6fbebc8ae5d5814895f8efe8afe68bb8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4914abe6f08791fd18f7383c6d29105ad63f477 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d74e8f5c366e135d21d13c504814218fb7baf3076805e1c35150cdffd9369fe9 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..214867b52c9deaa3ca6c178293a2501e10b83a79 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.30.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a82b2a2c32a8895770def8973a3e167e380b978a36455d773ca5b62ed528f272 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..744561ececeba8e2010298eae773894fd124bad3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9189fd59d7de18d0974a470ea0963d94f0ec338a78b8840dffc8017ff91d449 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..27ca0e97eaca56e5e99c0d3b10c19db39f0c41ba --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ece18640bab21a6e9f4f73b960ca80094e2af463cb074b004f7032779be0dd +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c232e0e10d392ce8c190f0fbe6b192f95264de2a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b13baefc56afa96d14062f25c006a3c4d9241d686001fb70e4dade868c120b32 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e450c5ad001cd7c038a7bcc118243d9efcd0c4b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:825f676deaa815d09f328259aec6bbf631a2b5618129b050a1b687c223e1ddca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fe1184984e0f688cca28bdd4165a1794d10b8f6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4017a182327e5cc96361279deacb48c6202a45fd4586b4aef91b7582d60802c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a01ec23730f7d43082f56520a55fe65e2a2002e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66b4a4b8660f174453f180f986c3aea601514a5723d4a84d451c79a18a01397e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..461cb14d4eb7fa9e5f39a3ca17fc324ee22bd6c4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:107eb8ac4b2be76974fd196ee022e23c15e822a68bcecc22e31a671e5535b720 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b32e949b119bbe21b6e17f175a2e0e2d1613543 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8f818895589e8c3742320fbae7ee9c6ce57b8f579bb903701a913cdf14f9a8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d30ec93a4b423df5ac27658a26c446e41110eeb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:290f7af0b6b7bb09bcea3d73d46dd05d4cc5f201c4bf9dd2de6d6f628642eadc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ce23f66ab1458494560c174aa67b7bfc3ec265 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e7bfab3a9e31b97d89d5a53a209258b5c1a85b60511ebd11310834893a3ef8c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d39e70d5ece6f5bdbab3162f8b2def2065c97282 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66963ce22d873ad068b4784a322cd79c0ad39b002bb0a84569e4d67108078d9c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c678224fc4c14240783362b491668ddd1cef08fa --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.31.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f82adf2e1c35b40155ceb629532192c46115e5efda6c069bb1981e96f325d97 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cd543d3157771e25fc65541a8e3cd9f2bbdd179 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40dcbe07e5557050411759b0561a32db73f0507b045608e152a14eb74bdfb97 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b3ab276c46ca90b3ed577a002b1d191a5b17cb0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80135bf0900116c60ca379d87ad8ece424c52b09f788cc764c1bfd05c58ee93e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7072a7c6d29573f439a46bb4ec7ba25a3b1e196 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:384e69eaefabfec5de3beb2dfcb6e95fa939bf4bb7d37398056eba0baaa792aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f554c77af5fbebbd64881fe617d0c8ba05de391f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:089e592b311d571c008311375397cb284e11dd7e3297c8ad50659726aac67fd5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..be728f93c170c886b82f085f1b9965906c1b63b3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8114c65db1ee00685e9a91c07583266dfef7e041c10aa8551a4c2858dc7ac542 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3c02f70acbb1f9a47515a379b06d9309432ac18 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d13750853db16225352801dd25a93d6a069f79fad613e6ab3d6bc960d64395e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4e750e320ed9d37341bbb6cd12f5ce0155c258 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a90d61cf296e4418ed192453d0bf41b3bd93f19ec9adbbfed99348ba0ea754b3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..af1fd90a73ff335180cffda2c5e9776c7f8e5459 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04351f071a8d8c6f1ae6fd4ef412362da62f591d74793e093b513c4aedc0f5e3 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..b376a459c652b1ea7f655ab02974dba7ceff2667 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ed7fc329b4c2f33521226feddc5a99b469d234028d830d35b0620a72d70188 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b401bf63d00edaa7e2489984f6cf1804f4360432 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18616bedfee9a84eb078673e37652623329a239cc7fcf3c10fffb266ad7e9b0c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e30edcbb5c94121840e839f6fadeb0babc0c64f3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3d7ac02122d4186918a45aa4216ad9d5916694ca71c265bf1d2d1723a5bed4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..00888c4654cd62b3d813fc57a59ecdff56e0bcaf --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.4.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d28119677316d935840fd369b4957499bf57105fc81baa09bdcbe77a664ed12a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3883e4acb92dabb1a5e5c0be381778d195b92f4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e4466725efe6df7f3b8abfcefd7ebed6c91704aa95ac50f35291d552987c4f9 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..45139c7fb4b0256a3f694ba3228e6272e06cd1de --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e804619c707f31ad599e3e17815924986e3c6fd39af68e96c97def0a87c2e66 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c331e5b93d9b82d117b225a6b6b61bb2e2a93cbe --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60cdeff15075a3e871ff320d67b3fe0266b96c9648f2e75606fd885b36e6156d +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e50e2fddadc8d9f1ebab15f1027e7e1987dfa8b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e50e98eb578ffa081cd1c1fdfcd399e2984ae5b2bc33fb02490f80040dc734e +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b8ee03e6ab1bdd542a2ef67987c106a9f0dd3db --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e57c0633ac379e68036a7f67561ef54a07f0a8709d9ed0604a10721cdd317c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f84640987694878898b466d4e34d20199f73cd3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f916fa3dbf2f91a0a8d8cbb94964530a32c2ab3455bcb368add51393e45095b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..51987a0ccb55620e304db600effb9a538ca14b74 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087d499030bacf6506727e3e7db5be45cf83f3c47c2741536f5cf140a93c0ef6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1fe8140845880b109254cd7dfa2c15a506058a4 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfaa6b8d1bf76ecb9a3e995f3bb29d0c4cd6dadfd9995531ce654b376c6ba0d0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e48f9c0e5e4f48de46c7e19bee6a702bed8298e3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b60eac183614d65a12f3a2069feec51fea1eb42be2b8a5c5a4d857d81edd6a2b +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c91fe37a0dab522b3ff369ee19ff78ac534aa0d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc843d1ca94269111c66619b80227d7601ca45241ce405c61910e374622f7e0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8e3e3187da7249cbd038ca58a17c553f64f4570 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08e504b07ec55d5964bdc77832cf5513f1f8c4dd37e58751e14089a1817c5d56 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e481475a2d739c5671f41e6d39feae6a0d0fac39 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.5.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e329763b2b0187122528c6af173485445442d05bf7a7ef9e420333a41134c653 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..740049d5c79134a51ae77de9415105d94c22d0bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dbb2aa973c8c26cda612bed9b626eb40a5334acdb34c63f7db2be56578ef135 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..82f5fff58b95cee485c7a2a1089c3bb8cec67d1c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc25735f707fe65af04f441bd4b16aff33c6e039f3f2900b0a5d5b3b08e125c3 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fb3e8bd9fa2cba11e424b704782480cee1b2108 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4698c88365b5a40e1e7c2f740b14e74ec2794d9ee048fb7850bf47bc6d7cdf5 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fce2acb79b831ce4d14c03ecb3ee444167c4e9b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2984c42637cc5f54aad4ad3221f87d781574f032d6c6983af227dbadfac3f9dc +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..c84d56599ea463f0562af2b14e80113003f78d73 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b906f9bc10874b855144ddd8bb51c2797caec404cbc80ecea49c68f640bdbf +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..371da23f030d60e347176b92e1b8f61945620ed8 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f374cbf849dc23a4a9ab3a0eace05ffb1c3c372e5ef3492d7909315ce4701000 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..78d26e4c70cbd29b870d315b9838d536ba475ee0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b73a42da7e567968ee21a45f8516c57b8b540307e3e43c34bf643c23a228f0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cc6a3808cf15333ed21d47f48ac9cddadd742b2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e057438413a42a9f69a37663adc3bcb608ef4e7dab79ef23f48e6ab91aa3fcb4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f61456bb808596be2d54d1d9ed126c245603a34f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1231d3727f39603703e7f82fc790c5fb2a6f57ca0b96d56bc7d443de2f0281b6 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09a0fcff10092715510c7ad211ed02f085815c2e --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcfd571c2b802baad381c0c2aefbc30bc71ff17060793b30b7fdb748fc20a8b8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bd36c926355f5c6130c1db4ae63e0e775ecc015 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f3c31f072a14f31cb57d859a11d58226bb4320b62317c851db79dba4c1a855 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d4942b81d812f2c984a74f18bf2246f68540c3 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.6.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eab07cdb538678f58672ae3385d91259df799a881e69c8cae73bb3d3b42f3bb +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d64fcc86bedc57a78ccd706c1f2b0631be452ed --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16cad8098576ee287ffaa9ff55d169d4f48afcb8cff67e3803a011b53266584e +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..09c920573622eb08a976d753813ce2f7a968a412 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257205230637a4ba7856a228591e9b3a02055743f4cb6eae2d7494718d8d7b2d +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7135a08d7a6d383540c6f1f6aadbc26978ba789d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c59b2dcb19b948c4f60105ed2aca3c08963618d4fdf15d65af9d947a39a82b88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ec967f60a17077b8e8b4c2dd504e6994d7c18f --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9846ee644c13271ebd94efdd06dc9cbcaa16ac3e0950b57b2521037ac2d4cc75 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..95489184adfc6b6345dac0631294cba7764faf85 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfffde0b32f7199eef6390682f6f3d2808865f946579bd5d075feb4dc33de8a4 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f359e13c4d815e135c37f5b573deb37e9e8f43a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98567da0a641d924dc23d01fabd49223cdee117a34839e6bbc5480a081d0f1aa +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec4be9aa2eb82a1f08f9b2d97ade123954e838a --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48382c0b5e454e43808846f4dffc41ea4c72e9a2097a407e68a1536d3c5b6f55 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51e1d99e0dee3420a9064c930551e09726f4728 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f2f10a6cd6faccd43ecbc383a7ee394d12ed1bf3e0d30271d376fb86870884 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2bbe4ecaa7ae800db85377d86b131bec6766911 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcc2c1432be6d27d223211afcb4bc9d85a632385ad668bf7947a13a8d76f23a0 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bf0e3fc90bc0d9397be7decec1f6fe70a646ff2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6fa3c4699f36bc19d5703b508713d99fa8609d19688ae634bb7d2704567e2ca +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e98f5d7f72c928368060db0d3168f18a2b608d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d27b5779c99cc48436510751e698e8495382e45ccc190912f34c8a17d06aabce +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8fd78c5ff3a0b101a68cc7923aedaca1ae33995 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.7.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75dc947374273a57f440a39809c138c4c9f3fc1ef10a58cbecfb3c065aabc35c +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..06bc43be3236242610174c5263993a6cfc0fd2b9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:959b05c55686ee1d1ad615303ecaed1b8bad0f2236007df9701bf0ec297e1869 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..6649208eab0ee8eca4a48278e16c8e00c356aeca --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556c08cb9ebded04e408ba0e4d3ff080d1e4e02a2c07d93bc7aaa35bbdfd9e18 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d9e83751bad3e97eb1723815d3a552405cf8290 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f19bbc3443c7d1770163ef9ef73753e4db59b6a3bb1e99b0e0c807a1faf9a31 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..f063c9be4561b7fc2e0048999c9aec3cac2e4590 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3963809d0ce3ecbd27b4b87c9a8c61e259f4c82386048e84d3a01ae6692e43ef +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..f758294b97d5b519c37c9feab04ee6bac3be1d20 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659eb11c2426ddf2fea7934fd37276c20379807153e68d58c3f21fb597fbd37f +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be0fe19c752281614231dbaadc4da405ef2c337 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3bb6a5feef81be632bc98824403012be7f85b21c3b116b500410b8c1ac8cc25 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fe12dfe05b49b6c6da14b51fbc953ca285746b0 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4ef7fd423e8f2b95977604cf5fee41230206f4943fa309dc6efc5d8b9e47da +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15dfa094406da46bc4f91d15bf311e0da13b6bb --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d076d19c434c3976d5cade6c4891a4231abe1c158e26b497038357bd9d11542 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..a364c843e9e3148b82fcd4734cfaf3ab7ca57515 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1953e565002e9e3046f52e267b2cffe351da9f64f89dad4beb17d44d2b119c88 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1cac9ca0f5a969da9dc7805cc57d171a4be849 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f04411f98ab6ce490c5db39762714f6b53d663a0fe0398bc3deb9dc9eb7a3171 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a454a4d0cc6f38f9aabd0e875d8300bb7e216b --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b11c402612ec08079af1a9cbe2ba3e54e13c91efd0310beb7e5a363a6f90c9a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e16b7d57d78dafbd45533fc4d67ef9a53a29a31 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.8.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c40bf9abdb95c4de7d1eb4cc01e4d995ba229fbd129af4f33ba0f49a0d440e67 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18b326933cba0e68765d1a9cf9582faba3c0643 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d98d55be428d3478f8c38188af38636739bd5b64e2ea8d1a87654e4459990e1 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..91003583418f59ef483c60196d227505cc9ce58d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc1/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:209113d65100b1e66af9625c48706099fb189362ad180ce1571017afb58612f0 +size 42115 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..e167c85878cea821038f0a91082ececc024212a9 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c1b2dfc905e50c48f724d1cd5cf420aa3f2ec746b5371833b61417c6618e3a +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc9e3bceb414758995b4539de052984cc46b0109 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.mlp.fc2/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe37987bcf191f187f698335386002576b90cf1fc2b6ac4e1aca37fd6d5fed76 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df800643b0c3a88dc0f029b346ec6ceaf09f274 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f30ee3323a6b90e456a56c9f5f8feee95d80f0cb53e9dbbe9170b1858aeaa8 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..21361c77872c595c74d4bc787d65d66a082334fc --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.dense/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:693bbf43a1fdea8a3fba52d4e70af444c02dc17ce5b76fbcf8dde3b43be11e50 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ce193e4427f3a5d0b9e00e60f1b49c5a99adaa6 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b16734aff6e995cdf93e663c2b76251bf6ee8ae243bae70098fd4cbd96fd235 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..137ea93fcbf5d9873ddbce6fb91463b1e64e88b5 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.k_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbc0bcacf3989e665f28436f99b04ce64b66ab986d1dfbb9e3c1908e976ab27 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..960512c7f6dfcbdbc0a4aeff3228251265f03cee --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423048fb7005ca1191b44d361b710b1853633b7bd31b3e0dc7aac18f12e36979 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..c97ad12739e54f7899e24a11f9160bc67b6b2cb2 --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.q_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e007714163ff997d2353de0c1ca738a4ff189b7d1a4c72d434e1964fa5bf32af +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt new file mode 100644 index 0000000000000000000000000000000000000000..141e571f1f54db7ba816afd5360e66ec0dc7d10d --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_0.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72122ac65f0ef9079f7f24b32e1711c6392ac704011fabfc2251b32baa636438 +size 11395 diff --git a/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt new file mode 100644 index 0000000000000000000000000000000000000000..b196697ea614754c6e451ea8a104c0379cfac26c --- /dev/null +++ b/params/phi/6/rnd_search_t_no_sched/comb_12/trained/model.layers.9.self_attn.v_proj/_s.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3041f6545054674113618cc9b61da66f2096f933b3d15e3518882dea4d00748f +size 11395